]> git.proxmox.com Git - pve-container.git/blame - src/PVE/LXC.pm
Don't apply snapshot config in snapshot_commit
[pve-container.git] / src / PVE / LXC.pm
CommitLineData
f76a2828
DM
1package PVE::LXC;
2
3use strict;
4use warnings;
d14a9a1b 5use POSIX qw(EINTR);
f76a2828 6
34fdb3d7
WB
7use Socket;
8
f76a2828 9use File::Path;
2cfae16e
WB
10use File::Spec;
11use Cwd qw();
3cc56749 12use Fcntl qw(O_RDONLY);
f76a2828
DM
13
14use PVE::Cluster qw(cfs_register_file cfs_read_file);
f1ba1a4b 15use PVE::Exception qw(raise_perm_exc);
c65e0a6d 16use PVE::Storage;
f76a2828
DM
17use PVE::SafeSyslog;
18use PVE::INotify;
a3249355 19use PVE::JSONSchema qw(get_standard_option);
1bfe8728 20use PVE::Tools qw($IPV6RE $IPV4RE dir_glob_foreach lock_file lock_file_full);
68fba17b 21use PVE::Network;
52389a07 22use PVE::AccessControl;
228a5a1d 23use PVE::ProcFSTools;
688afc63 24use Time::HiRes qw (gettimeofday);
f76a2828
DM
25
26use Data::Dumper;
27
27916659
DM
28my $nodename = PVE::INotify::nodename();
29
688afc63
WL
30my $cpuinfo= PVE::ProcFSTools::read_cpuinfo();
31
f9897acd 32our $COMMON_TAR_FLAGS = [ '--sparse', '--numeric-owner', '--acls',
fc4e132e
WB
33 '--xattrs',
34 '--xattrs-include=user.*',
4132377b
WB
35 '--xattrs-include=security.capability',
36 '--warning=no-xattr-write' ];
fc4e132e 37
27916659 38cfs_register_file('/lxc/', \&parse_pct_config, \&write_pct_config);
f76a2828 39
769fbfab
WB
40my $rootfs_desc = {
41 volume => {
42 type => 'string',
43 default_key => 1,
da990295 44 format => 'pve-lxc-mp-string',
769fbfab
WB
45 format_description => 'volume',
46 description => 'Volume, device or directory to mount into the container.',
47 },
48 backup => {
49 type => 'boolean',
50 format_description => '[1|0]',
51 description => 'Whether to include the mountpoint in backups.',
52 optional => 1,
53 },
54 size => {
72d583ff
WB
55 type => 'string',
56 format => 'disk-size',
769fbfab 57 format_description => 'DiskSize',
769fbfab
WB
58 description => 'Volume size (read only value).',
59 optional => 1,
60 },
471dd315
WB
61 acl => {
62 type => 'boolean',
63 format_description => 'acl',
64 description => 'Explicitly enable or disable ACL support.',
65 optional => 1,
66 },
67 ro => {
68 type => 'boolean',
69 format_description => 'ro',
70 description => 'Read-only mountpoint (not supported with bind mounts)',
71 optional => 1,
72 },
50df544c
WB
73 quota => {
74 type => 'boolean',
75 format_description => '[0|1]',
76 description => 'Enable user quotas inside the container (not supported with zfs subvolumes)',
77 optional => 1,
78 },
769fbfab 79};
822de0c3 80
27916659 81PVE::JSONSchema::register_standard_option('pve-ct-rootfs', {
769fbfab 82 type => 'string', format => $rootfs_desc,
8fbd2935 83 description => "Use volume as container root.",
27916659
DM
84 optional => 1,
85});
86
52389a07
DM
87PVE::JSONSchema::register_standard_option('pve-lxc-snapshot-name', {
88 description => "The name of the snapshot.",
89 type => 'string', format => 'pve-configid',
90 maxLength => 40,
91});
92
27916659 93my $confdesc = {
09d3ec42
DM
94 lock => {
95 optional => 1,
96 type => 'string',
97 description => "Lock/unlock the VM.",
98 enum => [qw(migrate backup snapshot rollback)],
99 },
27916659
DM
100 onboot => {
101 optional => 1,
102 type => 'boolean',
103 description => "Specifies whether a VM will be started during system bootup.",
104 default => 0,
117636e5 105 },
27916659 106 startup => get_standard_option('pve-startup-order'),
bb1ac2de
DM
107 template => {
108 optional => 1,
109 type => 'boolean',
110 description => "Enable/disable Template.",
111 default => 0,
112 },
27916659
DM
113 arch => {
114 optional => 1,
115 type => 'string',
116 enum => ['amd64', 'i386'],
117 description => "OS architecture type.",
118 default => 'amd64',
117636e5 119 },
27916659
DM
120 ostype => {
121 optional => 1,
122 type => 'string',
238b7e3e
DM
123 enum => ['debian', 'ubuntu', 'centos', 'fedora', 'opensuse', 'archlinux', 'alpine', 'unmanaged'],
124 description => "OS type. This is used to setup configuration inside the container, and corresponds to lxc setup scripts in /usr/share/lxc/config/<ostype>.common.conf. Value 'unmanaged' can be used to skip and OS specific setup.",
a3249355 125 },
4f958489
DM
126 console => {
127 optional => 1,
128 type => 'boolean',
129 description => "Attach a console device (/dev/console) to the container.",
130 default => 1,
131 },
27916659
DM
132 tty => {
133 optional => 1,
134 type => 'integer',
135 description => "Specify the number of tty available to the container",
136 minimum => 0,
137 maximum => 6,
0d0ca400 138 default => 2,
611fe3aa 139 },
27916659
DM
140 cpulimit => {
141 optional => 1,
142 type => 'number',
c31ad455 143 description => "Limit of CPU usage. Note if the computer has 2 CPUs, it has a total of '2' CPU time. Value '0' indicates no CPU limit.",
27916659
DM
144 minimum => 0,
145 maximum => 128,
146 default => 0,
147 },
148 cpuunits => {
149 optional => 1,
150 type => 'integer',
c31ad455 151 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to the weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
27916659
DM
152 minimum => 0,
153 maximum => 500000,
81bee809 154 default => 1024,
27916659
DM
155 },
156 memory => {
157 optional => 1,
158 type => 'integer',
159 description => "Amount of RAM for the VM in MB.",
160 minimum => 16,
161 default => 512,
162 },
163 swap => {
164 optional => 1,
165 type => 'integer',
166 description => "Amount of SWAP for the VM in MB.",
167 minimum => 0,
168 default => 512,
169 },
170 hostname => {
171 optional => 1,
172 description => "Set a host name for the container.",
159aad3e 173 type => 'string', format => 'dns-name',
27916659
DM
174 maxLength => 255,
175 },
176 description => {
177 optional => 1,
178 type => 'string',
179 description => "Container description. Only used on the configuration web interface.",
180 },
181 searchdomain => {
182 optional => 1,
159aad3e 183 type => 'string', format => 'dns-name-list',
c31ad455 184 description => "Sets DNS search domains for a container. Create will automatically use the setting from the host if you neither set searchdomain nor nameserver.",
27916659
DM
185 },
186 nameserver => {
187 optional => 1,
159aad3e 188 type => 'string', format => 'address-list',
c31ad455 189 description => "Sets DNS server IP address for a container. Create will automatically use the setting from the host if you neither set searchdomain nor nameserver.",
27916659
DM
190 },
191 rootfs => get_standard_option('pve-ct-rootfs'),
09d3ec42
DM
192 parent => {
193 optional => 1,
194 type => 'string', format => 'pve-configid',
195 maxLength => 40,
196 description => "Parent snapshot name. This is used internally, and should not be modified.",
197 },
198 snaptime => {
199 optional => 1,
200 description => "Timestamp for snapshots.",
201 type => 'integer',
202 minimum => 0,
203 },
aca816ad
DM
204 cmode => {
205 optional => 1,
206 description => "Console mode. By default, the console command tries to open a connection to one of the available tty devices. By setting cmode to 'console' it tries to attach to /dev/console instead. If you set cmode to 'shell', it simply invokes a shell inside the container (no login).",
207 type => 'string',
208 enum => ['shell', 'console', 'tty'],
209 default => 'tty',
210 },
7e806596
AG
211 protection => {
212 optional => 1,
213 type => 'boolean',
c31ad455 214 description => "Sets the protection flag of the container. This will prevent the CT or CT's disk remove/update operation.",
7e806596
AG
215 default => 0,
216 },
425b62cb
WB
217 unprivileged => {
218 optional => 1,
219 type => 'boolean',
220 description => "Makes the container run as unprivileged user. (Should not be modified manually.)",
221 default => 0,
222 },
f76a2828
DM
223};
224
e576f689
DM
225my $valid_lxc_conf_keys = {
226 'lxc.include' => 1,
227 'lxc.arch' => 1,
228 'lxc.utsname' => 1,
229 'lxc.haltsignal' => 1,
230 'lxc.rebootsignal' => 1,
231 'lxc.stopsignal' => 1,
232 'lxc.init_cmd' => 1,
233 'lxc.network.type' => 1,
234 'lxc.network.flags' => 1,
235 'lxc.network.link' => 1,
236 'lxc.network.mtu' => 1,
237 'lxc.network.name' => 1,
238 'lxc.network.hwaddr' => 1,
239 'lxc.network.ipv4' => 1,
240 'lxc.network.ipv4.gateway' => 1,
241 'lxc.network.ipv6' => 1,
242 'lxc.network.ipv6.gateway' => 1,
243 'lxc.network.script.up' => 1,
244 'lxc.network.script.down' => 1,
245 'lxc.pts' => 1,
246 'lxc.console.logfile' => 1,
247 'lxc.console' => 1,
248 'lxc.tty' => 1,
249 'lxc.devttydir' => 1,
250 'lxc.hook.autodev' => 1,
251 'lxc.autodev' => 1,
252 'lxc.kmsg' => 1,
253 'lxc.mount' => 1,
254 'lxc.mount.entry' => 1,
255 'lxc.mount.auto' => 1,
312e9850 256 'lxc.rootfs' => 'lxc.rootfs is auto generated from rootfs',
e576f689 257 'lxc.rootfs.mount' => 1,
312e9850
WB
258 'lxc.rootfs.options' => 'lxc.rootfs.options is not supported' .
259 ', please use mountpoint options in the "rootfs" key',
e576f689
DM
260 # lxc.cgroup.*
261 'lxc.cap.drop' => 1,
262 'lxc.cap.keep' => 1,
263 'lxc.aa_profile' => 1,
264 'lxc.aa_allow_incomplete' => 1,
265 'lxc.se_context' => 1,
266 'lxc.seccomp' => 1,
267 'lxc.id_map' => 1,
268 'lxc.hook.pre-start' => 1,
269 'lxc.hook.pre-mount' => 1,
270 'lxc.hook.mount' => 1,
271 'lxc.hook.start' => 1,
53775872 272 'lxc.hook.stop' => 1,
e576f689
DM
273 'lxc.hook.post-stop' => 1,
274 'lxc.hook.clone' => 1,
275 'lxc.hook.destroy' => 1,
276 'lxc.loglevel' => 1,
277 'lxc.logfile' => 1,
278 'lxc.start.auto' => 1,
279 'lxc.start.delay' => 1,
280 'lxc.start.order' => 1,
281 'lxc.group' => 1,
282 'lxc.environment' => 1,
e576f689
DM
283};
284
769fbfab
WB
285my $netconf_desc = {
286 type => {
287 type => 'string',
288 optional => 1,
289 description => "Network interface type.",
290 enum => [qw(veth)],
291 },
292 name => {
293 type => 'string',
294 format_description => 'String',
295 description => 'Name of the network device as seen from inside the container. (lxc.network.name)',
296 pattern => '[-_.\w\d]+',
297 },
298 bridge => {
299 type => 'string',
300 format_description => 'vmbr<Number>',
301 description => 'Bridge to attach the network device to.',
302 pattern => '[-_.\w\d]+',
a7c080a7 303 optional => 1,
769fbfab
WB
304 },
305 hwaddr => {
306 type => 'string',
307 format_description => 'MAC',
308 description => 'Bridge to attach the network device to. (lxc.network.hwaddr)',
309 pattern => qr/(?:[a-f0-9]{2}:){5}[a-f0-9]{2}/i,
310 optional => 1,
311 },
312 mtu => {
313 type => 'integer',
314 format_description => 'Number',
315 description => 'Maximum transfer unit of the interface. (lxc.network.mtu)',
07521af1 316 minimum => 64, # minimum ethernet frame is 64 bytes
769fbfab
WB
317 optional => 1,
318 },
319 ip => {
320 type => 'string',
321 format => 'pve-ipv4-config',
322 format_description => 'IPv4Format/CIDR',
323 description => 'IPv4 address in CIDR format.',
324 optional => 1,
325 },
326 gw => {
327 type => 'string',
328 format => 'ipv4',
329 format_description => 'GatewayIPv4',
330 description => 'Default gateway for IPv4 traffic.',
331 optional => 1,
332 },
333 ip6 => {
334 type => 'string',
335 format => 'pve-ipv6-config',
336 format_description => 'IPv6Format/CIDR',
337 description => 'IPv6 address in CIDR format.',
338 optional => 1,
339 },
340 gw6 => {
341 type => 'string',
342 format => 'ipv6',
343 format_description => 'GatewayIPv6',
344 description => 'Default gateway for IPv6 traffic.',
345 optional => 1,
346 },
347 firewall => {
348 type => 'boolean',
349 format_description => '[1|0]',
350 description => "Controls whether this interface's firewall rules should be used.",
351 optional => 1,
352 },
353 tag => {
354 type => 'integer',
355 format_description => 'VlanNo',
356 minimum => '2',
357 maximum => '4094',
23eb2244
WB
358 description => "VLAN tag for this interface.",
359 optional => 1,
360 },
361 trunks => {
362 type => 'string',
363 pattern => qr/\d+(?:;\d+)*/,
364 format_description => 'vlanid[;vlanid...]',
365 description => "VLAN ids to pass through the interface",
769fbfab
WB
366 optional => 1,
367 },
368};
369PVE::JSONSchema::register_format('pve-lxc-network', $netconf_desc);
370
27916659
DM
371my $MAX_LXC_NETWORKS = 10;
372for (my $i = 0; $i < $MAX_LXC_NETWORKS; $i++) {
373 $confdesc->{"net$i"} = {
374 optional => 1,
1a0a239c 375 type => 'string', format => $netconf_desc,
769fbfab 376 description => "Specifies network interfaces for the container.",
27916659 377 };
90bc31f7
DM
378}
379
da990295
DC
380PVE::JSONSchema::register_format('pve-lxc-mp-string', \&verify_lxc_mp_string);
381sub verify_lxc_mp_string{
382 my ($mp, $noerr) = @_;
383
384 # do not allow:
385 # /./ or /../
386 # /. or /.. at the end
387 # ../ at the beginning
388
389 if($mp =~ m@/\.\.?/@ ||
390 $mp =~ m@/\.\.?$@ ||
391 $mp =~ m@^\.\./@){
392 return undef if $noerr;
393 die "$mp contains illegal character sequences\n";
394 }
395 return $mp;
396}
397
769fbfab
WB
398my $mp_desc = {
399 %$rootfs_desc,
400 mp => {
401 type => 'string',
da990295 402 format => 'pve-lxc-mp-string',
769fbfab
WB
403 format_description => 'Path',
404 description => 'Path to the mountpoint as seen from inside the container.',
769fbfab
WB
405 },
406};
407PVE::JSONSchema::register_format('pve-ct-mountpoint', $mp_desc);
408
69202f71
WB
409my $unuseddesc = {
410 optional => 1,
411 type => 'string', format => 'pve-volume-id',
412 description => "Reference to unused volumes.",
413};
414
02c9d10c
AD
415my $MAX_MOUNT_POINTS = 10;
416for (my $i = 0; $i < $MAX_MOUNT_POINTS; $i++) {
417 $confdesc->{"mp$i"} = {
418 optional => 1,
769fbfab 419 type => 'string', format => $mp_desc,
566d5f81 420 description => "Use volume as container mount point (experimental feature).",
02c9d10c
AD
421 optional => 1,
422 };
423}
424
69202f71
WB
425my $MAX_UNUSED_DISKS = $MAX_MOUNT_POINTS;
426for (my $i = 0; $i < $MAX_MOUNT_POINTS; $i++) {
427 $confdesc->{"unused$i"} = $unuseddesc;
428}
429
27916659
DM
430sub write_pct_config {
431 my ($filename, $conf) = @_;
f76a2828 432
27916659 433 delete $conf->{snapstate}; # just to be sure
f76a2828 434
27916659
DM
435 my $generate_raw_config = sub {
436 my ($conf) = @_;
f76a2828 437
27916659 438 my $raw = '';
cbb03fea 439
27916659
DM
440 # add description as comment to top of file
441 my $descr = $conf->{description} || '';
442 foreach my $cl (split(/\n/, $descr)) {
443 $raw .= '#' . PVE::Tools::encode_text($cl) . "\n";
a12a36e0 444 }
fff3a342 445
27916659 446 foreach my $key (sort keys %$conf) {
09d3ec42 447 next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' ||
e576f689 448 $key eq 'snapshots' || $key eq 'snapname' || $key eq 'lxc';
545d10ba
DM
449 my $value = $conf->{$key};
450 die "detected invalid newline inside property '$key'\n" if $value =~ m/\n/;
451 $raw .= "$key: $value\n";
a12a36e0 452 }
e576f689
DM
453
454 if (my $lxcconf = $conf->{lxc}) {
455 foreach my $entry (@$lxcconf) {
456 my ($k, $v) = @$entry;
457 $raw .= "$k: $v\n";
458 }
459 }
460
27916659 461 return $raw;
a12a36e0 462 };
160f0941 463
27916659 464 my $raw = &$generate_raw_config($conf);
a12a36e0 465
27916659
DM
466 foreach my $snapname (sort keys %{$conf->{snapshots}}) {
467 $raw .= "\n[$snapname]\n";
468 $raw .= &$generate_raw_config($conf->{snapshots}->{$snapname});
f76a2828
DM
469 }
470
f76a2828
DM
471 return $raw;
472}
473
27916659
DM
474sub check_type {
475 my ($key, $value) = @_;
822de0c3 476
27916659 477 die "unknown setting '$key'\n" if !$confdesc->{$key};
822de0c3 478
27916659
DM
479 my $type = $confdesc->{$key}->{type};
480
481 if (!defined($value)) {
482 die "got undefined value\n";
483 }
484
485 if ($value =~ m/[\n\r]/) {
486 die "property contains a line feed\n";
487 }
822de0c3 488
27916659
DM
489 if ($type eq 'boolean') {
490 return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
491 return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
492 die "type check ('boolean') failed - got '$value'\n";
493 } elsif ($type eq 'integer') {
494 return int($1) if $value =~ m/^(\d+)$/;
495 die "type check ('integer') failed - got '$value'\n";
496 } elsif ($type eq 'number') {
497 return $value if $value =~ m/^(\d+)(\.\d+)?$/;
498 die "type check ('number') failed - got '$value'\n";
499 } elsif ($type eq 'string') {
500 if (my $fmt = $confdesc->{$key}->{format}) {
501 PVE::JSONSchema::check_format($fmt, $value);
502 return $value;
503 }
cbb03fea 504 return $value;
822de0c3 505 } else {
27916659 506 die "internal error"
822de0c3 507 }
822de0c3
DM
508}
509
27916659 510sub parse_pct_config {
f76a2828
DM
511 my ($filename, $raw) = @_;
512
513 return undef if !defined($raw);
514
27916659 515 my $res = {
f76a2828 516 digest => Digest::SHA::sha1_hex($raw),
27916659 517 snapshots => {},
f76a2828
DM
518 };
519
27916659 520 $filename =~ m|/lxc/(\d+).conf$|
f76a2828
DM
521 || die "got strange filename '$filename'";
522
523 my $vmid = $1;
524
27916659
DM
525 my $conf = $res;
526 my $descr = '';
527 my $section = '';
528
529 my @lines = split(/\n/, $raw);
530 foreach my $line (@lines) {
531 next if $line =~ m/^\s*$/;
532
533 if ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
534 $section = $1;
535 $conf->{description} = $descr if $descr;
536 $descr = '';
537 $conf = $res->{snapshots}->{$section} = {};
538 next;
a12a36e0 539 }
a12a36e0 540
27916659
DM
541 if ($line =~ m/^\#(.*)\s*$/) {
542 $descr .= PVE::Tools::decode_text($1) . "\n";
543 next;
f76a2828 544 }
5d186e16 545
545d10ba 546 if ($line =~ m/^(lxc\.[a-z0-9_\-\.]+)(:|\s*=)\s*(.*?)\s*$/) {
e576f689
DM
547 my $key = $1;
548 my $value = $3;
a23d627d
WB
549 my $validity = $valid_lxc_conf_keys->{$key} || 0;
550 if ($validity eq 1 || $key =~ m/^lxc\.cgroup\./) {
e576f689 551 push @{$conf->{lxc}}, [$key, $value];
a23d627d 552 } elsif (my $errmsg = $validity) {
312e9850 553 warn "vm $vmid - $key: $errmsg\n";
e576f689
DM
554 } else {
555 warn "vm $vmid - unable to parse config: $line\n";
556 }
557 } elsif ($line =~ m/^(description):\s*(.*\S)\s*$/) {
27916659
DM
558 $descr .= PVE::Tools::decode_text($2);
559 } elsif ($line =~ m/snapstate:\s*(prepare|delete)\s*$/) {
560 $conf->{snapstate} = $1;
fe9a4ab3 561 } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S.*)\s*$/) {
27916659 562 my $key = $1;
5d186e16 563 my $value = $2;
27916659
DM
564 eval { $value = check_type($key, $value); };
565 warn "vm $vmid - unable to parse value of '$key' - $@" if $@;
566 $conf->{$key} = $value;
5d186e16 567 } else {
27916659 568 warn "vm $vmid - unable to parse config: $line\n";
5d186e16 569 }
7dfc49cc
DM
570 }
571
27916659 572 $conf->{description} = $descr if $descr;
5d186e16 573
27916659
DM
574 delete $res->{snapstate}; # just to be sure
575
576 return $res;
f76a2828
DM
577}
578
579sub config_list {
580 my $vmlist = PVE::Cluster::get_vmlist();
581 my $res = {};
582 return $res if !$vmlist || !$vmlist->{ids};
583 my $ids = $vmlist->{ids};
584
585 foreach my $vmid (keys %$ids) {
586 next if !$vmid; # skip CT0
587 my $d = $ids->{$vmid};
588 next if !$d->{node} || $d->{node} ne $nodename;
589 next if !$d->{type} || $d->{type} ne 'lxc';
590 $res->{$vmid}->{type} = 'lxc';
591 }
592 return $res;
593}
594
595sub cfs_config_path {
596 my ($vmid, $node) = @_;
597
598 $node = $nodename if !$node;
27916659 599 return "nodes/$node/lxc/$vmid.conf";
f76a2828
DM
600}
601
9c2d4ce9
DM
602sub config_file {
603 my ($vmid, $node) = @_;
604
605 my $cfspath = cfs_config_path($vmid, $node);
606 return "/etc/pve/$cfspath";
607}
608
f76a2828 609sub load_config {
d18499cf 610 my ($vmid, $node) = @_;
f76a2828 611
d18499cf
TL
612 $node = $nodename if !$node;
613 my $cfspath = cfs_config_path($vmid, $node);
f76a2828
DM
614
615 my $conf = PVE::Cluster::cfs_read_file($cfspath);
c31ad455 616 die "container $vmid does not exist\n" if !defined($conf);
f76a2828
DM
617
618 return $conf;
619}
620
5b4657d0
DM
621sub create_config {
622 my ($vmid, $conf) = @_;
623
624 my $dir = "/etc/pve/nodes/$nodename/lxc";
625 mkdir $dir;
626
5b4657d0
DM
627 write_config($vmid, $conf);
628}
629
630sub destroy_config {
631 my ($vmid) = @_;
632
27916659 633 unlink config_file($vmid, $nodename);
5b4657d0
DM
634}
635
f76a2828
DM
636sub write_config {
637 my ($vmid, $conf) = @_;
638
639 my $cfspath = cfs_config_path($vmid);
640
641 PVE::Cluster::cfs_write_file($cfspath, $conf);
642}
643
d14a9a1b 644# flock: we use one file handle per process, so lock file
c31ad455 645# can be called multiple times and will succeed for the same process.
d14a9a1b
DM
646
647my $lock_handles = {};
648my $lockdir = "/run/lock/lxc";
649
3cc56749 650sub config_file_lock {
d14a9a1b 651 my ($vmid) = @_;
cbb03fea 652
53396388 653 return "$lockdir/pve-config-${vmid}.lock";
d14a9a1b
DM
654}
655
3cc56749 656sub lock_config_full {
2d3f23be 657 my ($vmid, $timeout, $code, @param) = @_;
d14a9a1b 658
3cc56749 659 my $filename = config_file_lock($vmid);
d14a9a1b 660
3cc56749
FG
661 mkdir $lockdir if !-d $lockdir;
662
663 my $res = lock_file($filename, $timeout, $code, @param);
664
665 die $@ if $@;
666
667 return $res;
668}
669
670sub lock_config_mode {
671 my ($vmid, $timeout, $shared, $code, @param) = @_;
672
673 my $filename = config_file_lock($vmid);
d14a9a1b 674
f99e8278
AD
675 mkdir $lockdir if !-d $lockdir;
676
3cc56749 677 my $res = lock_file_full($filename, $timeout, $shared, $code, @param);
f76a2828 678
2d3f23be 679 die $@ if $@;
f76a2828
DM
680
681 return $res;
682}
683
3cc56749
FG
684sub lock_config {
685 my ($vmid, $code, @param) = @_;
686
687 return lock_config_full($vmid, 10, $code, @param);
688}
689
ec52ac21
DM
690sub option_exists {
691 my ($name) = @_;
692
693 return defined($confdesc->{$name});
694}
f76a2828
DM
695
696# add JSON properties for create and set function
697sub json_config_properties {
698 my $prop = shift;
699
700 foreach my $opt (keys %$confdesc) {
09d3ec42 701 next if $opt eq 'parent' || $opt eq 'snaptime';
27916659
DM
702 next if $prop->{$opt};
703 $prop->{$opt} = $confdesc->{$opt};
704 }
705
706 return $prop;
707}
708
822de0c3
DM
709# container status helpers
710
711sub list_active_containers {
cbb03fea 712
822de0c3
DM
713 my $filename = "/proc/net/unix";
714
715 # similar test is used by lcxcontainers.c: list_active_containers
716 my $res = {};
cbb03fea 717
822de0c3
DM
718 my $fh = IO::File->new ($filename, "r");
719 return $res if !$fh;
720
721 while (defined(my $line = <$fh>)) {
722 if ($line =~ m/^[a-f0-9]+:\s\S+\s\S+\s\S+\s\S+\s\S+\s\d+\s(\S+)$/) {
723 my $path = $1;
27916659 724 if ($path =~ m!^@/var/lib/lxc/(\d+)/command$!) {
822de0c3
DM
725 $res->{$1} = 1;
726 }
727 }
728 }
729
730 close($fh);
cbb03fea 731
822de0c3
DM
732 return $res;
733}
f76a2828 734
5c752bbf
DM
735# warning: this is slow
736sub check_running {
737 my ($vmid) = @_;
738
739 my $active_hash = list_active_containers();
740
741 return 1 if defined($active_hash->{$vmid});
cbb03fea 742
5c752bbf
DM
743 return undef;
744}
745
10fc3ba5 746sub get_container_disk_usage {
73e03cb7 747 my ($vmid, $pid) = @_;
10fc3ba5 748
73e03cb7 749 return PVE::Tools::df("/proc/$pid/root/", 1);
10fc3ba5
DM
750}
751
688afc63
WL
752my $last_proc_vmid_stat;
753
754my $parse_cpuacct_stat = sub {
755 my ($vmid) = @_;
756
757 my $raw = read_cgroup_value('cpuacct', $vmid, 'cpuacct.stat', 1);
758
759 my $stat = {};
760
761 if ($raw =~ m/^user (\d+)\nsystem (\d+)\n/) {
762
763 $stat->{utime} = $1;
764 $stat->{stime} = $2;
765
766 }
767
768 return $stat;
769};
770
f76a2828
DM
771sub vmstatus {
772 my ($opt_vmid) = @_;
773
774 my $list = $opt_vmid ? { $opt_vmid => { type => 'lxc' }} : config_list();
775
822de0c3 776 my $active_hash = list_active_containers();
cbb03fea 777
688afc63
WL
778 my $cpucount = $cpuinfo->{cpus} || 1;
779
780 my $cdtime = gettimeofday;
781
782 my $uptime = (PVE::ProcFSTools::read_proc_uptime(1))[0];
783
f76a2828 784 foreach my $vmid (keys %$list) {
f76a2828 785 my $d = $list->{$vmid};
10fc3ba5 786
d5588ee3
DM
787 eval { $d->{pid} = find_lxc_pid($vmid) if defined($active_hash->{$vmid}); };
788 warn $@ if $@; # ignore errors (consider them stopped)
cbb03fea 789
d5588ee3 790 $d->{status} = $d->{pid} ? 'running' : 'stopped';
f76a2828
DM
791
792 my $cfspath = cfs_config_path($vmid);
238a56cb 793 my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};
cbb03fea 794
27916659 795 $d->{name} = $conf->{'hostname'} || "CT$vmid";
238a56cb 796 $d->{name} =~ s/[\s]//g;
cbb03fea 797
9db5687d 798 $d->{cpus} = $conf->{cpulimit} || $cpucount;
44da0641 799
d5588ee3
DM
800 if ($d->{pid}) {
801 my $res = get_container_disk_usage($vmid, $d->{pid});
27916659
DM
802 $d->{disk} = $res->{used};
803 $d->{maxdisk} = $res->{total};
804 } else {
805 $d->{disk} = 0;
806 # use 4GB by default ??
807 if (my $rootfs = $conf->{rootfs}) {
44a9face 808 my $rootinfo = parse_ct_rootfs($rootfs);
27916659
DM
809 $d->{maxdisk} = int(($rootinfo->{size} || 4)*1024*1024)*1024;
810 } else {
811 $d->{maxdisk} = 4*1024*1024*1024;
10fc3ba5 812 }
238a56cb 813 }
cbb03fea 814
238a56cb
DM
815 $d->{mem} = 0;
816 $d->{swap} = 0;
95df9a12
DM
817 $d->{maxmem} = ($conf->{memory}||512)*1024*1024;
818 $d->{maxswap} = ($conf->{swap}//0)*1024*1024;
e901d418 819
238a56cb
DM
820 $d->{uptime} = 0;
821 $d->{cpu} = 0;
e901d418 822
238a56cb
DM
823 $d->{netout} = 0;
824 $d->{netin} = 0;
f76a2828 825
238a56cb
DM
826 $d->{diskread} = 0;
827 $d->{diskwrite} = 0;
bb1ac2de
DM
828
829 $d->{template} = is_template($conf);
f76a2828 830 }
cbb03fea 831
238a56cb
DM
832 foreach my $vmid (keys %$list) {
833 my $d = $list->{$vmid};
d5588ee3
DM
834 my $pid = $d->{pid};
835
836 next if !$pid; # skip stopped CTs
f76a2828 837
88a8696b
TL
838 my $ctime = (stat("/proc/$pid"))[10]; # 10 = ctime
839 $d->{uptime} = time - $ctime; # the method lxcfs uses
22a77285 840
238a56cb
DM
841 $d->{mem} = read_cgroup_value('memory', $vmid, 'memory.usage_in_bytes');
842 $d->{swap} = read_cgroup_value('memory', $vmid, 'memory.memsw.usage_in_bytes') - $d->{mem};
b5289322
AD
843
844 my $blkio_bytes = read_cgroup_value('blkio', $vmid, 'blkio.throttle.io_service_bytes', 1);
1e647c7c 845 my @bytes = split(/\n/, $blkio_bytes);
b5289322 846 foreach my $byte (@bytes) {
1e647c7c
DM
847 if (my ($key, $value) = $byte =~ /(Read|Write)\s+(\d+)/) {
848 $d->{diskread} = $2 if $key eq 'Read';
849 $d->{diskwrite} = $2 if $key eq 'Write';
850 }
b5289322 851 }
688afc63
WL
852
853 my $pstat = &$parse_cpuacct_stat($vmid);
854
855 my $used = $pstat->{utime} + $pstat->{stime};
856
857 my $old = $last_proc_vmid_stat->{$vmid};
858 if (!$old) {
859 $last_proc_vmid_stat->{$vmid} = {
860 time => $cdtime,
861 used => $used,
862 cpu => 0,
863 };
864 next;
865 }
866
867 my $dtime = ($cdtime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};
868
869 if ($dtime > 1000) {
870 my $dutime = $used - $old->{used};
871
872 $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
873 $last_proc_vmid_stat->{$vmid} = {
874 time => $cdtime,
875 used => $used,
876 cpu => $d->{cpu},
877 };
878 } else {
879 $d->{cpu} = $old->{cpu};
880 }
238a56cb 881 }
cbb03fea 882
68b8f4d1
WL
883 my $netdev = PVE::ProcFSTools::read_proc_net_dev();
884
885 foreach my $dev (keys %$netdev) {
886 next if $dev !~ m/^veth([1-9]\d*)i/;
887 my $vmid = $1;
888 my $d = $list->{$vmid};
889
890 next if !$d;
891
892 $d->{netout} += $netdev->{$dev}->{receive};
893 $d->{netin} += $netdev->{$dev}->{transmit};
894
895 }
896
f76a2828
DM
897 return $list;
898}
899
7c921c80
WB
900sub classify_mountpoint {
901 my ($vol) = @_;
902 if ($vol =~ m!^/!) {
903 return 'device' if $vol =~ m!^/dev/!;
904 return 'bind';
905 }
906 return 'volume';
907}
908
44a9face
DM
909my $parse_ct_mountpoint_full = sub {
910 my ($desc, $data, $noerr) = @_;
27916659
DM
911
912 $data //= '';
913
1b2c1e8c 914 my $res;
44a9face 915 eval { $res = PVE::JSONSchema::parse_property_string($desc, $data) };
1b2c1e8c 916 if ($@) {
ca7feb1a
WB
917 return undef if $noerr;
918 die $@;
27916659
DM
919 }
920
bf4a209a 921 if (defined(my $size = $res->{size})) {
ca7feb1a
WB
922 $size = PVE::JSONSchema::parse_size($size);
923 if (!defined($size)) {
924 return undef if $noerr;
925 die "invalid size: $size\n";
926 }
927 $res->{size} = $size;
27916659
DM
928 }
929
7c921c80
WB
930 $res->{type} = classify_mountpoint($res->{volume});
931
27916659 932 return $res;
44a9face
DM
933};
934
935sub parse_ct_rootfs {
936 my ($data, $noerr) = @_;
937
938 my $res = &$parse_ct_mountpoint_full($rootfs_desc, $data, $noerr);
939
940 $res->{mp} = '/' if defined($res);
941
942 return $res;
943}
944
945sub parse_ct_mountpoint {
946 my ($data, $noerr) = @_;
947
948 return &$parse_ct_mountpoint_full($mp_desc, $data, $noerr);
27916659 949}
7dfc49cc 950
dde7b02b 951sub print_ct_mountpoint {
4fee75fd 952 my ($info, $nomp) = @_;
7c921c80
WB
953 my $skip = [ 'type' ];
954 push @$skip, 'mp' if $nomp;
6708ba93 955 return PVE::JSONSchema::print_property_string($info, $mp_desc, $skip);
bb1ac2de
DM
956}
957
7dfc49cc 958sub print_lxc_network {
f76a2828 959 my $net = shift;
6708ba93 960 return PVE::JSONSchema::print_property_string($net, $netconf_desc);
f76a2828
DM
961}
962
7dfc49cc
DM
963sub parse_lxc_network {
964 my ($data) = @_;
965
966 my $res = {};
967
968 return $res if !$data;
969
ca7feb1a 970 $res = PVE::JSONSchema::parse_property_string($netconf_desc, $data);
7dfc49cc
DM
971
972 $res->{type} = 'veth';
93cdbbfb 973 $res->{hwaddr} = PVE::Tools::random_ether_addr() if !$res->{hwaddr};
cbb03fea 974
7dfc49cc
DM
975 return $res;
976}
f76a2828 977
238a56cb
DM
978sub read_cgroup_value {
979 my ($group, $vmid, $name, $full) = @_;
980
981 my $path = "/sys/fs/cgroup/$group/lxc/$vmid/$name";
982
983 return PVE::Tools::file_get_contents($path) if $full;
984
985 return PVE::Tools::file_read_firstline($path);
986}
987
bf0b8c43
AD
988sub write_cgroup_value {
989 my ($group, $vmid, $name, $value) = @_;
990
991 my $path = "/sys/fs/cgroup/$group/lxc/$vmid/$name";
992 PVE::ProcFSTools::write_proc_entry($path, $value) if -e $path;
993
994}
995
52f1d76b
DM
996sub find_lxc_console_pids {
997
998 my $res = {};
999
1000 PVE::Tools::dir_glob_foreach('/proc', '\d+', sub {
1001 my ($pid) = @_;
1002
1003 my $cmdline = PVE::Tools::file_read_firstline("/proc/$pid/cmdline");
1004 return if !$cmdline;
1005
1006 my @args = split(/\0/, $cmdline);
1007
c31ad455 1008 # search for lxc-console -n <vmid>
cbb03fea 1009 return if scalar(@args) != 3;
52f1d76b
DM
1010 return if $args[1] ne '-n';
1011 return if $args[2] !~ m/^\d+$/;
1012 return if $args[0] !~ m|^(/usr/bin/)?lxc-console$|;
cbb03fea 1013
52f1d76b 1014 my $vmid = $args[2];
cbb03fea 1015
52f1d76b
DM
1016 push @{$res->{$vmid}}, $pid;
1017 });
1018
1019 return $res;
1020}
1021
bedeaaf1
AD
1022sub find_lxc_pid {
1023 my ($vmid) = @_;
1024
1025 my $pid = undef;
1026 my $parser = sub {
1027 my $line = shift;
8b25977f 1028 $pid = $1 if $line =~ m/^PID:\s+(\d+)$/;
bedeaaf1 1029 };
c39aa40a 1030 PVE::Tools::run_command(['lxc-info', '-n', $vmid, '-p'], outfunc => $parser);
bedeaaf1 1031
8b25977f 1032 die "unable to get PID for CT $vmid (not running?)\n" if !$pid;
cbb03fea 1033
8b25977f 1034 return $pid;
bedeaaf1
AD
1035}
1036
cbb03fea 1037# Note: we cannot use Net:IP, because that only allows strict
55fa4e09
DM
1038# CIDR networks
1039sub parse_ipv4_cidr {
1040 my ($cidr, $noerr) = @_;
1041
f7a7b413
WB
1042 if ($cidr =~ m!^($IPV4RE)(?:/(\d+))$! && ($2 > 7) && ($2 <= 32)) {
1043 return { address => $1, netmask => $PVE::Network::ipv4_reverse_mask->[$2] };
55fa4e09 1044 }
cbb03fea 1045
55fa4e09 1046 return undef if $noerr;
cbb03fea 1047
55fa4e09
DM
1048 die "unable to parse ipv4 address/mask\n";
1049}
93285df8 1050
a12a36e0
WL
1051sub check_lock {
1052 my ($conf) = @_;
1053
27916659 1054 die "VM is locked ($conf->{'lock'})\n" if $conf->{'lock'};
a12a36e0
WL
1055}
1056
6da1f91b
WB
1057sub has_lock {
1058 my ($conf, $lock) = @_;
1059 return $conf->{lock} && (!defined($lock) || $lock eq $conf->{lock});
1060}
1061
e22af68f
AG
1062sub check_protection {
1063 my ($vm_conf, $err_msg) = @_;
1064
1065 if ($vm_conf->{protection}) {
1066 die "$err_msg - protection mode enabled\n";
1067 }
1068}
1069
27916659 1070sub update_lxc_config {
c628ffa1 1071 my ($storage_cfg, $vmid, $conf) = @_;
b80dd50a 1072
bb1ac2de
DM
1073 my $dir = "/var/lib/lxc/$vmid";
1074
1075 if ($conf->{template}) {
1076
1077 unlink "$dir/config";
1078
1079 return;
1080 }
1081
27916659 1082 my $raw = '';
b80dd50a 1083
27916659
DM
1084 die "missing 'arch' - internal error" if !$conf->{arch};
1085 $raw .= "lxc.arch = $conf->{arch}\n";
b80dd50a 1086
425b62cb
WB
1087 my $unprivileged = $conf->{unprivileged};
1088 my $custom_idmap = grep { $_->[0] eq 'lxc.id_map' } @{$conf->{lxc}};
1089
27916659 1090 my $ostype = $conf->{ostype} || die "missing 'ostype' - internal error";
238b7e3e 1091 if ($ostype =~ /^(?:debian | ubuntu | centos | fedora | opensuse | archlinux | alpine | unmanaged)$/x) {
c34f7efe
WB
1092 my $inc ="/usr/share/lxc/config/$ostype.common.conf";
1093 $inc ="/usr/share/lxc/config/common.conf" if !-f $inc;
1094 $raw .= "lxc.include = $inc\n";
425b62cb 1095 if ($unprivileged || $custom_idmap) {
c34f7efe
WB
1096 $inc = "/usr/share/lxc/config/$ostype.userns.conf";
1097 $inc = "/usr/share/lxc/config/userns.conf" if !-f $inc;
1098 $raw .= "lxc.include = $inc\n"
425b62cb 1099 }
27916659 1100 } else {
9a7a910b 1101 die "implement me (ostype $ostype)";
27916659 1102 }
b80dd50a 1103
50df544c
WB
1104 # WARNING: DO NOT REMOVE this without making sure that loop device nodes
1105 # cannot be exposed to the container with r/w access (cgroup perms).
1106 # When this is enabled mounts will still remain in the monitor's namespace
1107 # after the container unmounted them and thus will not detach from their
1108 # files while the container is running!
c16b8890 1109 $raw .= "lxc.monitor.unshare = 1\n";
58cc92a9 1110
425b62cb
WB
1111 # Should we read them from /etc/subuid?
1112 if ($unprivileged && !$custom_idmap) {
1113 $raw .= "lxc.id_map = u 0 100000 65536\n";
1114 $raw .= "lxc.id_map = g 0 100000 65536\n";
1115 }
1116
6f035afe 1117 if (!has_dev_console($conf)) {
eeaea429
DM
1118 $raw .= "lxc.console = none\n";
1119 $raw .= "lxc.cgroup.devices.deny = c 5:1 rwm\n";
1120 }
4f958489 1121
0d0ca400 1122 my $ttycount = get_tty_count($conf);
27916659 1123 $raw .= "lxc.tty = $ttycount\n";
cbb03fea 1124
c31ad455 1125 # some init scripts expect a linux terminal (turnkey).
a691a5a3
DM
1126 $raw .= "lxc.environment = TERM=linux\n";
1127
27916659
DM
1128 my $utsname = $conf->{hostname} || "CT$vmid";
1129 $raw .= "lxc.utsname = $utsname\n";
cbb03fea 1130
27916659
DM
1131 my $memory = $conf->{memory} || 512;
1132 my $swap = $conf->{swap} // 0;
1133
1134 my $lxcmem = int($memory*1024*1024);
1135 $raw .= "lxc.cgroup.memory.limit_in_bytes = $lxcmem\n";
a12a36e0 1136
27916659
DM
1137 my $lxcswap = int(($memory + $swap)*1024*1024);
1138 $raw .= "lxc.cgroup.memory.memsw.limit_in_bytes = $lxcswap\n";
1139
1140 if (my $cpulimit = $conf->{cpulimit}) {
1141 $raw .= "lxc.cgroup.cpu.cfs_period_us = 100000\n";
1142 my $value = int(100000*$cpulimit);
1143 $raw .= "lxc.cgroup.cpu.cfs_quota_us = $value\n";
a12a36e0
WL
1144 }
1145
27916659
DM
1146 my $shares = $conf->{cpuunits} || 1024;
1147 $raw .= "lxc.cgroup.cpu.shares = $shares\n";
1148
44a9face 1149 my $mountpoint = parse_ct_rootfs($conf->{rootfs});
a3076d81 1150
c9a5774b 1151 $raw .= "lxc.rootfs = $dir/rootfs\n";
27916659
DM
1152
1153 my $netcount = 0;
1154 foreach my $k (keys %$conf) {
1155 next if $k !~ m/^net(\d+)$/;
1156 my $ind = $1;
a16d94c8 1157 my $d = parse_lxc_network($conf->{$k});
27916659
DM
1158 $netcount++;
1159 $raw .= "lxc.network.type = veth\n";
18862537 1160 $raw .= "lxc.network.veth.pair = veth${vmid}i${ind}\n";
27916659
DM
1161 $raw .= "lxc.network.hwaddr = $d->{hwaddr}\n" if defined($d->{hwaddr});
1162 $raw .= "lxc.network.name = $d->{name}\n" if defined($d->{name});
1163 $raw .= "lxc.network.mtu = $d->{mtu}\n" if defined($d->{mtu});
a12a36e0
WL
1164 }
1165
e576f689
DM
1166 if (my $lxcconf = $conf->{lxc}) {
1167 foreach my $entry (@$lxcconf) {
1168 my ($k, $v) = @$entry;
1169 $netcount++ if $k eq 'lxc.network.type';
1170 $raw .= "$k = $v\n";
1171 }
1172 }
27916659 1173
e576f689
DM
1174 $raw .= "lxc.network.type = empty\n" if !$netcount;
1175
27916659
DM
1176 File::Path::mkpath("$dir/rootfs");
1177
1178 PVE::Tools::file_set_contents("$dir/config", $raw);
b80dd50a
DM
1179}
1180
117636e5
DM
1181# verify and cleanup nameserver list (replace \0 with ' ')
1182sub verify_nameserver_list {
1183 my ($nameserver_list) = @_;
1184
1185 my @list = ();
1186 foreach my $server (PVE::Tools::split_list($nameserver_list)) {
1187 PVE::JSONSchema::pve_verify_ip($server);
1188 push @list, $server;
1189 }
1190
1191 return join(' ', @list);
1192}
1193
1194sub verify_searchdomain_list {
1195 my ($searchdomain_list) = @_;
1196
1197 my @list = ();
1198 foreach my $server (PVE::Tools::split_list($searchdomain_list)) {
1199 # todo: should we add checks for valid dns domains?
1200 push @list, $server;
1201 }
1202
1203 return join(' ', @list);
1204}
1205
12e95ae4 1206sub is_volume_in_use {
4defdb73 1207 my ($config, $volid, $include_snapshots) = @_;
12e95ae4
FG
1208 my $used = 0;
1209
1210 foreach_mountpoint($config, sub {
1211 my ($ms, $mountpoint) = @_;
1212 return if $used;
1213 if ($mountpoint->{type} eq 'volume' && $mountpoint->{volume} eq $volid) {
1214 $used = 1;
1215 }
1216 });
1217
4defdb73
FG
1218 my $snapshots = $config->{snapshots};
1219 if ($include_snapshots && $snapshots) {
1220 foreach my $snap (keys %$snapshots) {
1221 $used ||= is_volume_in_use($snapshots->{$snap}, $volid);
1222 }
1223 }
1224
12e95ae4
FG
1225 return $used;
1226}
1227
69202f71
WB
1228sub add_unused_volume {
1229 my ($config, $volid) = @_;
1230
1231 my $key;
1232 for (my $ind = $MAX_UNUSED_DISKS - 1; $ind >= 0; $ind--) {
1233 my $test = "unused$ind";
1234 if (my $vid = $config->{$test}) {
1235 return if $vid eq $volid; # do not add duplicates
1236 } else {
1237 $key = $test;
1238 }
1239 }
1240
c31ad455 1241 die "Too many unused volumes - please delete them first.\n" if !$key;
69202f71
WB
1242
1243 $config->{$key} = $volid;
1244
1245 return $key;
1246}
1247
27916659 1248sub update_pct_config {
93285df8
DM
1249 my ($vmid, $conf, $running, $param, $delete) = @_;
1250
bf0b8c43
AD
1251 my @nohotplug;
1252
7b49dfe0 1253 my $new_disks = 0;
69202f71 1254 my @deleted_volumes;
4fee75fd 1255
cbb03fea
DM
1256 my $rootdir;
1257 if ($running) {
bedeaaf1 1258 my $pid = find_lxc_pid($vmid);
cbb03fea 1259 $rootdir = "/proc/$pid/root";
bedeaaf1
AD
1260 }
1261
7a168607
DM
1262 my $hotplug_error = sub {
1263 if ($running) {
a6a77cfa
WB
1264 push @nohotplug, @_;
1265 return 1;
7a168607
DM
1266 } else {
1267 return 0;
a6a77cfa 1268 }
7a168607 1269 };
a6a77cfa 1270
93285df8
DM
1271 if (defined($delete)) {
1272 foreach my $opt (@$delete) {
a61a5448
WB
1273 if (!exists($conf->{$opt})) {
1274 warn "no such option: $opt\n";
1275 next;
1276 }
1277
27916659 1278 if ($opt eq 'hostname' || $opt eq 'memory' || $opt eq 'rootfs') {
93285df8
DM
1279 die "unable to delete required option '$opt'\n";
1280 } elsif ($opt eq 'swap') {
27916659 1281 delete $conf->{$opt};
bf0b8c43 1282 write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", -1);
40603eb3 1283 } elsif ($opt eq 'description' || $opt eq 'onboot' || $opt eq 'startup') {
27916659 1284 delete $conf->{$opt};
4f958489 1285 } elsif ($opt eq 'nameserver' || $opt eq 'searchdomain' ||
40603eb3 1286 $opt eq 'tty' || $opt eq 'console' || $opt eq 'cmode') {
a6a77cfa 1287 next if $hotplug_error->($opt);
27916659 1288 delete $conf->{$opt};
68fba17b 1289 } elsif ($opt =~ m/^net(\d)$/) {
93285df8 1290 delete $conf->{$opt};
68fba17b
AD
1291 next if !$running;
1292 my $netid = $1;
18862537 1293 PVE::Network::veth_delete("veth${vmid}i$netid");
7e806596
AG
1294 } elsif ($opt eq 'protection') {
1295 delete $conf->{$opt};
69202f71 1296 } elsif ($opt =~ m/^unused(\d+)$/) {
a6a77cfa 1297 next if $hotplug_error->($opt);
69202f71
WB
1298 check_protection($conf, "can't remove CT $vmid drive '$opt'");
1299 push @deleted_volumes, $conf->{$opt};
1300 delete $conf->{$opt};
4fee75fd 1301 } elsif ($opt =~ m/^mp(\d+)$/) {
a6a77cfa 1302 next if $hotplug_error->($opt);
e22af68f 1303 check_protection($conf, "can't remove CT $vmid drive '$opt'");
12e95ae4 1304 my $mp = parse_ct_mountpoint($conf->{$opt});
4fee75fd 1305 delete $conf->{$opt};
12e95ae4
FG
1306 if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
1307 add_unused_volume($conf, $mp->{volume});
1308 }
425b62cb
WB
1309 } elsif ($opt eq 'unprivileged') {
1310 die "unable to delete read-only option: '$opt'\n";
93285df8 1311 } else {
9a7a910b 1312 die "implement me (delete: $opt)"
93285df8 1313 }
706c9791 1314 write_config($vmid, $conf) if $running;
93285df8
DM
1315 }
1316 }
1317
be6383d7
WB
1318 # There's no separate swap size to configure, there's memory and "total"
1319 # memory (iow. memory+swap). This means we have to change them together.
27916659
DM
1320 my $wanted_memory = PVE::Tools::extract_param($param, 'memory');
1321 my $wanted_swap = PVE::Tools::extract_param($param, 'swap');
be6383d7 1322 if (defined($wanted_memory) || defined($wanted_swap)) {
27916659 1323
a2c57b0c
WB
1324 my $old_memory = ($conf->{memory} || 512);
1325 my $old_swap = ($conf->{swap} || 0);
1326
1327 $wanted_memory //= $old_memory;
1328 $wanted_swap //= $old_swap;
27916659
DM
1329
1330 my $total = $wanted_memory + $wanted_swap;
1331 if ($running) {
a2c57b0c
WB
1332 my $old_total = $old_memory + $old_swap;
1333 if ($total > $old_total) {
1334 write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", int($total*1024*1024));
1335 write_cgroup_value("memory", $vmid, "memory.limit_in_bytes", int($wanted_memory*1024*1024));
1336 } else {
1337 write_cgroup_value("memory", $vmid, "memory.limit_in_bytes", int($wanted_memory*1024*1024));
1338 write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", int($total*1024*1024));
1339 }
be6383d7 1340 }
27916659
DM
1341 $conf->{memory} = $wanted_memory;
1342 $conf->{swap} = $wanted_swap;
1343
706c9791 1344 write_config($vmid, $conf) if $running;
be6383d7
WB
1345 }
1346
dfab6edb
WB
1347 my $used_volids = {};
1348
93285df8
DM
1349 foreach my $opt (keys %$param) {
1350 my $value = $param->{$opt};
1351 if ($opt eq 'hostname') {
27916659 1352 $conf->{$opt} = $value;
a99b3509 1353 } elsif ($opt eq 'onboot') {
27916659 1354 $conf->{$opt} = $value ? 1 : 0;
a3249355 1355 } elsif ($opt eq 'startup') {
27916659 1356 $conf->{$opt} = $value;
40603eb3 1357 } elsif ($opt eq 'tty' || $opt eq 'console' || $opt eq 'cmode') {
a6a77cfa 1358 next if $hotplug_error->($opt);
e576f689 1359 $conf->{$opt} = $value;
ffa1d001 1360 } elsif ($opt eq 'nameserver') {
a6a77cfa 1361 next if $hotplug_error->($opt);
117636e5 1362 my $list = verify_nameserver_list($value);
27916659 1363 $conf->{$opt} = $list;
ffa1d001 1364 } elsif ($opt eq 'searchdomain') {
a6a77cfa 1365 next if $hotplug_error->($opt);
117636e5 1366 my $list = verify_searchdomain_list($value);
27916659 1367 $conf->{$opt} = $list;
45573f7c 1368 } elsif ($opt eq 'cpulimit') {
a6a77cfa 1369 next if $hotplug_error->($opt); # FIXME: hotplug
27916659 1370 $conf->{$opt} = $value;
b80dd50a 1371 } elsif ($opt eq 'cpuunits') {
27916659 1372 $conf->{$opt} = $value;
bf0b8c43 1373 write_cgroup_value("cpu", $vmid, "cpu.shares", $value);
93285df8 1374 } elsif ($opt eq 'description') {
27916659 1375 $conf->{$opt} = PVE::Tools::encode_text($value);
93285df8
DM
1376 } elsif ($opt =~ m/^net(\d+)$/) {
1377 my $netid = $1;
a16d94c8 1378 my $net = parse_lxc_network($value);
27916659
DM
1379 if (!$running) {
1380 $conf->{$opt} = print_lxc_network($net);
cbb03fea 1381 } else {
bedeaaf1
AD
1382 update_net($vmid, $conf, $opt, $net, $netid, $rootdir);
1383 }
7e806596
AG
1384 } elsif ($opt eq 'protection') {
1385 $conf->{$opt} = $value ? 1 : 0;
4fee75fd 1386 } elsif ($opt =~ m/^mp(\d+)$/) {
a6a77cfa 1387 next if $hotplug_error->($opt);
e22af68f 1388 check_protection($conf, "can't update CT $vmid drive '$opt'");
12e95ae4 1389 my $old = $conf->{$opt};
4fee75fd 1390 $conf->{$opt} = $value;
12e95ae4
FG
1391 if (defined($old)) {
1392 my $mp = parse_ct_mountpoint($old);
1393 if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
1394 add_unused_volume($conf, $mp->{volume});
1395 }
1396 }
7b49dfe0 1397 $new_disks = 1;
dfab6edb
WB
1398 my $mp = parse_ct_mountpoint($value);
1399 $used_volids->{$mp->{volume}} = 1;
4fee75fd 1400 } elsif ($opt eq 'rootfs') {
55ce8db8 1401 next if $hotplug_error->($opt);
e22af68f 1402 check_protection($conf, "can't update CT $vmid drive '$opt'");
12e95ae4 1403 my $old = $conf->{$opt};
55ce8db8 1404 $conf->{$opt} = $value;
12e95ae4
FG
1405 if (defined($old)) {
1406 my $mp = parse_ct_rootfs($old);
1407 if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
1408 add_unused_volume($conf, $mp->{volume});
1409 }
1410 }
dfab6edb
WB
1411 my $mp = parse_ct_rootfs($value);
1412 $used_volids->{$mp->{volume}} = 1;
425b62cb
WB
1413 } elsif ($opt eq 'unprivileged') {
1414 die "unable to modify read-only option: '$opt'\n";
238b7e3e
DM
1415 } elsif ($opt eq 'ostype') {
1416 next if $hotplug_error->($opt);
1417 $conf->{$opt} = $value;
93285df8 1418 } else {
a92f66c9 1419 die "implement me: $opt";
93285df8 1420 }
706c9791 1421 write_config($vmid, $conf) if $running;
93285df8 1422 }
bf0b8c43 1423
dfab6edb
WB
1424 # Cleanup config:
1425
1426 # Remove unused disks after re-adding
1427 foreach my $key (keys %$conf) {
1428 next if $key !~ /^unused\d+/;
1429 my $volid = $conf->{$key};
1430 if ($used_volids->{$volid}) {
1431 delete $conf->{$key};
1432 }
1433 }
1434
1435 # Apply deletions and creations of new volumes
69202f71
WB
1436 if (@deleted_volumes) {
1437 my $storage_cfg = PVE::Storage::config();
1438 foreach my $volume (@deleted_volumes) {
dfab6edb 1439 next if $used_volids->{$volume}; # could have been re-added, too
4defdb73
FG
1440 # also check for references in snapshots
1441 next if is_volume_in_use($conf, $volume, 1);
69202f71
WB
1442 delete_mountpoint_volume($storage_cfg, $vmid, $volume);
1443 }
1444 }
1445
7b49dfe0 1446 if ($new_disks) {
4fee75fd 1447 my $storage_cfg = PVE::Storage::config();
6c871c36 1448 create_disks($storage_cfg, $vmid, $conf, $conf);
4fee75fd 1449 }
694c25df
WB
1450
1451 # This should be the last thing we do here
1452 if ($running && scalar(@nohotplug)) {
1453 die "unable to modify " . join(',', @nohotplug) . " while container is running\n";
1454 }
93285df8 1455}
c325b32f 1456
6f035afe
DM
1457sub has_dev_console {
1458 my ($conf) = @_;
1459
1460 return !(defined($conf->{console}) && !$conf->{console});
1461}
1462
0d0ca400
DM
1463sub get_tty_count {
1464 my ($conf) = @_;
1465
1466 return $conf->{tty} // $confdesc->{tty}->{default};
1467}
1468
aca816ad
DM
1469sub get_cmode {
1470 my ($conf) = @_;
1471
1472 return $conf->{cmode} // $confdesc->{cmode}->{default};
1473}
1474
1475sub get_console_command {
1476 my ($vmid, $conf) = @_;
1477
1478 my $cmode = get_cmode($conf);
1479
1480 if ($cmode eq 'console') {
1481 return ['lxc-console', '-n', $vmid, '-t', 0];
1482 } elsif ($cmode eq 'tty') {
1483 return ['lxc-console', '-n', $vmid];
1484 } elsif ($cmode eq 'shell') {
1485 return ['lxc-attach', '--clear-env', '-n', $vmid];
1486 } else {
1487 die "internal error";
1488 }
1489}
1490
c325b32f
DM
1491sub get_primary_ips {
1492 my ($conf) = @_;
1493
1494 # return data from net0
cbb03fea 1495
27916659 1496 return undef if !defined($conf->{net0});
a16d94c8 1497 my $net = parse_lxc_network($conf->{net0});
c325b32f
DM
1498
1499 my $ipv4 = $net->{ip};
db78a181
WB
1500 if ($ipv4) {
1501 if ($ipv4 =~ /^(dhcp|manual)$/) {
1502 $ipv4 = undef
1503 } else {
1504 $ipv4 =~ s!/\d+$!!;
1505 }
1506 }
65e5eaa3 1507 my $ipv6 = $net->{ip6};
db78a181 1508 if ($ipv6) {
5f291c7d 1509 if ($ipv6 =~ /^(auto|dhcp|manual)$/) {
db78a181
WB
1510 $ipv6 = undef;
1511 } else {
1512 $ipv6 =~ s!/\d+$!!;
1513 }
1514 }
cbb03fea 1515
c325b32f
DM
1516 return ($ipv4, $ipv6);
1517}
148d1cb4 1518
b407293b
WB
1519sub delete_mountpoint_volume {
1520 my ($storage_cfg, $vmid, $volume) = @_;
1521
7c921c80 1522 return if classify_mountpoint($volume) ne 'volume';
b407293b
WB
1523
1524 my ($vtype, $name, $owner) = PVE::Storage::parse_volname($storage_cfg, $volume);
1525 PVE::Storage::vdisk_free($storage_cfg, $volume) if $vmid == $owner;
1526}
ef241384 1527
27916659 1528sub destroy_lxc_container {
148d1cb4
DM
1529 my ($storage_cfg, $vmid, $conf) = @_;
1530
db8989e1
WB
1531 foreach_mountpoint($conf, sub {
1532 my ($ms, $mountpoint) = @_;
b407293b 1533 delete_mountpoint_volume($storage_cfg, $vmid, $mountpoint->{volume});
db8989e1
WB
1534 });
1535
27916659
DM
1536 rmdir "/var/lib/lxc/$vmid/rootfs";
1537 unlink "/var/lib/lxc/$vmid/config";
1538 rmdir "/var/lib/lxc/$vmid";
1539 destroy_config($vmid);
1540
1541 #my $cmd = ['lxc-destroy', '-n', $vmid ];
1542 #PVE::Tools::run_command($cmd);
148d1cb4 1543}
68fba17b 1544
ef241384 1545sub vm_stop_cleanup {
5fa890f0 1546 my ($storage_cfg, $vmid, $conf, $keepActive) = @_;
ef241384
DM
1547
1548 eval {
1549 if (!$keepActive) {
bf9d912c 1550
09aa32fd 1551 my $vollist = get_vm_volumes($conf);
a8b6b8a7 1552 PVE::Storage::deactivate_volumes($storage_cfg, $vollist);
ef241384
DM
1553 }
1554 };
1555 warn $@ if $@; # avoid errors - just warn
1556}
1557
93cdbbfb
AD
1558my $safe_num_ne = sub {
1559 my ($a, $b) = @_;
1560
1561 return 0 if !defined($a) && !defined($b);
1562 return 1 if !defined($a);
1563 return 1 if !defined($b);
1564
1565 return $a != $b;
1566};
1567
1568my $safe_string_ne = sub {
1569 my ($a, $b) = @_;
1570
1571 return 0 if !defined($a) && !defined($b);
1572 return 1 if !defined($a);
1573 return 1 if !defined($b);
1574
1575 return $a ne $b;
1576};
1577
1578sub update_net {
bedeaaf1 1579 my ($vmid, $conf, $opt, $newnet, $netid, $rootdir) = @_;
93cdbbfb 1580
18862537
WB
1581 if ($newnet->{type} ne 'veth') {
1582 # for when there are physical interfaces
1583 die "cannot update interface of type $newnet->{type}";
1584 }
1585
1586 my $veth = "veth${vmid}i${netid}";
93cdbbfb
AD
1587 my $eth = $newnet->{name};
1588
18862537
WB
1589 if (my $oldnetcfg = $conf->{$opt}) {
1590 my $oldnet = parse_lxc_network($oldnetcfg);
1591
1592 if (&$safe_string_ne($oldnet->{hwaddr}, $newnet->{hwaddr}) ||
1593 &$safe_string_ne($oldnet->{name}, $newnet->{name})) {
93cdbbfb 1594
18862537 1595 PVE::Network::veth_delete($veth);
bedeaaf1 1596 delete $conf->{$opt};
706c9791 1597 write_config($vmid, $conf);
93cdbbfb 1598
18862537 1599 hotplug_net($vmid, $conf, $opt, $newnet, $netid);
bedeaaf1 1600
18862537
WB
1601 } elsif (&$safe_string_ne($oldnet->{bridge}, $newnet->{bridge}) ||
1602 &$safe_num_ne($oldnet->{tag}, $newnet->{tag}) ||
1603 &$safe_num_ne($oldnet->{firewall}, $newnet->{firewall})) {
bedeaaf1 1604
18862537 1605 if ($oldnet->{bridge}) {
bedeaaf1 1606 PVE::Network::tap_unplug($veth);
18862537
WB
1607 foreach (qw(bridge tag firewall)) {
1608 delete $oldnet->{$_};
1609 }
1610 $conf->{$opt} = print_lxc_network($oldnet);
706c9791 1611 write_config($vmid, $conf);
bedeaaf1 1612 }
93cdbbfb 1613
23eb2244 1614 PVE::Network::tap_plug($veth, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks});
18862537
WB
1615 foreach (qw(bridge tag firewall)) {
1616 $oldnet->{$_} = $newnet->{$_} if $newnet->{$_};
1617 }
1618 $conf->{$opt} = print_lxc_network($oldnet);
706c9791 1619 write_config($vmid, $conf);
93cdbbfb
AD
1620 }
1621 } else {
18862537 1622 hotplug_net($vmid, $conf, $opt, $newnet, $netid);
93cdbbfb
AD
1623 }
1624
bedeaaf1 1625 update_ipconfig($vmid, $conf, $opt, $eth, $newnet, $rootdir);
93cdbbfb
AD
1626}
1627
1628sub hotplug_net {
18862537 1629 my ($vmid, $conf, $opt, $newnet, $netid) = @_;
93cdbbfb 1630
18862537 1631 my $veth = "veth${vmid}i${netid}";
cbb03fea 1632 my $vethpeer = $veth . "p";
93cdbbfb
AD
1633 my $eth = $newnet->{name};
1634
1635 PVE::Network::veth_create($veth, $vethpeer, $newnet->{bridge}, $newnet->{hwaddr});
23eb2244 1636 PVE::Network::tap_plug($veth, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks});
93cdbbfb 1637
cbb03fea 1638 # attach peer in container
93cdbbfb
AD
1639 my $cmd = ['lxc-device', '-n', $vmid, 'add', $vethpeer, "$eth" ];
1640 PVE::Tools::run_command($cmd);
1641
cbb03fea 1642 # link up peer in container
93cdbbfb
AD
1643 $cmd = ['lxc-attach', '-n', $vmid, '-s', 'NETWORK', '--', '/sbin/ip', 'link', 'set', $eth ,'up' ];
1644 PVE::Tools::run_command($cmd);
bedeaaf1 1645
18862537
WB
1646 my $done = { type => 'veth' };
1647 foreach (qw(bridge tag firewall hwaddr name)) {
1648 $done->{$_} = $newnet->{$_} if $newnet->{$_};
1649 }
1650 $conf->{$opt} = print_lxc_network($done);
bedeaaf1 1651
706c9791 1652 write_config($vmid, $conf);
93cdbbfb
AD
1653}
1654
68a05bb3 1655sub update_ipconfig {
bedeaaf1
AD
1656 my ($vmid, $conf, $opt, $eth, $newnet, $rootdir) = @_;
1657
f2104b80 1658 my $lxc_setup = PVE::LXC::Setup->new($conf, $rootdir);
bedeaaf1 1659
18862537 1660 my $optdata = parse_lxc_network($conf->{$opt});
84e0c123
WB
1661 my $deleted = [];
1662 my $added = [];
8d723477
WB
1663 my $nscmd = sub {
1664 my $cmdargs = shift;
1665 PVE::Tools::run_command(['lxc-attach', '-n', $vmid, '-s', 'NETWORK', '--', @_], %$cmdargs);
84e0c123 1666 };
8d723477 1667 my $ipcmd = sub { &$nscmd({}, '/sbin/ip', @_) };
2bfd1615 1668
84e0c123 1669 my $change_ip_config = sub {
f39002a6
DM
1670 my ($ipversion) = @_;
1671
1672 my $family_opt = "-$ipversion";
1673 my $suffix = $ipversion == 4 ? '' : $ipversion;
84e0c123
WB
1674 my $gw= "gw$suffix";
1675 my $ip= "ip$suffix";
bedeaaf1 1676
6178b0dd
WB
1677 my $newip = $newnet->{$ip};
1678 my $newgw = $newnet->{$gw};
1679 my $oldip = $optdata->{$ip};
1680
1681 my $change_ip = &$safe_string_ne($oldip, $newip);
1682 my $change_gw = &$safe_string_ne($optdata->{$gw}, $newgw);
bedeaaf1 1683
84e0c123 1684 return if !$change_ip && !$change_gw;
68a05bb3 1685
84e0c123 1686 # step 1: add new IP, if this fails we cancel
292aff54
WB
1687 my $is_real_ip = ($newip && $newip !~ /^(?:auto|dhcp|manual)$/);
1688 if ($change_ip && $is_real_ip) {
8d723477 1689 eval { &$ipcmd($family_opt, 'addr', 'add', $newip, 'dev', $eth); };
84e0c123
WB
1690 if (my $err = $@) {
1691 warn $err;
1692 return;
1693 }
bedeaaf1 1694 }
bedeaaf1 1695
84e0c123
WB
1696 # step 2: replace gateway
1697 # If this fails we delete the added IP and cancel.
1698 # If it succeeds we save the config and delete the old IP, ignoring
1699 # errors. The config is then saved.
1700 # Note: 'ip route replace' can add
1701 if ($change_gw) {
6178b0dd 1702 if ($newgw) {
292aff54
WB
1703 eval {
1704 if ($is_real_ip && !PVE::Network::is_ip_in_cidr($newgw, $newip, $ipversion)) {
1705 &$ipcmd($family_opt, 'route', 'add', $newgw, 'dev', $eth);
1706 }
1707 &$ipcmd($family_opt, 'route', 'replace', 'default', 'via', $newgw);
1708 };
84e0c123
WB
1709 if (my $err = $@) {
1710 warn $err;
1711 # the route was not replaced, the old IP is still available
1712 # rollback (delete new IP) and cancel
1713 if ($change_ip) {
8d723477 1714 eval { &$ipcmd($family_opt, 'addr', 'del', $newip, 'dev', $eth); };
84e0c123
WB
1715 warn $@ if $@; # no need to die here
1716 }
1717 return;
1718 }
1719 } else {
8d723477 1720 eval { &$ipcmd($family_opt, 'route', 'del', 'default'); };
84e0c123
WB
1721 # if the route was not deleted, the guest might have deleted it manually
1722 # warn and continue
1723 warn $@ if $@;
1724 }
2bfd1615 1725 }
2bfd1615 1726
6178b0dd 1727 # from this point on we save the configuration
84e0c123 1728 # step 3: delete old IP ignoring errors
6178b0dd 1729 if ($change_ip && $oldip && $oldip !~ /^(?:auto|dhcp)$/) {
8d723477
WB
1730 # We need to enable promote_secondaries, otherwise our newly added
1731 # address will be removed along with the old one.
1732 my $promote = 0;
1733 eval {
1734 if ($ipversion == 4) {
1735 &$nscmd({ outfunc => sub { $promote = int(shift) } },
1736 'cat', "/proc/sys/net/ipv4/conf/$eth/promote_secondaries");
1737 &$nscmd({}, 'sysctl', "net.ipv4.conf.$eth.promote_secondaries=1");
1738 }
1739 &$ipcmd($family_opt, 'addr', 'del', $oldip, 'dev', $eth);
1740 };
84e0c123 1741 warn $@ if $@; # no need to die here
8d723477
WB
1742
1743 if ($ipversion == 4) {
1744 &$nscmd({}, 'sysctl', "net.ipv4.conf.$eth.promote_secondaries=$promote");
1745 }
bedeaaf1
AD
1746 }
1747
84e0c123
WB
1748 foreach my $property ($ip, $gw) {
1749 if ($newnet->{$property}) {
1750 $optdata->{$property} = $newnet->{$property};
1751 } else {
1752 delete $optdata->{$property};
1753 }
bedeaaf1 1754 }
18862537 1755 $conf->{$opt} = print_lxc_network($optdata);
706c9791 1756 write_config($vmid, $conf);
84e0c123
WB
1757 $lxc_setup->setup_network($conf);
1758 };
bedeaaf1 1759
f39002a6
DM
1760 &$change_ip_config(4);
1761 &$change_ip_config(6);
489e960d
WL
1762
1763}
1764
a92f66c9
WL
1765# Internal snapshots
1766
1767# NOTE: Snapshot create/delete involves several non-atomic
c31ad455
FG
1768# actions, and can take a long time.
1769# So we try to avoid locking the file and use the 'lock' variable
a92f66c9
WL
1770# inside the config file instead.
1771
1772my $snapshot_copy_config = sub {
1773 my ($source, $dest) = @_;
1774
1775 foreach my $k (keys %$source) {
1776 next if $k eq 'snapshots';
09d3ec42
DM
1777 next if $k eq 'snapstate';
1778 next if $k eq 'snaptime';
1779 next if $k eq 'vmstate';
1780 next if $k eq 'lock';
a92f66c9 1781 next if $k eq 'digest';
09d3ec42 1782 next if $k eq 'description';
0f8b9438 1783 next if $k =~ m/^unused\d+$/;
a92f66c9
WL
1784
1785 $dest->{$k} = $source->{$k};
1786 }
1787};
1788
0f8b9438
FG
1789my $snapshot_apply_config = sub {
1790 my ($conf, $snap) = @_;
1791
1792 # copy snapshot list
1793 my $newconf = {
1794 snapshots => $conf->{snapshots},
1795 };
1796
1797 # keep description and list of unused disks
1798 foreach my $k (keys %$conf) {
1799 next if !($k =~ m/^unused\d+$/ || $k eq 'description');
1800 $newconf->{$k} = $conf->{$k};
1801 }
1802
1803 &$snapshot_copy_config($snap, $newconf);
1804
1805 return $newconf;
1806};
1807
4e8b04cd 1808sub snapshot_save_vmstate {
0f8b9438 1809 die "implement me - snapshot_save_vmstate\n";
4e8b04cd 1810}
0f8b9438 1811
0bfffef4
FG
1812sub snapshot_prepare {
1813 my ($vmid, $snapname, $save_vmstate, $comment) = @_;
a92f66c9
WL
1814
1815 my $snap;
1816
1817 my $updatefn = sub {
1818
1819 my $conf = load_config($vmid);
1820
bb1ac2de
DM
1821 die "you can't take a snapshot if it's a template\n"
1822 if is_template($conf);
1823
a92f66c9
WL
1824 check_lock($conf);
1825
09d3ec42 1826 $conf->{lock} = 'snapshot';
a92f66c9
WL
1827
1828 die "snapshot name '$snapname' already used\n"
1829 if defined($conf->{snapshots}->{$snapname});
1830
1831 my $storecfg = PVE::Storage::config();
41f044fb
FG
1832 die "snapshot feature is not available\n"
1833 if !has_feature('snapshot', $conf, $storecfg, undef, undef, $snapname eq 'vzdump');
a92f66c9
WL
1834
1835 $snap = $conf->{snapshots}->{$snapname} = {};
1836
0f8b9438 1837 if ($save_vmstate && check_running($vmid)) {
4e8b04cd 1838 snapshot_save_vmstate($vmid, $conf, $snapname, $storecfg);
0f8b9438
FG
1839 }
1840
a92f66c9
WL
1841 &$snapshot_copy_config($conf, $snap);
1842
0f8b9438
FG
1843 $snap->{snapstate} = "prepare";
1844 $snap->{snaptime} = time();
1845 $snap->{description} = $comment if $comment;
a92f66c9 1846
706c9791 1847 write_config($vmid, $conf);
a92f66c9
WL
1848 };
1849
3cc56749 1850 lock_config($vmid, $updatefn);
a92f66c9
WL
1851
1852 return $snap;
0bfffef4 1853}
a92f66c9 1854
0bfffef4 1855sub snapshot_commit {
a92f66c9
WL
1856 my ($vmid, $snapname) = @_;
1857
1858 my $updatefn = sub {
1859
1860 my $conf = load_config($vmid);
1861
1862 die "missing snapshot lock\n"
09d3ec42 1863 if !($conf->{lock} && $conf->{lock} eq 'snapshot');
a92f66c9 1864
0f8b9438
FG
1865 my $snap = $conf->{snapshots}->{$snapname};
1866 die "snapshot '$snapname' does not exist\n" if !defined($snap);
a92f66c9
WL
1867
1868 die "wrong snapshot state\n"
0f8b9438 1869 if !($snap->{snapstate} && $snap->{snapstate} eq "prepare");
a92f66c9 1870
0f8b9438 1871 delete $snap->{snapstate};
09d3ec42 1872 delete $conf->{lock};
a92f66c9 1873
4d3d8201 1874 $conf->{parent} = $snapname;
0f8b9438 1875
4d3d8201 1876 write_config($vmid, $conf);
a92f66c9
WL
1877 };
1878
0bfffef4
FG
1879 lock_config($vmid, $updatefn);
1880}
a92f66c9
WL
1881
1882sub has_feature {
41f044fb 1883 my ($feature, $conf, $storecfg, $snapname, $running, $backup_only) = @_;
09d3ec42 1884
a92f66c9 1885 my $err;
09d3ec42 1886
8bf50651
DM
1887 foreach_mountpoint($conf, sub {
1888 my ($ms, $mountpoint) = @_;
1889
2c3ed8c4 1890 return if $err; # skip further test
41f044fb 1891 return if $backup_only && $ms ne 'rootfs' && !$mountpoint->{backup};
2c3ed8c4 1892
41f044fb 1893 $err = 1 if !PVE::Storage::volume_has_feature($storecfg, $feature, $mountpoint->{volume}, $snapname, $running);
8bf50651 1894 });
a92f66c9
WL
1895
1896 return $err ? 0 : 1;
1897}
1898
34fdb3d7
WB
1899my $enter_namespace = sub {
1900 my ($vmid, $pid, $which, $type) = @_;
1901 sysopen my $fd, "/proc/$pid/ns/$which", O_RDONLY
1902 or die "failed to open $which namespace of container $vmid: $!\n";
1903 PVE::Tools::setns(fileno($fd), $type)
1904 or die "failed to enter $which namespace of container $vmid: $!\n";
1905 close $fd;
1906};
1907
1908my $do_syncfs = sub {
1909 my ($vmid, $pid, $socket) = @_;
1910
1911 &$enter_namespace($vmid, $pid, 'mnt', PVE::Tools::CLONE_NEWNS);
1912
1913 # Tell the parent process to start reading our /proc/mounts
1914 print {$socket} "go\n";
1915 $socket->flush();
1916
1917 # Receive /proc/self/mounts
1918 my $mountdata = do { local $/ = undef; <$socket> };
1919 close $socket;
1920
1921 # Now sync all mountpoints...
1922 my $mounts = PVE::ProcFSTools::parse_mounts($mountdata);
1923 foreach my $mp (@$mounts) {
1924 my ($what, $dir, $fs) = @$mp;
1925 next if $fs eq 'fuse.lxcfs';
1926 eval { PVE::Tools::sync_mountpoint($dir); };
1927 warn $@ if $@;
1928 }
1929};
1930
1931sub sync_container_namespace {
1932 my ($vmid) = @_;
1933 my $pid = find_lxc_pid($vmid);
1934
1935 # SOCK_DGRAM is nicer for barriers but cannot be slurped
1936 socketpair my $pfd, my $cfd, AF_UNIX, SOCK_STREAM, PF_UNSPEC
1937 or die "failed to create socketpair: $!\n";
1938
1939 my $child = fork();
1940 die "fork failed: $!\n" if !defined($child);
1941
1942 if (!$child) {
1943 eval {
1944 close $pfd;
1945 &$do_syncfs($vmid, $pid, $cfd);
1946 };
1947 if (my $err = $@) {
1948 warn $err;
1949 POSIX::_exit(1);
1950 }
1951 POSIX::_exit(0);
1952 }
1953 close $cfd;
1954 my $go = <$pfd>;
1955 die "failed to enter container namespace\n" if $go ne "go\n";
1956
1957 open my $mounts, '<', "/proc/$child/mounts"
1958 or die "failed to open container's /proc/mounts: $!\n";
1959 my $mountdata = do { local $/ = undef; <$mounts> };
1960 close $mounts;
1961 print {$pfd} $mountdata;
1962 close $pfd;
1963
1964 while (waitpid($child, 0) != $child) {}
1965 die "failed to sync container namespace\n" if $? != 0;
1966}
1967
5040d81c
FG
1968sub check_freeze_needed {
1969 my ($vmid, $config, $save_vmstate) = @_;
1970
1971 my $ret = check_running($vmid);
1972 return ($ret, $ret);
1973}
1974
489e960d 1975sub snapshot_create {
0bfffef4 1976 my ($vmid, $snapname, $save_vmstate, $comment) = @_;
489e960d 1977
0bfffef4 1978 my $snap = snapshot_prepare($vmid, $snapname, $save_vmstate, $comment);
a92f66c9 1979
5040d81c
FG
1980 $save_vmstate = 0 if !$snap->{vmstate};
1981
09d3ec42 1982 my $conf = load_config($vmid);
a92f66c9 1983
5040d81c 1984 my ($running, $freezefs) = check_freeze_needed($vmid, $conf, $snap->{vmstate});
74bf6d37
FG
1985
1986 my $drivehash = {};
1987
a92f66c9 1988 eval {
5040d81c 1989 if ($freezefs) {
74bf6d37 1990 PVE::Tools::run_command(['/usr/bin/lxc-freeze', '-n', $vmid]);
34fdb3d7 1991 sync_container_namespace($vmid);
5040d81c 1992 }
a92f66c9
WL
1993
1994 my $storecfg = PVE::Storage::config();
5040d81c
FG
1995 foreach_mountpoint($conf, sub {
1996 my ($ms, $mountpoint) = @_;
a92f66c9 1997
5040d81c
FG
1998 return if $snapname eq 'vzdump' && $ms ne 'rootfs' && !$mountpoint->{backup};
1999 PVE::Storage::volume_snapshot($storecfg, $mountpoint->{volume}, $snapname);
2000 $drivehash->{$ms} = 1;
2001 });
a92f66c9 2002 };
2477a7f1
DM
2003 my $err = $@;
2004
5040d81c
FG
2005 if ($running) {
2006 if ($freezefs) {
2007 eval { PVE::Tools::run_command(['/usr/bin/lxc-unfreeze', '-n', $vmid]); };
2008 warn $@ if $@;
2009 }
2477a7f1
DM
2010 }
2011
2012 if ($err) {
5040d81c 2013 warn "snapshot create failed: starting cleanup\n";
74bf6d37 2014 eval { snapshot_delete($vmid, $snapname, 1, $drivehash); };
5040d81c 2015 warn "$@" if $@;
a92f66c9
WL
2016 die "$err\n";
2017 }
74bf6d37 2018
0bfffef4 2019 snapshot_commit($vmid, $snapname);
68a05bb3
AD
2020}
2021
74bf6d37 2022# Note: $drivehash is only set when called from snapshot_create.
57ccb3f8 2023sub snapshot_delete {
74bf6d37 2024 my ($vmid, $snapname, $force, $drivehash) = @_;
57ccb3f8 2025
4de963d4 2026 my $prepare = 1;
31429832 2027
4de963d4 2028 my $snap;
5040d81c 2029 my $unused = [];
31429832 2030
7b2eb379 2031 my $unlink_parent = sub {
7b2eb379 2032 my ($confref, $new_parent) = @_;
31429832 2033
7b2eb379
FG
2034 if ($confref->{parent} && $confref->{parent} eq $snapname) {
2035 if ($new_parent) {
2036 $confref->{parent} = $new_parent;
31429832 2037 } else {
7b2eb379 2038 delete $confref->{parent};
31429832
WL
2039 }
2040 }
7b2eb379
FG
2041 };
2042
4de963d4
FG
2043 my $updatefn = sub {
2044 my ($remove_drive) = @_;
7b2eb379 2045
4de963d4 2046 my $conf = load_config($vmid);
74bf6d37 2047
4de963d4 2048 if (!$drivehash) {
74bf6d37 2049 check_lock($conf);
4de963d4
FG
2050 die "you can't delete a snapshot if vm is a template\n"
2051 if is_template($conf);
74bf6d37 2052 }
7b2eb379 2053
4de963d4
FG
2054 $snap = $conf->{snapshots}->{$snapname};
2055
2056 die "snapshot '$snapname' does not exist\n" if !defined($snap);
2057
2058 # remove parent refs
2059 if (!$prepare) {
2060 &$unlink_parent($conf, $snap->{parent});
2061 foreach my $sn (keys %{$conf->{snapshots}}) {
2062 next if $sn eq $snapname;
2063 &$unlink_parent($conf->{snapshots}->{$sn}, $snap->{parent});
2064 }
7b2eb379
FG
2065 }
2066
4de963d4
FG
2067 if ($remove_drive) {
2068 if ($remove_drive eq 'vmstate') {
2069 die "implement me - saving vmstate\n";
2070 } else {
5040d81c
FG
2071 my $value = $snap->{$remove_drive};
2072 my $mountpoint = $remove_drive eq 'rootfs' ? parse_ct_rootfs($value, 1) : parse_ct_mountpoint($value, 1);
2073 delete $snap->{$remove_drive};
2074 add_unused_volume($snap, $mountpoint->{volume})
2075 if (!is_volume_in_use($snap, $mountpoint->{volume}));
4de963d4
FG
2076 }
2077 }
31429832 2078
4de963d4
FG
2079 if ($prepare) {
2080 $snap->{snapstate} = 'delete';
2081 } else {
2082 delete $conf->{snapshots}->{$snapname};
2083 delete $conf->{lock} if $drivehash;
5040d81c
FG
2084 foreach my $volid (@$unused) {
2085 add_unused_volume($conf, $volid)
2086 if (!is_volume_in_use($conf, $volid));
2087 }
4de963d4 2088 }
31429832 2089
706c9791 2090 write_config($vmid, $conf);
31429832
WL
2091 };
2092
4de963d4
FG
2093 lock_config($vmid, $updatefn);
2094
2095 # now remove vmstate file
2096 # never set for LXC!
2097 my $storecfg = PVE::Storage::config();
2098
2099 if ($snap->{vmstate}) {
2100 die "implement me - saving vmstate\n";
2101 };
31429832 2102
4de963d4 2103 # now remove all volume snapshots
5040d81c
FG
2104 foreach_mountpoint($snap, sub {
2105 my ($ms, $mountpoint) = @_;
2106
2107 return if $snapname eq 'vzdump' && $ms ne 'rootfs' && !$mountpoint->{backup};
2108 if (!$drivehash || $drivehash->{$ms}) {
2109 eval { PVE::Storage::volume_snapshot_delete($storecfg, $mountpoint->{volume}, $snapname); };
2110 if (my $err = $@) {
2111 die $err if !$force;
2112 warn $err;
2113 }
2114 }
2115
2116 # save changes (remove mp from snapshot)
2117 lock_config($vmid, $updatefn, $ms) if !$force;
2118 push @$unused, $mountpoint->{volume};
2119 });
4de963d4
FG
2120
2121 # now cleanup config
2122 $prepare = 0;
2123 lock_config($vmid, $updatefn);
57ccb3f8
WL
2124}
2125
723157f6
WL
2126sub snapshot_rollback {
2127 my ($vmid, $snapname) = @_;
2128
20e5d106
FG
2129 my $prepare = 1;
2130
6860ba0c
WL
2131 my $storecfg = PVE::Storage::config();
2132
2133 my $conf = load_config($vmid);
2134
20e5d106 2135 my $get_snapshot_config = sub {
bb1ac2de 2136
20e5d106 2137 die "you can't rollback if vm is a template\n" if is_template($conf);
6860ba0c 2138
20e5d106 2139 my $res = $conf->{snapshots}->{$snapname};
6860ba0c 2140
20e5d106
FG
2141 die "snapshot '$snapname' does not exist\n" if !defined($res);
2142
2143 return $res;
2144 };
2145
2146 my $snap = &$get_snapshot_config();
2147
5040d81c
FG
2148 foreach_mountpoint($snap, sub {
2149 my ($ms, $mountpoint) = @_;
09d3ec42 2150
5040d81c
FG
2151 PVE::Storage::volume_rollback_is_possible($storecfg, $mountpoint->{volume}, $snapname);
2152 });
6860ba0c
WL
2153
2154 my $updatefn = sub {
2155
20e5d106 2156 $conf = load_config($vmid);
6860ba0c 2157
20e5d106
FG
2158 $snap = &$get_snapshot_config();
2159
2160 die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
2161 if $snap->{snapstate};
6860ba0c 2162
20e5d106
FG
2163 if ($prepare) {
2164 check_lock($conf);
69d4afc7
FG
2165 PVE::Tools::run_command(['/usr/bin/lxc-stop', '-n', $vmid, '--kill'])
2166 if check_running($vmid);
20e5d106 2167 }
6860ba0c
WL
2168
2169 die "unable to rollback vm $vmid: vm is running\n"
2170 if check_running($vmid);
2171
20e5d106
FG
2172 if ($prepare) {
2173 $conf->{lock} = 'rollback';
2174 } else {
2175 die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
2176 delete $conf->{lock};
2177 }
6860ba0c
WL
2178
2179 my $forcemachine;
2180
20e5d106
FG
2181 if (!$prepare) {
2182 # copy snapshot config to current config
2183 $conf = &$snapshot_apply_config($conf, $snap);
2184 $conf->{parent} = $snapname;
2185 }
6860ba0c 2186
706c9791 2187 write_config($vmid, $conf);
6860ba0c 2188
20e5d106 2189 if (!$prepare && $snap->{vmstate}) {
19d36a45 2190 die "implement me - save vmstate\n";
20e5d106 2191 }
6860ba0c
WL
2192 };
2193
3cc56749 2194 lock_config($vmid, $updatefn);
6860ba0c 2195
5040d81c
FG
2196 foreach_mountpoint($snap, sub {
2197 my ($ms, $mountpoint) = @_;
2198
2199 PVE::Storage::volume_snapshot_rollback($storecfg, $mountpoint->{volume}, $snapname);
2200 });
6860ba0c 2201
20e5d106
FG
2202 $prepare = 0;
2203 lock_config($vmid, $updatefn);
723157f6 2204}
b935932a 2205
bb1ac2de
DM
2206sub template_create {
2207 my ($vmid, $conf) = @_;
2208
2209 my $storecfg = PVE::Storage::config();
2210
44a9face 2211 my $rootinfo = parse_ct_rootfs($conf->{rootfs});
bb1ac2de
DM
2212 my $volid = $rootinfo->{volume};
2213
2214 die "Template feature is not available for '$volid'\n"
2215 if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);
2216
2217 PVE::Storage::activate_volumes($storecfg, [$volid]);
2218
2219 my $template_volid = PVE::Storage::vdisk_create_base($storecfg, $volid);
2220 $rootinfo->{volume} = $template_volid;
4fee75fd 2221 $conf->{rootfs} = print_ct_mountpoint($rootinfo, 1);
bb1ac2de
DM
2222
2223 write_config($vmid, $conf);
2224}
2225
2226sub is_template {
2227 my ($conf) = @_;
2228
2229 return 1 if defined $conf->{template} && $conf->{template} == 1;
2230}
2231
9622e848
DM
2232sub mountpoint_names {
2233 my ($reverse) = @_;
ced7fddb 2234
9622e848 2235 my @names = ('rootfs');
eaebef36
DM
2236
2237 for (my $i = 0; $i < $MAX_MOUNT_POINTS; $i++) {
9622e848
DM
2238 push @names, "mp$i";
2239 }
2240
2241 return $reverse ? reverse @names : @names;
2242}
2243
3c9dbfa9 2244
9622e848
DM
2245sub foreach_mountpoint_full {
2246 my ($conf, $reverse, $func) = @_;
2247
2248 foreach my $key (mountpoint_names($reverse)) {
2249 my $value = $conf->{$key};
2250 next if !defined($value);
44a9face 2251 my $mountpoint = $key eq 'rootfs' ? parse_ct_rootfs($value, 1) : parse_ct_mountpoint($value, 1);
ca7feb1a 2252 next if !defined($mountpoint);
3c9dbfa9 2253
eaebef36 2254 &$func($key, $mountpoint);
ced7fddb
AD
2255 }
2256}
2257
9622e848
DM
2258sub foreach_mountpoint {
2259 my ($conf, $func) = @_;
2260
2261 foreach_mountpoint_full($conf, 0, $func);
2262}
2263
2264sub foreach_mountpoint_reverse {
2265 my ($conf, $func) = @_;
2266
2267 foreach_mountpoint_full($conf, 1, $func);
2268}
2269
52389a07 2270sub check_ct_modify_config_perm {
f1ba1a4b 2271 my ($rpcenv, $authuser, $vmid, $pool, $newconf, $delete) = @_;
52389a07 2272
c81f19d1 2273 return 1 if $authuser eq 'root@pam';
52389a07 2274
f1ba1a4b
WB
2275 my $check = sub {
2276 my ($opt, $delete) = @_;
52389a07
DM
2277 if ($opt eq 'cpus' || $opt eq 'cpuunits' || $opt eq 'cpulimit') {
2278 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.CPU']);
e59a61ed 2279 } elsif ($opt eq 'rootfs' || $opt =~ /^mp\d+$/) {
52389a07 2280 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Disk']);
f1ba1a4b
WB
2281 return if $delete;
2282 my $data = $opt eq 'rootfs' ? parse_ct_rootfs($newconf->{$opt})
2283 : parse_ct_mountpoint($newconf->{$opt});
2284 raise_perm_exc("mountpoint type $data->{type}") if $data->{type} ne 'volume';
52389a07
DM
2285 } elsif ($opt eq 'memory' || $opt eq 'swap') {
2286 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Memory']);
2287 } elsif ($opt =~ m/^net\d+$/ || $opt eq 'nameserver' ||
2288 $opt eq 'searchdomain' || $opt eq 'hostname') {
2289 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Network']);
2290 } else {
2291 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Options']);
2292 }
f1ba1a4b
WB
2293 };
2294
2295 foreach my $opt (keys %$newconf) {
2296 &$check($opt, 0);
2297 }
2298 foreach my $opt (@$delete) {
2299 &$check($opt, 1);
52389a07
DM
2300 }
2301
2302 return 1;
2303}
2304
9622e848 2305sub umount_all {
da629848 2306 my ($vmid, $storage_cfg, $conf, $noerr) = @_;
9622e848
DM
2307
2308 my $rootdir = "/var/lib/lxc/$vmid/rootfs";
2309 my $volid_list = get_vm_volumes($conf);
2310
2311 foreach_mountpoint_reverse($conf, sub {
2312 my ($ms, $mountpoint) = @_;
2313
2314 my $volid = $mountpoint->{volume};
2315 my $mount = $mountpoint->{mp};
2316
2317 return if !$volid || !$mount;
2318
d18f96b4 2319 my $mount_path = "$rootdir/$mount";
f845a93d 2320 $mount_path =~ s!/+!/!g;
9622e848 2321
228a5a1d
WL
2322 return if !PVE::ProcFSTools::is_mounted($mount_path);
2323
9622e848 2324 eval {
d18f96b4 2325 PVE::Tools::run_command(['umount', '-d', $mount_path]);
9622e848
DM
2326 };
2327 if (my $err = $@) {
2328 if ($noerr) {
2329 warn $err;
2330 } else {
2331 die $err;
2332 }
2333 }
2334 });
9622e848
DM
2335}
2336
2337sub mount_all {
7b49dfe0 2338 my ($vmid, $storage_cfg, $conf) = @_;
9622e848
DM
2339
2340 my $rootdir = "/var/lib/lxc/$vmid/rootfs";
1adc7e53 2341 File::Path::make_path($rootdir);
9622e848
DM
2342
2343 my $volid_list = get_vm_volumes($conf);
2344 PVE::Storage::activate_volumes($storage_cfg, $volid_list);
2345
2346 eval {
9622e848
DM
2347 foreach_mountpoint($conf, sub {
2348 my ($ms, $mountpoint) = @_;
2349
da629848 2350 mountpoint_mount($mountpoint, $rootdir, $storage_cfg);
9622e848
DM
2351 });
2352 };
2353 if (my $err = $@) {
e2007ac2 2354 warn "mounting container failed\n";
9622e848 2355 umount_all($vmid, $storage_cfg, $conf, 1);
e2007ac2 2356 die $err;
9622e848
DM
2357 }
2358
da629848 2359 return $rootdir;
9622e848
DM
2360}
2361
2362
b15c75fc 2363sub mountpoint_mount_path {
da629848 2364 my ($mountpoint, $storage_cfg, $snapname) = @_;
b15c75fc 2365
da629848 2366 return mountpoint_mount($mountpoint, undef, $storage_cfg, $snapname);
b15c75fc 2367}
cc6b0307 2368
2cfae16e
WB
2369my $check_mount_path = sub {
2370 my ($path) = @_;
2371 $path = File::Spec->canonpath($path);
2372 my $real = Cwd::realpath($path);
2373 if ($real ne $path) {
2374 die "mount path modified by symlink: $path != $real";
2375 }
2376};
2377
21f292ff
WB
2378sub query_loopdev {
2379 my ($path) = @_;
2380 my $found;
2381 my $parser = sub {
2382 my $line = shift;
2383 if ($line =~ m@^(/dev/loop\d+):@) {
2384 $found = $1;
2385 }
2386 };
2387 my $cmd = ['losetup', '--associated', $path];
2388 PVE::Tools::run_command($cmd, outfunc => $parser);
2389 return $found;
2390}
2391
50df544c
WB
2392# Run a function with a file attached to a loop device.
2393# The loop device is always detached afterwards (or set to autoclear).
2394# Returns the loop device.
2395sub run_with_loopdev {
2396 my ($func, $file) = @_;
54d11e5c
WB
2397 my $device = query_loopdev($file);
2398 # Try to reuse an existing device
2399 if ($device) {
2400 # We assume that whoever setup the loop device is responsible for
2401 # detaching it.
2402 &$func($device);
2403 return $device;
2404 }
2405
50df544c
WB
2406 my $parser = sub {
2407 my $line = shift;
2408 if ($line =~ m@^(/dev/loop\d+)$@) {
2409 $device = $1;
2410 }
2411 };
2412 PVE::Tools::run_command(['losetup', '--show', '-f', $file], outfunc => $parser);
2413 die "failed to setup loop device for $file\n" if !$device;
2414 eval { &$func($device); };
2415 my $err = $@;
2416 PVE::Tools::run_command(['losetup', '-d', $device]);
2417 die $err if $err;
2418 return $device;
2419}
2420
c2744c97
WB
2421sub bindmount {
2422 my ($dir, $dest, $ro, @extra_opts) = @_;
2423 PVE::Tools::run_command(['mount', '-o', 'bind', @extra_opts, $dir, $dest]);
2424 if ($ro) {
2425 eval { PVE::Tools::run_command(['mount', '-o', 'bind,remount,ro', $dest]); };
2426 if (my $err = $@) {
2427 warn "bindmount error\n";
2428 # don't leave writable bind-mounts behind...
2429 PVE::Tools::run_command(['umount', $dest]);
2430 die $err;
2431 }
2432 }
2433}
2434
b15c75fc 2435# use $rootdir = undef to just return the corresponding mount path
cc6b0307 2436sub mountpoint_mount {
da629848 2437 my ($mountpoint, $rootdir, $storage_cfg, $snapname) = @_;
cc6b0307
AD
2438
2439 my $volid = $mountpoint->{volume};
2440 my $mount = $mountpoint->{mp};
7c921c80 2441 my $type = $mountpoint->{type};
50df544c
WB
2442 my $quota = !$snapname && !$mountpoint->{ro} && $mountpoint->{quota};
2443 my $mounted_dev;
b15c75fc 2444
cc6b0307
AD
2445 return if !$volid || !$mount;
2446
b15c75fc
DM
2447 my $mount_path;
2448
2449 if (defined($rootdir)) {
2450 $rootdir =~ s!/+$!!;
2451 $mount_path = "$rootdir/$mount";
f845a93d 2452 $mount_path =~ s!/+!/!g;
2cfae16e 2453 &$check_mount_path($mount_path);
b15c75fc 2454 File::Path::mkpath($mount_path);
116ce06f 2455 }
b15c75fc
DM
2456
2457 my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);
cc6b0307 2458
b15c75fc 2459 die "unknown snapshot path for '$volid'" if !$storage && defined($snapname);
cc6b0307 2460
471dd315
WB
2461 my $optstring = '';
2462 if (defined($mountpoint->{acl})) {
2463 $optstring .= ($mountpoint->{acl} ? 'acl' : 'noacl');
2464 }
c2744c97 2465 my $readonly = $mountpoint->{ro};
471dd315
WB
2466
2467 my @extra_opts = ('-o', $optstring);
2468
b15c75fc
DM
2469 if ($storage) {
2470
2471 my $scfg = PVE::Storage::storage_config($storage_cfg, $storage);
2472 my $path = PVE::Storage::path($storage_cfg, $volid, $snapname);
2473
2474 my ($vtype, undef, undef, undef, undef, $isBase, $format) =
2475 PVE::Storage::parse_volname($storage_cfg, $volid);
2476
c87b9dd8
DM
2477 $format = 'iso' if $vtype eq 'iso'; # allow to handle iso files
2478
b15c75fc 2479 if ($format eq 'subvol') {
30de33be
DM
2480 if ($mount_path) {
2481 if ($snapname) {
e84f7f5d
DM
2482 if ($scfg->{type} eq 'zfspool') {
2483 my $path_arg = $path;
2484 $path_arg =~ s!^/+!!;
471dd315 2485 PVE::Tools::run_command(['mount', '-o', 'ro', @extra_opts, '-t', 'zfs', $path_arg, $mount_path]);
e84f7f5d 2486 } else {
30de33be
DM
2487 die "cannot mount subvol snapshots for storage type '$scfg->{type}'\n";
2488 }
e84f7f5d 2489 } else {
c2744c97 2490 bindmount($path, $mount_path, $readonly, @extra_opts);
50df544c 2491 warn "cannot enable quota control for bind mounted subvolumes\n" if $quota;
30de33be 2492 }
b15c75fc 2493 }
50df544c 2494 return wantarray ? ($path, 0, $mounted_dev) : $path;
c87b9dd8 2495 } elsif ($format eq 'raw' || $format eq 'iso') {
50df544c
WB
2496 my $domount = sub {
2497 my ($path) = @_;
2498 if ($mount_path) {
2499 if ($format eq 'iso') {
2500 PVE::Tools::run_command(['mount', '-o', 'ro', @extra_opts, $path, $mount_path]);
2501 } elsif ($isBase || defined($snapname)) {
2502 PVE::Tools::run_command(['mount', '-o', 'ro,noload', @extra_opts, $path, $mount_path]);
2503 } else {
2504 if ($quota) {
2505 push @extra_opts, '-o', 'usrjquota=aquota.user,grpjquota=aquota.group,jqfmt=vfsv0';
2506 }
c2744c97 2507 push @extra_opts, '-o', 'ro' if $readonly;
50df544c
WB
2508 PVE::Tools::run_command(['mount', @extra_opts, $path, $mount_path]);
2509 }
2510 }
2511 };
30de33be 2512 my $use_loopdev = 0;
b15c75fc 2513 if ($scfg->{path}) {
50df544c 2514 $mounted_dev = run_with_loopdev($domount, $path);
30de33be 2515 $use_loopdev = 1;
2e879877
DM
2516 } elsif ($scfg->{type} eq 'drbd' || $scfg->{type} eq 'lvm' ||
2517 $scfg->{type} eq 'rbd' || $scfg->{type} eq 'lvmthin') {
50df544c
WB
2518 $mounted_dev = $path;
2519 &$domount($path);
b15c75fc
DM
2520 } else {
2521 die "unsupported storage type '$scfg->{type}'\n";
2522 }
50df544c 2523 return wantarray ? ($path, $use_loopdev, $mounted_dev) : $path;
b15c75fc
DM
2524 } else {
2525 die "unsupported image format '$format'\n";
2526 }
7c921c80 2527 } elsif ($type eq 'device') {
c2744c97 2528 push @extra_opts, '-o', 'ro' if $readonly;
471dd315 2529 PVE::Tools::run_command(['mount', @extra_opts, $volid, $mount_path]) if $mount_path;
50df544c 2530 return wantarray ? ($volid, 0, $volid) : $volid;
e2007ac2
DM
2531 } elsif ($type eq 'bind') {
2532 die "directory '$volid' does not exist\n" if ! -d $volid;
2cfae16e 2533 &$check_mount_path($volid);
c2744c97 2534 bindmount($volid, $mount_path, $readonly, @extra_opts) if $mount_path;
50df544c
WB
2535 warn "cannot enable quota control for bind mounts\n" if $quota;
2536 return wantarray ? ($volid, 0, undef) : $volid;
b15c75fc
DM
2537 }
2538
2539 die "unsupported storage";
cc6b0307
AD
2540}
2541
9205e9d0
AD
2542sub get_vm_volumes {
2543 my ($conf, $excludes) = @_;
2544
2545 my $vollist = [];
2546
706c9791 2547 foreach_mountpoint($conf, sub {
9205e9d0
AD
2548 my ($ms, $mountpoint) = @_;
2549
2550 return if $excludes && $ms eq $excludes;
2551
2552 my $volid = $mountpoint->{volume};
2553
7c921c80 2554 return if !$volid || $mountpoint->{type} ne 'volume';
9205e9d0
AD
2555
2556 my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
2557 return if !$sid;
2558
2559 push @$vollist, $volid;
2560 });
2561
2562 return $vollist;
2563}
2564
6c871c36 2565sub mkfs {
d216e891 2566 my ($dev, $rootuid, $rootgid) = @_;
6c871c36 2567
d216e891
WB
2568 PVE::Tools::run_command(['mkfs.ext4', '-O', 'mmp',
2569 '-E', "root_owner=$rootuid:$rootgid",
2570 $dev]);
6c871c36
DM
2571}
2572
2573sub format_disk {
d216e891 2574 my ($storage_cfg, $volid, $rootuid, $rootgid) = @_;
6c871c36
DM
2575
2576 if ($volid =~ m!^/dev/.+!) {
2577 mkfs($volid);
2578 return;
2579 }
2580
2581 my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);
2582
2583 die "cannot format volume '$volid' with no storage\n" if !$storage;
2584
08ca136d
DM
2585 PVE::Storage::activate_volumes($storage_cfg, [$volid]);
2586
6c871c36
DM
2587 my $path = PVE::Storage::path($storage_cfg, $volid);
2588
2589 my ($vtype, undef, undef, undef, undef, $isBase, $format) =
2590 PVE::Storage::parse_volname($storage_cfg, $volid);
2591
2592 die "cannot format volume '$volid' (format == $format)\n"
2593 if $format ne 'raw';
2594
d216e891 2595 mkfs($path, $rootuid, $rootgid);
6c871c36
DM
2596}
2597
2598sub destroy_disks {
2599 my ($storecfg, $vollist) = @_;
2600
2601 foreach my $volid (@$vollist) {
2602 eval { PVE::Storage::vdisk_free($storecfg, $volid); };
2603 warn $@ if $@;
2604 }
2605}
2606
2607sub create_disks {
2608 my ($storecfg, $vmid, $settings, $conf) = @_;
2609
2610 my $vollist = [];
2611
2612 eval {
d216e891
WB
2613 my (undef, $rootuid, $rootgid) = PVE::LXC::parse_id_maps($conf);
2614 my $chown_vollist = [];
2615
6c871c36
DM
2616 foreach_mountpoint($settings, sub {
2617 my ($ms, $mountpoint) = @_;
2618
2619 my $volid = $mountpoint->{volume};
2620 my $mp = $mountpoint->{mp};
2621
2622 my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);
2623
e2007ac2 2624 if ($storage && ($volid =~ m/^([^:\s]+):(\d+(\.\d+)?)$/)) {
8ed5ff9d 2625 my ($storeid, $size_gb) = ($1, $2);
6c871c36 2626
8ed5ff9d 2627 my $size_kb = int(${size_gb}*1024) * 1024;
6c871c36
DM
2628
2629 my $scfg = PVE::Storage::storage_config($storecfg, $storage);
2630 # fixme: use better naming ct-$vmid-disk-X.raw?
2631
2632 if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs') {
8ed5ff9d 2633 if ($size_kb > 0) {
6c871c36 2634 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'raw',
8ed5ff9d 2635 undef, $size_kb);
d216e891 2636 format_disk($storecfg, $volid, $rootuid, $rootgid);
6c871c36
DM
2637 } else {
2638 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'subvol',
2639 undef, 0);
d216e891 2640 push @$chown_vollist, $volid;
6c871c36
DM
2641 }
2642 } elsif ($scfg->{type} eq 'zfspool') {
2643
2644 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'subvol',
8ed5ff9d 2645 undef, $size_kb);
d216e891 2646 push @$chown_vollist, $volid;
2e879877 2647 } elsif ($scfg->{type} eq 'drbd' || $scfg->{type} eq 'lvm' || $scfg->{type} eq 'lvmthin') {
6c871c36 2648
8ed5ff9d 2649 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'raw', undef, $size_kb);
d216e891 2650 format_disk($storecfg, $volid, $rootuid, $rootgid);
6c871c36
DM
2651
2652 } elsif ($scfg->{type} eq 'rbd') {
2653
2654 die "krbd option must be enabled on storage type '$scfg->{type}'\n" if !$scfg->{krbd};
8ed5ff9d 2655 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'raw', undef, $size_kb);
d216e891 2656 format_disk($storecfg, $volid, $rootuid, $rootgid);
6c871c36
DM
2657 } else {
2658 die "unable to create containers on storage type '$scfg->{type}'\n";
2659 }
2660 push @$vollist, $volid;
71c780b9
WB
2661 $mountpoint->{volume} = $volid;
2662 $mountpoint->{size} = $size_kb * 1024;
2663 $conf->{$ms} = print_ct_mountpoint($mountpoint, $ms eq 'rootfs');
6c871c36 2664 } else {
e2007ac2
DM
2665 # use specified/existing volid/dir/device
2666 $conf->{$ms} = print_ct_mountpoint($mountpoint, $ms eq 'rootfs');
6c871c36
DM
2667 }
2668 });
d216e891
WB
2669
2670 PVE::Storage::activate_volumes($storecfg, $chown_vollist, undef);
2671 foreach my $volid (@$chown_vollist) {
2672 my $path = PVE::Storage::path($storecfg, $volid, undef);
2673 chown($rootuid, $rootgid, $path);
2674 }
2675 PVE::Storage::deactivate_volumes($storecfg, $chown_vollist, undef);
6c871c36
DM
2676 };
2677 # free allocated images on error
2678 if (my $err = $@) {
2679 destroy_disks($storecfg, $vollist);
2680 die $err;
2681 }
2682 return $vollist;
2683}
2684
68e8f3c5
DM
2685# bash completion helper
2686
2687sub complete_os_templates {
2688 my ($cmdname, $pname, $cvalue) = @_;
2689
2690 my $cfg = PVE::Storage::config();
2691
9e9bc3a6 2692 my $storeid;
68e8f3c5
DM
2693
2694 if ($cvalue =~ m/^([^:]+):/) {
2695 $storeid = $1;
2696 }
2697
2698 my $vtype = $cmdname eq 'restore' ? 'backup' : 'vztmpl';
2699 my $data = PVE::Storage::template_list($cfg, $storeid, $vtype);
2700
2701 my $res = [];
2702 foreach my $id (keys %$data) {
2703 foreach my $item (@{$data->{$id}}) {
2704 push @$res, $item->{volid} if defined($item->{volid});
2705 }
2706 }
2707
2708 return $res;
2709}
2710
68e8f3c5
DM
2711my $complete_ctid_full = sub {
2712 my ($running) = @_;
2713
2714 my $idlist = vmstatus();
2715
2716 my $active_hash = list_active_containers();
2717
2718 my $res = [];
2719
2720 foreach my $id (keys %$idlist) {
2721 my $d = $idlist->{$id};
2722 if (defined($running)) {
2723 next if $d->{template};
2724 next if $running && !$active_hash->{$id};
2725 next if !$running && $active_hash->{$id};
2726 }
2727 push @$res, $id;
2728
2729 }
2730 return $res;
2731};
2732
2733sub complete_ctid {
2734 return &$complete_ctid_full();
2735}
2736
2737sub complete_ctid_stopped {
2738 return &$complete_ctid_full(0);
2739}
2740
2741sub complete_ctid_running {
2742 return &$complete_ctid_full(1);
2743}
2744
c6a605f9
WB
2745sub parse_id_maps {
2746 my ($conf) = @_;
2747
2748 my $id_map = [];
2749 my $rootuid = 0;
2750 my $rootgid = 0;
2751
2752 my $lxc = $conf->{lxc};
2753 foreach my $entry (@$lxc) {
2754 my ($key, $value) = @$entry;
2755 next if $key ne 'lxc.id_map';
2756 if ($value =~ /^([ug])\s+(\d+)\s+(\d+)\s+(\d+)\s*$/) {
2757 my ($type, $ct, $host, $length) = ($1, $2, $3, $4);
2758 push @$id_map, [$type, $ct, $host, $length];
2759 if ($ct == 0) {
2760 $rootuid = $host if $type eq 'u';
2761 $rootgid = $host if $type eq 'g';
2762 }
2763 } else {
2764 die "failed to parse id_map: $value\n";
2765 }
2766 }
2767
2768 if (!@$id_map && $conf->{unprivileged}) {
2769 # Should we read them from /etc/subuid?
2770 $id_map = [ ['u', '0', '100000', '65536'],
2771 ['g', '0', '100000', '65536'] ];
2772 $rootuid = $rootgid = 100000;
2773 }
2774
2775 return ($id_map, $rootuid, $rootgid);
2776}
2777
01dce99b
WB
2778sub userns_command {
2779 my ($id_map) = @_;
2780 if (@$id_map) {
2781 return ['lxc-usernsexec', (map { ('-m', join(':', @$_)) } @$id_map), '--'];
2782 }
2783 return [];
2784}
2785
846a66b0
WB
2786sub set_lock {
2787 my ($vmid, $lock) = @_;
2788 my $conf;
2789 lock_config($vmid, sub {
2790 $conf = load_config($vmid);
2791 check_lock($conf);
2792 $conf->{lock} = $lock;
2793 write_config($vmid, $conf);
2794 });
2795 return $conf;
2796}
2797
2798sub remove_lock {
2799 my ($vmid, $lock) = @_;
2800 lock_config($vmid, sub {
2801 my $conf = load_config($vmid);
2802 if (!$conf->{lock}) {
2803 die "no lock found trying to remove lock '$lock'\n";
2804 } elsif (defined($lock) && $conf->{lock} ne $lock) {
2805 die "found lock '$conf->{lock}' trying to remove lock '$lock'\n";
2806 }
2807 delete $conf->{lock};
2808 write_config($vmid, $conf);
2809 });
2810}
2811
f76a2828 28121;