]> git.proxmox.com Git - pve-container.git/blame - src/PVE/LXC.pm
Implement pct push/pull
[pve-container.git] / src / PVE / LXC.pm
CommitLineData
f76a2828
DM
1package PVE::LXC;
2
3use strict;
4use warnings;
d14a9a1b 5use POSIX qw(EINTR);
f76a2828 6
34fdb3d7
WB
7use Socket;
8
f76a2828 9use File::Path;
2cfae16e
WB
10use File::Spec;
11use Cwd qw();
3cc56749 12use Fcntl qw(O_RDONLY);
f76a2828
DM
13
14use PVE::Cluster qw(cfs_register_file cfs_read_file);
f1ba1a4b 15use PVE::Exception qw(raise_perm_exc);
c65e0a6d 16use PVE::Storage;
f76a2828
DM
17use PVE::SafeSyslog;
18use PVE::INotify;
a3249355 19use PVE::JSONSchema qw(get_standard_option);
1bfe8728 20use PVE::Tools qw($IPV6RE $IPV4RE dir_glob_foreach lock_file lock_file_full);
68fba17b 21use PVE::Network;
52389a07 22use PVE::AccessControl;
228a5a1d 23use PVE::ProcFSTools;
688afc63 24use Time::HiRes qw (gettimeofday);
f76a2828
DM
25
26use Data::Dumper;
27
27916659
DM
28my $nodename = PVE::INotify::nodename();
29
688afc63
WL
30my $cpuinfo= PVE::ProcFSTools::read_cpuinfo();
31
f9897acd 32our $COMMON_TAR_FLAGS = [ '--sparse', '--numeric-owner', '--acls',
fc4e132e
WB
33 '--xattrs',
34 '--xattrs-include=user.*',
4132377b
WB
35 '--xattrs-include=security.capability',
36 '--warning=no-xattr-write' ];
fc4e132e 37
27916659 38cfs_register_file('/lxc/', \&parse_pct_config, \&write_pct_config);
f76a2828 39
769fbfab
WB
40my $rootfs_desc = {
41 volume => {
42 type => 'string',
43 default_key => 1,
da990295 44 format => 'pve-lxc-mp-string',
769fbfab
WB
45 format_description => 'volume',
46 description => 'Volume, device or directory to mount into the container.',
47 },
48 backup => {
49 type => 'boolean',
50 format_description => '[1|0]',
51 description => 'Whether to include the mountpoint in backups.',
52 optional => 1,
53 },
54 size => {
72d583ff
WB
55 type => 'string',
56 format => 'disk-size',
769fbfab 57 format_description => 'DiskSize',
769fbfab
WB
58 description => 'Volume size (read only value).',
59 optional => 1,
60 },
471dd315
WB
61 acl => {
62 type => 'boolean',
63 format_description => 'acl',
64 description => 'Explicitly enable or disable ACL support.',
65 optional => 1,
66 },
67 ro => {
68 type => 'boolean',
69 format_description => 'ro',
70 description => 'Read-only mountpoint (not supported with bind mounts)',
71 optional => 1,
72 },
50df544c
WB
73 quota => {
74 type => 'boolean',
75 format_description => '[0|1]',
76 description => 'Enable user quotas inside the container (not supported with zfs subvolumes)',
77 optional => 1,
78 },
769fbfab 79};
822de0c3 80
27916659 81PVE::JSONSchema::register_standard_option('pve-ct-rootfs', {
769fbfab 82 type => 'string', format => $rootfs_desc,
8fbd2935 83 description => "Use volume as container root.",
27916659
DM
84 optional => 1,
85});
86
52389a07
DM
87PVE::JSONSchema::register_standard_option('pve-lxc-snapshot-name', {
88 description => "The name of the snapshot.",
89 type => 'string', format => 'pve-configid',
90 maxLength => 40,
91});
92
27916659 93my $confdesc = {
09d3ec42
DM
94 lock => {
95 optional => 1,
96 type => 'string',
97 description => "Lock/unlock the VM.",
98 enum => [qw(migrate backup snapshot rollback)],
99 },
27916659
DM
100 onboot => {
101 optional => 1,
102 type => 'boolean',
103 description => "Specifies whether a VM will be started during system bootup.",
104 default => 0,
117636e5 105 },
27916659 106 startup => get_standard_option('pve-startup-order'),
bb1ac2de
DM
107 template => {
108 optional => 1,
109 type => 'boolean',
110 description => "Enable/disable Template.",
111 default => 0,
112 },
27916659
DM
113 arch => {
114 optional => 1,
115 type => 'string',
116 enum => ['amd64', 'i386'],
117 description => "OS architecture type.",
118 default => 'amd64',
117636e5 119 },
27916659
DM
120 ostype => {
121 optional => 1,
122 type => 'string',
238b7e3e
DM
123 enum => ['debian', 'ubuntu', 'centos', 'fedora', 'opensuse', 'archlinux', 'alpine', 'unmanaged'],
124 description => "OS type. This is used to setup configuration inside the container, and corresponds to lxc setup scripts in /usr/share/lxc/config/<ostype>.common.conf. Value 'unmanaged' can be used to skip and OS specific setup.",
a3249355 125 },
4f958489
DM
126 console => {
127 optional => 1,
128 type => 'boolean',
129 description => "Attach a console device (/dev/console) to the container.",
130 default => 1,
131 },
27916659
DM
132 tty => {
133 optional => 1,
134 type => 'integer',
135 description => "Specify the number of tty available to the container",
136 minimum => 0,
137 maximum => 6,
0d0ca400 138 default => 2,
611fe3aa 139 },
27916659
DM
140 cpulimit => {
141 optional => 1,
142 type => 'number',
c31ad455 143 description => "Limit of CPU usage. Note if the computer has 2 CPUs, it has a total of '2' CPU time. Value '0' indicates no CPU limit.",
27916659
DM
144 minimum => 0,
145 maximum => 128,
146 default => 0,
147 },
148 cpuunits => {
149 optional => 1,
150 type => 'integer',
c31ad455 151 description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to the weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
27916659
DM
152 minimum => 0,
153 maximum => 500000,
81bee809 154 default => 1024,
27916659
DM
155 },
156 memory => {
157 optional => 1,
158 type => 'integer',
159 description => "Amount of RAM for the VM in MB.",
160 minimum => 16,
161 default => 512,
162 },
163 swap => {
164 optional => 1,
165 type => 'integer',
166 description => "Amount of SWAP for the VM in MB.",
167 minimum => 0,
168 default => 512,
169 },
170 hostname => {
171 optional => 1,
172 description => "Set a host name for the container.",
159aad3e 173 type => 'string', format => 'dns-name',
27916659
DM
174 maxLength => 255,
175 },
176 description => {
177 optional => 1,
178 type => 'string',
179 description => "Container description. Only used on the configuration web interface.",
180 },
181 searchdomain => {
182 optional => 1,
159aad3e 183 type => 'string', format => 'dns-name-list',
c31ad455 184 description => "Sets DNS search domains for a container. Create will automatically use the setting from the host if you neither set searchdomain nor nameserver.",
27916659
DM
185 },
186 nameserver => {
187 optional => 1,
159aad3e 188 type => 'string', format => 'address-list',
c31ad455 189 description => "Sets DNS server IP address for a container. Create will automatically use the setting from the host if you neither set searchdomain nor nameserver.",
27916659
DM
190 },
191 rootfs => get_standard_option('pve-ct-rootfs'),
09d3ec42
DM
192 parent => {
193 optional => 1,
194 type => 'string', format => 'pve-configid',
195 maxLength => 40,
196 description => "Parent snapshot name. This is used internally, and should not be modified.",
197 },
198 snaptime => {
199 optional => 1,
200 description => "Timestamp for snapshots.",
201 type => 'integer',
202 minimum => 0,
203 },
aca816ad
DM
204 cmode => {
205 optional => 1,
206 description => "Console mode. By default, the console command tries to open a connection to one of the available tty devices. By setting cmode to 'console' it tries to attach to /dev/console instead. If you set cmode to 'shell', it simply invokes a shell inside the container (no login).",
207 type => 'string',
208 enum => ['shell', 'console', 'tty'],
209 default => 'tty',
210 },
7e806596
AG
211 protection => {
212 optional => 1,
213 type => 'boolean',
c31ad455 214 description => "Sets the protection flag of the container. This will prevent the CT or CT's disk remove/update operation.",
7e806596
AG
215 default => 0,
216 },
425b62cb
WB
217 unprivileged => {
218 optional => 1,
219 type => 'boolean',
220 description => "Makes the container run as unprivileged user. (Should not be modified manually.)",
221 default => 0,
222 },
f76a2828
DM
223};
224
e576f689
DM
225my $valid_lxc_conf_keys = {
226 'lxc.include' => 1,
227 'lxc.arch' => 1,
228 'lxc.utsname' => 1,
229 'lxc.haltsignal' => 1,
230 'lxc.rebootsignal' => 1,
231 'lxc.stopsignal' => 1,
232 'lxc.init_cmd' => 1,
233 'lxc.network.type' => 1,
234 'lxc.network.flags' => 1,
235 'lxc.network.link' => 1,
236 'lxc.network.mtu' => 1,
237 'lxc.network.name' => 1,
238 'lxc.network.hwaddr' => 1,
239 'lxc.network.ipv4' => 1,
240 'lxc.network.ipv4.gateway' => 1,
241 'lxc.network.ipv6' => 1,
242 'lxc.network.ipv6.gateway' => 1,
243 'lxc.network.script.up' => 1,
244 'lxc.network.script.down' => 1,
245 'lxc.pts' => 1,
246 'lxc.console.logfile' => 1,
247 'lxc.console' => 1,
248 'lxc.tty' => 1,
249 'lxc.devttydir' => 1,
250 'lxc.hook.autodev' => 1,
251 'lxc.autodev' => 1,
252 'lxc.kmsg' => 1,
253 'lxc.mount' => 1,
254 'lxc.mount.entry' => 1,
255 'lxc.mount.auto' => 1,
312e9850 256 'lxc.rootfs' => 'lxc.rootfs is auto generated from rootfs',
e576f689 257 'lxc.rootfs.mount' => 1,
312e9850
WB
258 'lxc.rootfs.options' => 'lxc.rootfs.options is not supported' .
259 ', please use mountpoint options in the "rootfs" key',
e576f689
DM
260 # lxc.cgroup.*
261 'lxc.cap.drop' => 1,
262 'lxc.cap.keep' => 1,
263 'lxc.aa_profile' => 1,
264 'lxc.aa_allow_incomplete' => 1,
265 'lxc.se_context' => 1,
266 'lxc.seccomp' => 1,
267 'lxc.id_map' => 1,
268 'lxc.hook.pre-start' => 1,
269 'lxc.hook.pre-mount' => 1,
270 'lxc.hook.mount' => 1,
271 'lxc.hook.start' => 1,
53775872 272 'lxc.hook.stop' => 1,
e576f689
DM
273 'lxc.hook.post-stop' => 1,
274 'lxc.hook.clone' => 1,
275 'lxc.hook.destroy' => 1,
276 'lxc.loglevel' => 1,
277 'lxc.logfile' => 1,
278 'lxc.start.auto' => 1,
279 'lxc.start.delay' => 1,
280 'lxc.start.order' => 1,
281 'lxc.group' => 1,
282 'lxc.environment' => 1,
e576f689
DM
283};
284
769fbfab
WB
285my $netconf_desc = {
286 type => {
287 type => 'string',
288 optional => 1,
289 description => "Network interface type.",
290 enum => [qw(veth)],
291 },
292 name => {
293 type => 'string',
294 format_description => 'String',
295 description => 'Name of the network device as seen from inside the container. (lxc.network.name)',
296 pattern => '[-_.\w\d]+',
297 },
298 bridge => {
299 type => 'string',
300 format_description => 'vmbr<Number>',
301 description => 'Bridge to attach the network device to.',
302 pattern => '[-_.\w\d]+',
a7c080a7 303 optional => 1,
769fbfab
WB
304 },
305 hwaddr => {
306 type => 'string',
307 format_description => 'MAC',
308 description => 'Bridge to attach the network device to. (lxc.network.hwaddr)',
309 pattern => qr/(?:[a-f0-9]{2}:){5}[a-f0-9]{2}/i,
310 optional => 1,
311 },
312 mtu => {
313 type => 'integer',
314 format_description => 'Number',
315 description => 'Maximum transfer unit of the interface. (lxc.network.mtu)',
07521af1 316 minimum => 64, # minimum ethernet frame is 64 bytes
769fbfab
WB
317 optional => 1,
318 },
319 ip => {
320 type => 'string',
321 format => 'pve-ipv4-config',
322 format_description => 'IPv4Format/CIDR',
323 description => 'IPv4 address in CIDR format.',
324 optional => 1,
325 },
326 gw => {
327 type => 'string',
328 format => 'ipv4',
329 format_description => 'GatewayIPv4',
330 description => 'Default gateway for IPv4 traffic.',
331 optional => 1,
332 },
333 ip6 => {
334 type => 'string',
335 format => 'pve-ipv6-config',
336 format_description => 'IPv6Format/CIDR',
337 description => 'IPv6 address in CIDR format.',
338 optional => 1,
339 },
340 gw6 => {
341 type => 'string',
342 format => 'ipv6',
343 format_description => 'GatewayIPv6',
344 description => 'Default gateway for IPv6 traffic.',
345 optional => 1,
346 },
347 firewall => {
348 type => 'boolean',
349 format_description => '[1|0]',
350 description => "Controls whether this interface's firewall rules should be used.",
351 optional => 1,
352 },
353 tag => {
354 type => 'integer',
355 format_description => 'VlanNo',
356 minimum => '2',
357 maximum => '4094',
23eb2244
WB
358 description => "VLAN tag for this interface.",
359 optional => 1,
360 },
361 trunks => {
362 type => 'string',
363 pattern => qr/\d+(?:;\d+)*/,
364 format_description => 'vlanid[;vlanid...]',
365 description => "VLAN ids to pass through the interface",
769fbfab
WB
366 optional => 1,
367 },
368};
369PVE::JSONSchema::register_format('pve-lxc-network', $netconf_desc);
370
27916659
DM
371my $MAX_LXC_NETWORKS = 10;
372for (my $i = 0; $i < $MAX_LXC_NETWORKS; $i++) {
373 $confdesc->{"net$i"} = {
374 optional => 1,
1a0a239c 375 type => 'string', format => $netconf_desc,
769fbfab 376 description => "Specifies network interfaces for the container.",
27916659 377 };
90bc31f7
DM
378}
379
da990295
DC
380PVE::JSONSchema::register_format('pve-lxc-mp-string', \&verify_lxc_mp_string);
381sub verify_lxc_mp_string{
382 my ($mp, $noerr) = @_;
383
384 # do not allow:
385 # /./ or /../
386 # /. or /.. at the end
387 # ../ at the beginning
388
389 if($mp =~ m@/\.\.?/@ ||
390 $mp =~ m@/\.\.?$@ ||
391 $mp =~ m@^\.\./@){
392 return undef if $noerr;
393 die "$mp contains illegal character sequences\n";
394 }
395 return $mp;
396}
397
769fbfab
WB
398my $mp_desc = {
399 %$rootfs_desc,
400 mp => {
401 type => 'string',
da990295 402 format => 'pve-lxc-mp-string',
769fbfab
WB
403 format_description => 'Path',
404 description => 'Path to the mountpoint as seen from inside the container.',
769fbfab
WB
405 },
406};
407PVE::JSONSchema::register_format('pve-ct-mountpoint', $mp_desc);
408
69202f71
WB
409my $unuseddesc = {
410 optional => 1,
411 type => 'string', format => 'pve-volume-id',
412 description => "Reference to unused volumes.",
413};
414
02c9d10c
AD
415my $MAX_MOUNT_POINTS = 10;
416for (my $i = 0; $i < $MAX_MOUNT_POINTS; $i++) {
417 $confdesc->{"mp$i"} = {
418 optional => 1,
769fbfab 419 type => 'string', format => $mp_desc,
566d5f81 420 description => "Use volume as container mount point (experimental feature).",
02c9d10c
AD
421 optional => 1,
422 };
423}
424
69202f71
WB
425my $MAX_UNUSED_DISKS = $MAX_MOUNT_POINTS;
426for (my $i = 0; $i < $MAX_MOUNT_POINTS; $i++) {
427 $confdesc->{"unused$i"} = $unuseddesc;
428}
429
27916659
DM
430sub write_pct_config {
431 my ($filename, $conf) = @_;
f76a2828 432
27916659 433 delete $conf->{snapstate}; # just to be sure
f76a2828 434
27916659
DM
435 my $generate_raw_config = sub {
436 my ($conf) = @_;
f76a2828 437
27916659 438 my $raw = '';
cbb03fea 439
27916659
DM
440 # add description as comment to top of file
441 my $descr = $conf->{description} || '';
442 foreach my $cl (split(/\n/, $descr)) {
443 $raw .= '#' . PVE::Tools::encode_text($cl) . "\n";
a12a36e0 444 }
fff3a342 445
27916659 446 foreach my $key (sort keys %$conf) {
09d3ec42 447 next if $key eq 'digest' || $key eq 'description' || $key eq 'pending' ||
e576f689 448 $key eq 'snapshots' || $key eq 'snapname' || $key eq 'lxc';
545d10ba
DM
449 my $value = $conf->{$key};
450 die "detected invalid newline inside property '$key'\n" if $value =~ m/\n/;
451 $raw .= "$key: $value\n";
a12a36e0 452 }
e576f689
DM
453
454 if (my $lxcconf = $conf->{lxc}) {
455 foreach my $entry (@$lxcconf) {
456 my ($k, $v) = @$entry;
457 $raw .= "$k: $v\n";
458 }
459 }
460
27916659 461 return $raw;
a12a36e0 462 };
160f0941 463
27916659 464 my $raw = &$generate_raw_config($conf);
a12a36e0 465
27916659
DM
466 foreach my $snapname (sort keys %{$conf->{snapshots}}) {
467 $raw .= "\n[$snapname]\n";
468 $raw .= &$generate_raw_config($conf->{snapshots}->{$snapname});
f76a2828
DM
469 }
470
f76a2828
DM
471 return $raw;
472}
473
27916659
DM
474sub check_type {
475 my ($key, $value) = @_;
822de0c3 476
27916659 477 die "unknown setting '$key'\n" if !$confdesc->{$key};
822de0c3 478
27916659
DM
479 my $type = $confdesc->{$key}->{type};
480
481 if (!defined($value)) {
482 die "got undefined value\n";
483 }
484
485 if ($value =~ m/[\n\r]/) {
486 die "property contains a line feed\n";
487 }
822de0c3 488
27916659
DM
489 if ($type eq 'boolean') {
490 return 1 if ($value eq '1') || ($value =~ m/^(on|yes|true)$/i);
491 return 0 if ($value eq '0') || ($value =~ m/^(off|no|false)$/i);
492 die "type check ('boolean') failed - got '$value'\n";
493 } elsif ($type eq 'integer') {
494 return int($1) if $value =~ m/^(\d+)$/;
495 die "type check ('integer') failed - got '$value'\n";
496 } elsif ($type eq 'number') {
497 return $value if $value =~ m/^(\d+)(\.\d+)?$/;
498 die "type check ('number') failed - got '$value'\n";
499 } elsif ($type eq 'string') {
500 if (my $fmt = $confdesc->{$key}->{format}) {
501 PVE::JSONSchema::check_format($fmt, $value);
502 return $value;
503 }
cbb03fea 504 return $value;
822de0c3 505 } else {
27916659 506 die "internal error"
822de0c3 507 }
822de0c3
DM
508}
509
27916659 510sub parse_pct_config {
f76a2828
DM
511 my ($filename, $raw) = @_;
512
513 return undef if !defined($raw);
514
27916659 515 my $res = {
f76a2828 516 digest => Digest::SHA::sha1_hex($raw),
27916659 517 snapshots => {},
f76a2828
DM
518 };
519
27916659 520 $filename =~ m|/lxc/(\d+).conf$|
f76a2828
DM
521 || die "got strange filename '$filename'";
522
523 my $vmid = $1;
524
27916659
DM
525 my $conf = $res;
526 my $descr = '';
527 my $section = '';
528
529 my @lines = split(/\n/, $raw);
530 foreach my $line (@lines) {
531 next if $line =~ m/^\s*$/;
532
533 if ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
534 $section = $1;
535 $conf->{description} = $descr if $descr;
536 $descr = '';
537 $conf = $res->{snapshots}->{$section} = {};
538 next;
a12a36e0 539 }
a12a36e0 540
27916659
DM
541 if ($line =~ m/^\#(.*)\s*$/) {
542 $descr .= PVE::Tools::decode_text($1) . "\n";
543 next;
f76a2828 544 }
5d186e16 545
545d10ba 546 if ($line =~ m/^(lxc\.[a-z0-9_\-\.]+)(:|\s*=)\s*(.*?)\s*$/) {
e576f689
DM
547 my $key = $1;
548 my $value = $3;
a23d627d
WB
549 my $validity = $valid_lxc_conf_keys->{$key} || 0;
550 if ($validity eq 1 || $key =~ m/^lxc\.cgroup\./) {
e576f689 551 push @{$conf->{lxc}}, [$key, $value];
a23d627d 552 } elsif (my $errmsg = $validity) {
312e9850 553 warn "vm $vmid - $key: $errmsg\n";
e576f689
DM
554 } else {
555 warn "vm $vmid - unable to parse config: $line\n";
556 }
557 } elsif ($line =~ m/^(description):\s*(.*\S)\s*$/) {
27916659
DM
558 $descr .= PVE::Tools::decode_text($2);
559 } elsif ($line =~ m/snapstate:\s*(prepare|delete)\s*$/) {
560 $conf->{snapstate} = $1;
fe9a4ab3 561 } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S.*)\s*$/) {
27916659 562 my $key = $1;
5d186e16 563 my $value = $2;
27916659
DM
564 eval { $value = check_type($key, $value); };
565 warn "vm $vmid - unable to parse value of '$key' - $@" if $@;
566 $conf->{$key} = $value;
5d186e16 567 } else {
27916659 568 warn "vm $vmid - unable to parse config: $line\n";
5d186e16 569 }
7dfc49cc
DM
570 }
571
27916659 572 $conf->{description} = $descr if $descr;
5d186e16 573
27916659
DM
574 delete $res->{snapstate}; # just to be sure
575
576 return $res;
f76a2828
DM
577}
578
579sub config_list {
580 my $vmlist = PVE::Cluster::get_vmlist();
581 my $res = {};
582 return $res if !$vmlist || !$vmlist->{ids};
583 my $ids = $vmlist->{ids};
584
585 foreach my $vmid (keys %$ids) {
586 next if !$vmid; # skip CT0
587 my $d = $ids->{$vmid};
588 next if !$d->{node} || $d->{node} ne $nodename;
589 next if !$d->{type} || $d->{type} ne 'lxc';
590 $res->{$vmid}->{type} = 'lxc';
591 }
592 return $res;
593}
594
595sub cfs_config_path {
596 my ($vmid, $node) = @_;
597
598 $node = $nodename if !$node;
27916659 599 return "nodes/$node/lxc/$vmid.conf";
f76a2828
DM
600}
601
9c2d4ce9
DM
602sub config_file {
603 my ($vmid, $node) = @_;
604
605 my $cfspath = cfs_config_path($vmid, $node);
606 return "/etc/pve/$cfspath";
607}
608
f76a2828 609sub load_config {
d18499cf 610 my ($vmid, $node) = @_;
f76a2828 611
d18499cf
TL
612 $node = $nodename if !$node;
613 my $cfspath = cfs_config_path($vmid, $node);
f76a2828
DM
614
615 my $conf = PVE::Cluster::cfs_read_file($cfspath);
c31ad455 616 die "container $vmid does not exist\n" if !defined($conf);
f76a2828
DM
617
618 return $conf;
619}
620
5b4657d0
DM
621sub create_config {
622 my ($vmid, $conf) = @_;
623
624 my $dir = "/etc/pve/nodes/$nodename/lxc";
625 mkdir $dir;
626
5b4657d0
DM
627 write_config($vmid, $conf);
628}
629
630sub destroy_config {
631 my ($vmid) = @_;
632
27916659 633 unlink config_file($vmid, $nodename);
5b4657d0
DM
634}
635
f76a2828
DM
636sub write_config {
637 my ($vmid, $conf) = @_;
638
639 my $cfspath = cfs_config_path($vmid);
640
641 PVE::Cluster::cfs_write_file($cfspath, $conf);
642}
643
d14a9a1b 644# flock: we use one file handle per process, so lock file
c31ad455 645# can be called multiple times and will succeed for the same process.
d14a9a1b
DM
646
647my $lock_handles = {};
648my $lockdir = "/run/lock/lxc";
649
3cc56749 650sub config_file_lock {
d14a9a1b 651 my ($vmid) = @_;
cbb03fea 652
53396388 653 return "$lockdir/pve-config-${vmid}.lock";
d14a9a1b
DM
654}
655
3cc56749 656sub lock_config_full {
2d3f23be 657 my ($vmid, $timeout, $code, @param) = @_;
d14a9a1b 658
3cc56749 659 my $filename = config_file_lock($vmid);
d14a9a1b 660
3cc56749
FG
661 mkdir $lockdir if !-d $lockdir;
662
663 my $res = lock_file($filename, $timeout, $code, @param);
664
665 die $@ if $@;
666
667 return $res;
668}
669
670sub lock_config_mode {
671 my ($vmid, $timeout, $shared, $code, @param) = @_;
672
673 my $filename = config_file_lock($vmid);
d14a9a1b 674
f99e8278
AD
675 mkdir $lockdir if !-d $lockdir;
676
3cc56749 677 my $res = lock_file_full($filename, $timeout, $shared, $code, @param);
f76a2828 678
2d3f23be 679 die $@ if $@;
f76a2828
DM
680
681 return $res;
682}
683
3cc56749
FG
684sub lock_config {
685 my ($vmid, $code, @param) = @_;
686
687 return lock_config_full($vmid, 10, $code, @param);
688}
689
ec52ac21
DM
690sub option_exists {
691 my ($name) = @_;
692
693 return defined($confdesc->{$name});
694}
f76a2828
DM
695
696# add JSON properties for create and set function
697sub json_config_properties {
698 my $prop = shift;
699
700 foreach my $opt (keys %$confdesc) {
09d3ec42 701 next if $opt eq 'parent' || $opt eq 'snaptime';
27916659
DM
702 next if $prop->{$opt};
703 $prop->{$opt} = $confdesc->{$opt};
704 }
705
706 return $prop;
707}
708
822de0c3
DM
709# container status helpers
710
711sub list_active_containers {
cbb03fea 712
822de0c3
DM
713 my $filename = "/proc/net/unix";
714
715 # similar test is used by lcxcontainers.c: list_active_containers
716 my $res = {};
cbb03fea 717
822de0c3
DM
718 my $fh = IO::File->new ($filename, "r");
719 return $res if !$fh;
720
721 while (defined(my $line = <$fh>)) {
722 if ($line =~ m/^[a-f0-9]+:\s\S+\s\S+\s\S+\s\S+\s\S+\s\d+\s(\S+)$/) {
723 my $path = $1;
27916659 724 if ($path =~ m!^@/var/lib/lxc/(\d+)/command$!) {
822de0c3
DM
725 $res->{$1} = 1;
726 }
727 }
728 }
729
730 close($fh);
cbb03fea 731
822de0c3
DM
732 return $res;
733}
f76a2828 734
5c752bbf
DM
735# warning: this is slow
736sub check_running {
737 my ($vmid) = @_;
738
739 my $active_hash = list_active_containers();
740
741 return 1 if defined($active_hash->{$vmid});
cbb03fea 742
5c752bbf
DM
743 return undef;
744}
745
10fc3ba5 746sub get_container_disk_usage {
73e03cb7 747 my ($vmid, $pid) = @_;
10fc3ba5 748
73e03cb7 749 return PVE::Tools::df("/proc/$pid/root/", 1);
10fc3ba5
DM
750}
751
688afc63
WL
752my $last_proc_vmid_stat;
753
754my $parse_cpuacct_stat = sub {
755 my ($vmid) = @_;
756
757 my $raw = read_cgroup_value('cpuacct', $vmid, 'cpuacct.stat', 1);
758
759 my $stat = {};
760
761 if ($raw =~ m/^user (\d+)\nsystem (\d+)\n/) {
762
763 $stat->{utime} = $1;
764 $stat->{stime} = $2;
765
766 }
767
768 return $stat;
769};
770
f76a2828
DM
771sub vmstatus {
772 my ($opt_vmid) = @_;
773
774 my $list = $opt_vmid ? { $opt_vmid => { type => 'lxc' }} : config_list();
775
822de0c3 776 my $active_hash = list_active_containers();
cbb03fea 777
688afc63
WL
778 my $cpucount = $cpuinfo->{cpus} || 1;
779
780 my $cdtime = gettimeofday;
781
782 my $uptime = (PVE::ProcFSTools::read_proc_uptime(1))[0];
783
f76a2828 784 foreach my $vmid (keys %$list) {
f76a2828 785 my $d = $list->{$vmid};
10fc3ba5 786
d5588ee3
DM
787 eval { $d->{pid} = find_lxc_pid($vmid) if defined($active_hash->{$vmid}); };
788 warn $@ if $@; # ignore errors (consider them stopped)
cbb03fea 789
d5588ee3 790 $d->{status} = $d->{pid} ? 'running' : 'stopped';
f76a2828
DM
791
792 my $cfspath = cfs_config_path($vmid);
238a56cb 793 my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};
cbb03fea 794
27916659 795 $d->{name} = $conf->{'hostname'} || "CT$vmid";
238a56cb 796 $d->{name} =~ s/[\s]//g;
cbb03fea 797
9db5687d 798 $d->{cpus} = $conf->{cpulimit} || $cpucount;
44da0641 799
d5588ee3
DM
800 if ($d->{pid}) {
801 my $res = get_container_disk_usage($vmid, $d->{pid});
27916659
DM
802 $d->{disk} = $res->{used};
803 $d->{maxdisk} = $res->{total};
804 } else {
805 $d->{disk} = 0;
806 # use 4GB by default ??
807 if (my $rootfs = $conf->{rootfs}) {
44a9face 808 my $rootinfo = parse_ct_rootfs($rootfs);
27916659
DM
809 $d->{maxdisk} = int(($rootinfo->{size} || 4)*1024*1024)*1024;
810 } else {
811 $d->{maxdisk} = 4*1024*1024*1024;
10fc3ba5 812 }
238a56cb 813 }
cbb03fea 814
238a56cb
DM
815 $d->{mem} = 0;
816 $d->{swap} = 0;
95df9a12
DM
817 $d->{maxmem} = ($conf->{memory}||512)*1024*1024;
818 $d->{maxswap} = ($conf->{swap}//0)*1024*1024;
e901d418 819
238a56cb
DM
820 $d->{uptime} = 0;
821 $d->{cpu} = 0;
e901d418 822
238a56cb
DM
823 $d->{netout} = 0;
824 $d->{netin} = 0;
f76a2828 825
238a56cb
DM
826 $d->{diskread} = 0;
827 $d->{diskwrite} = 0;
bb1ac2de
DM
828
829 $d->{template} = is_template($conf);
f76a2828 830 }
cbb03fea 831
238a56cb
DM
832 foreach my $vmid (keys %$list) {
833 my $d = $list->{$vmid};
d5588ee3
DM
834 my $pid = $d->{pid};
835
836 next if !$pid; # skip stopped CTs
f76a2828 837
88a8696b
TL
838 my $ctime = (stat("/proc/$pid"))[10]; # 10 = ctime
839 $d->{uptime} = time - $ctime; # the method lxcfs uses
22a77285 840
238a56cb
DM
841 $d->{mem} = read_cgroup_value('memory', $vmid, 'memory.usage_in_bytes');
842 $d->{swap} = read_cgroup_value('memory', $vmid, 'memory.memsw.usage_in_bytes') - $d->{mem};
b5289322
AD
843
844 my $blkio_bytes = read_cgroup_value('blkio', $vmid, 'blkio.throttle.io_service_bytes', 1);
1e647c7c 845 my @bytes = split(/\n/, $blkio_bytes);
b5289322 846 foreach my $byte (@bytes) {
1e647c7c
DM
847 if (my ($key, $value) = $byte =~ /(Read|Write)\s+(\d+)/) {
848 $d->{diskread} = $2 if $key eq 'Read';
849 $d->{diskwrite} = $2 if $key eq 'Write';
850 }
b5289322 851 }
688afc63
WL
852
853 my $pstat = &$parse_cpuacct_stat($vmid);
854
855 my $used = $pstat->{utime} + $pstat->{stime};
856
857 my $old = $last_proc_vmid_stat->{$vmid};
858 if (!$old) {
859 $last_proc_vmid_stat->{$vmid} = {
860 time => $cdtime,
861 used => $used,
862 cpu => 0,
863 };
864 next;
865 }
866
867 my $dtime = ($cdtime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};
868
869 if ($dtime > 1000) {
870 my $dutime = $used - $old->{used};
871
872 $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
873 $last_proc_vmid_stat->{$vmid} = {
874 time => $cdtime,
875 used => $used,
876 cpu => $d->{cpu},
877 };
878 } else {
879 $d->{cpu} = $old->{cpu};
880 }
238a56cb 881 }
cbb03fea 882
68b8f4d1
WL
883 my $netdev = PVE::ProcFSTools::read_proc_net_dev();
884
885 foreach my $dev (keys %$netdev) {
886 next if $dev !~ m/^veth([1-9]\d*)i/;
887 my $vmid = $1;
888 my $d = $list->{$vmid};
889
890 next if !$d;
891
892 $d->{netout} += $netdev->{$dev}->{receive};
893 $d->{netin} += $netdev->{$dev}->{transmit};
894
895 }
896
f76a2828
DM
897 return $list;
898}
899
7c921c80
WB
900sub classify_mountpoint {
901 my ($vol) = @_;
902 if ($vol =~ m!^/!) {
903 return 'device' if $vol =~ m!^/dev/!;
904 return 'bind';
905 }
906 return 'volume';
907}
908
44a9face
DM
909my $parse_ct_mountpoint_full = sub {
910 my ($desc, $data, $noerr) = @_;
27916659
DM
911
912 $data //= '';
913
1b2c1e8c 914 my $res;
44a9face 915 eval { $res = PVE::JSONSchema::parse_property_string($desc, $data) };
1b2c1e8c 916 if ($@) {
ca7feb1a
WB
917 return undef if $noerr;
918 die $@;
27916659
DM
919 }
920
bf4a209a 921 if (defined(my $size = $res->{size})) {
ca7feb1a
WB
922 $size = PVE::JSONSchema::parse_size($size);
923 if (!defined($size)) {
924 return undef if $noerr;
925 die "invalid size: $size\n";
926 }
927 $res->{size} = $size;
27916659
DM
928 }
929
7c921c80
WB
930 $res->{type} = classify_mountpoint($res->{volume});
931
27916659 932 return $res;
44a9face
DM
933};
934
935sub parse_ct_rootfs {
936 my ($data, $noerr) = @_;
937
938 my $res = &$parse_ct_mountpoint_full($rootfs_desc, $data, $noerr);
939
940 $res->{mp} = '/' if defined($res);
941
942 return $res;
943}
944
945sub parse_ct_mountpoint {
946 my ($data, $noerr) = @_;
947
948 return &$parse_ct_mountpoint_full($mp_desc, $data, $noerr);
27916659 949}
7dfc49cc 950
dde7b02b 951sub print_ct_mountpoint {
4fee75fd 952 my ($info, $nomp) = @_;
7c921c80
WB
953 my $skip = [ 'type' ];
954 push @$skip, 'mp' if $nomp;
6708ba93 955 return PVE::JSONSchema::print_property_string($info, $mp_desc, $skip);
bb1ac2de
DM
956}
957
7dfc49cc 958sub print_lxc_network {
f76a2828 959 my $net = shift;
6708ba93 960 return PVE::JSONSchema::print_property_string($net, $netconf_desc);
f76a2828
DM
961}
962
7dfc49cc
DM
963sub parse_lxc_network {
964 my ($data) = @_;
965
966 my $res = {};
967
968 return $res if !$data;
969
ca7feb1a 970 $res = PVE::JSONSchema::parse_property_string($netconf_desc, $data);
7dfc49cc
DM
971
972 $res->{type} = 'veth';
93cdbbfb 973 $res->{hwaddr} = PVE::Tools::random_ether_addr() if !$res->{hwaddr};
cbb03fea 974
7dfc49cc
DM
975 return $res;
976}
f76a2828 977
238a56cb
DM
978sub read_cgroup_value {
979 my ($group, $vmid, $name, $full) = @_;
980
981 my $path = "/sys/fs/cgroup/$group/lxc/$vmid/$name";
982
983 return PVE::Tools::file_get_contents($path) if $full;
984
985 return PVE::Tools::file_read_firstline($path);
986}
987
bf0b8c43
AD
988sub write_cgroup_value {
989 my ($group, $vmid, $name, $value) = @_;
990
991 my $path = "/sys/fs/cgroup/$group/lxc/$vmid/$name";
992 PVE::ProcFSTools::write_proc_entry($path, $value) if -e $path;
993
994}
995
52f1d76b
DM
996sub find_lxc_console_pids {
997
998 my $res = {};
999
1000 PVE::Tools::dir_glob_foreach('/proc', '\d+', sub {
1001 my ($pid) = @_;
1002
1003 my $cmdline = PVE::Tools::file_read_firstline("/proc/$pid/cmdline");
1004 return if !$cmdline;
1005
1006 my @args = split(/\0/, $cmdline);
1007
c31ad455 1008 # search for lxc-console -n <vmid>
cbb03fea 1009 return if scalar(@args) != 3;
52f1d76b
DM
1010 return if $args[1] ne '-n';
1011 return if $args[2] !~ m/^\d+$/;
1012 return if $args[0] !~ m|^(/usr/bin/)?lxc-console$|;
cbb03fea 1013
52f1d76b 1014 my $vmid = $args[2];
cbb03fea 1015
52f1d76b
DM
1016 push @{$res->{$vmid}}, $pid;
1017 });
1018
1019 return $res;
1020}
1021
bedeaaf1
AD
1022sub find_lxc_pid {
1023 my ($vmid) = @_;
1024
1025 my $pid = undef;
1026 my $parser = sub {
1027 my $line = shift;
8b25977f 1028 $pid = $1 if $line =~ m/^PID:\s+(\d+)$/;
bedeaaf1 1029 };
c39aa40a 1030 PVE::Tools::run_command(['lxc-info', '-n', $vmid, '-p'], outfunc => $parser);
bedeaaf1 1031
8b25977f 1032 die "unable to get PID for CT $vmid (not running?)\n" if !$pid;
cbb03fea 1033
8b25977f 1034 return $pid;
bedeaaf1
AD
1035}
1036
cbb03fea 1037# Note: we cannot use Net:IP, because that only allows strict
55fa4e09
DM
1038# CIDR networks
1039sub parse_ipv4_cidr {
1040 my ($cidr, $noerr) = @_;
1041
f7a7b413
WB
1042 if ($cidr =~ m!^($IPV4RE)(?:/(\d+))$! && ($2 > 7) && ($2 <= 32)) {
1043 return { address => $1, netmask => $PVE::Network::ipv4_reverse_mask->[$2] };
55fa4e09 1044 }
cbb03fea 1045
55fa4e09 1046 return undef if $noerr;
cbb03fea 1047
55fa4e09
DM
1048 die "unable to parse ipv4 address/mask\n";
1049}
93285df8 1050
a12a36e0
WL
1051sub check_lock {
1052 my ($conf) = @_;
1053
27916659 1054 die "VM is locked ($conf->{'lock'})\n" if $conf->{'lock'};
a12a36e0
WL
1055}
1056
e22af68f
AG
1057sub check_protection {
1058 my ($vm_conf, $err_msg) = @_;
1059
1060 if ($vm_conf->{protection}) {
1061 die "$err_msg - protection mode enabled\n";
1062 }
1063}
1064
27916659 1065sub update_lxc_config {
c628ffa1 1066 my ($storage_cfg, $vmid, $conf) = @_;
b80dd50a 1067
bb1ac2de
DM
1068 my $dir = "/var/lib/lxc/$vmid";
1069
1070 if ($conf->{template}) {
1071
1072 unlink "$dir/config";
1073
1074 return;
1075 }
1076
27916659 1077 my $raw = '';
b80dd50a 1078
27916659
DM
1079 die "missing 'arch' - internal error" if !$conf->{arch};
1080 $raw .= "lxc.arch = $conf->{arch}\n";
b80dd50a 1081
425b62cb
WB
1082 my $unprivileged = $conf->{unprivileged};
1083 my $custom_idmap = grep { $_->[0] eq 'lxc.id_map' } @{$conf->{lxc}};
1084
27916659 1085 my $ostype = $conf->{ostype} || die "missing 'ostype' - internal error";
238b7e3e 1086 if ($ostype =~ /^(?:debian | ubuntu | centos | fedora | opensuse | archlinux | alpine | unmanaged)$/x) {
c34f7efe
WB
1087 my $inc ="/usr/share/lxc/config/$ostype.common.conf";
1088 $inc ="/usr/share/lxc/config/common.conf" if !-f $inc;
1089 $raw .= "lxc.include = $inc\n";
425b62cb 1090 if ($unprivileged || $custom_idmap) {
c34f7efe
WB
1091 $inc = "/usr/share/lxc/config/$ostype.userns.conf";
1092 $inc = "/usr/share/lxc/config/userns.conf" if !-f $inc;
1093 $raw .= "lxc.include = $inc\n"
425b62cb 1094 }
27916659 1095 } else {
9a7a910b 1096 die "implement me (ostype $ostype)";
27916659 1097 }
b80dd50a 1098
50df544c
WB
1099 # WARNING: DO NOT REMOVE this without making sure that loop device nodes
1100 # cannot be exposed to the container with r/w access (cgroup perms).
1101 # When this is enabled mounts will still remain in the monitor's namespace
1102 # after the container unmounted them and thus will not detach from their
1103 # files while the container is running!
c16b8890 1104 $raw .= "lxc.monitor.unshare = 1\n";
58cc92a9 1105
425b62cb
WB
1106 # Should we read them from /etc/subuid?
1107 if ($unprivileged && !$custom_idmap) {
1108 $raw .= "lxc.id_map = u 0 100000 65536\n";
1109 $raw .= "lxc.id_map = g 0 100000 65536\n";
1110 }
1111
6f035afe 1112 if (!has_dev_console($conf)) {
eeaea429
DM
1113 $raw .= "lxc.console = none\n";
1114 $raw .= "lxc.cgroup.devices.deny = c 5:1 rwm\n";
1115 }
4f958489 1116
0d0ca400 1117 my $ttycount = get_tty_count($conf);
27916659 1118 $raw .= "lxc.tty = $ttycount\n";
cbb03fea 1119
c31ad455 1120 # some init scripts expect a linux terminal (turnkey).
a691a5a3
DM
1121 $raw .= "lxc.environment = TERM=linux\n";
1122
27916659
DM
1123 my $utsname = $conf->{hostname} || "CT$vmid";
1124 $raw .= "lxc.utsname = $utsname\n";
cbb03fea 1125
27916659
DM
1126 my $memory = $conf->{memory} || 512;
1127 my $swap = $conf->{swap} // 0;
1128
1129 my $lxcmem = int($memory*1024*1024);
1130 $raw .= "lxc.cgroup.memory.limit_in_bytes = $lxcmem\n";
a12a36e0 1131
27916659
DM
1132 my $lxcswap = int(($memory + $swap)*1024*1024);
1133 $raw .= "lxc.cgroup.memory.memsw.limit_in_bytes = $lxcswap\n";
1134
1135 if (my $cpulimit = $conf->{cpulimit}) {
1136 $raw .= "lxc.cgroup.cpu.cfs_period_us = 100000\n";
1137 my $value = int(100000*$cpulimit);
1138 $raw .= "lxc.cgroup.cpu.cfs_quota_us = $value\n";
a12a36e0
WL
1139 }
1140
27916659
DM
1141 my $shares = $conf->{cpuunits} || 1024;
1142 $raw .= "lxc.cgroup.cpu.shares = $shares\n";
1143
44a9face 1144 my $mountpoint = parse_ct_rootfs($conf->{rootfs});
a3076d81 1145
c9a5774b 1146 $raw .= "lxc.rootfs = $dir/rootfs\n";
27916659
DM
1147
1148 my $netcount = 0;
1149 foreach my $k (keys %$conf) {
1150 next if $k !~ m/^net(\d+)$/;
1151 my $ind = $1;
a16d94c8 1152 my $d = parse_lxc_network($conf->{$k});
27916659
DM
1153 $netcount++;
1154 $raw .= "lxc.network.type = veth\n";
18862537 1155 $raw .= "lxc.network.veth.pair = veth${vmid}i${ind}\n";
27916659
DM
1156 $raw .= "lxc.network.hwaddr = $d->{hwaddr}\n" if defined($d->{hwaddr});
1157 $raw .= "lxc.network.name = $d->{name}\n" if defined($d->{name});
1158 $raw .= "lxc.network.mtu = $d->{mtu}\n" if defined($d->{mtu});
a12a36e0
WL
1159 }
1160
e576f689
DM
1161 if (my $lxcconf = $conf->{lxc}) {
1162 foreach my $entry (@$lxcconf) {
1163 my ($k, $v) = @$entry;
1164 $netcount++ if $k eq 'lxc.network.type';
1165 $raw .= "$k = $v\n";
1166 }
1167 }
27916659 1168
e576f689
DM
1169 $raw .= "lxc.network.type = empty\n" if !$netcount;
1170
27916659
DM
1171 File::Path::mkpath("$dir/rootfs");
1172
1173 PVE::Tools::file_set_contents("$dir/config", $raw);
b80dd50a
DM
1174}
1175
117636e5
DM
1176# verify and cleanup nameserver list (replace \0 with ' ')
1177sub verify_nameserver_list {
1178 my ($nameserver_list) = @_;
1179
1180 my @list = ();
1181 foreach my $server (PVE::Tools::split_list($nameserver_list)) {
1182 PVE::JSONSchema::pve_verify_ip($server);
1183 push @list, $server;
1184 }
1185
1186 return join(' ', @list);
1187}
1188
1189sub verify_searchdomain_list {
1190 my ($searchdomain_list) = @_;
1191
1192 my @list = ();
1193 foreach my $server (PVE::Tools::split_list($searchdomain_list)) {
1194 # todo: should we add checks for valid dns domains?
1195 push @list, $server;
1196 }
1197
1198 return join(' ', @list);
1199}
1200
12e95ae4 1201sub is_volume_in_use {
4defdb73 1202 my ($config, $volid, $include_snapshots) = @_;
12e95ae4
FG
1203 my $used = 0;
1204
1205 foreach_mountpoint($config, sub {
1206 my ($ms, $mountpoint) = @_;
1207 return if $used;
1208 if ($mountpoint->{type} eq 'volume' && $mountpoint->{volume} eq $volid) {
1209 $used = 1;
1210 }
1211 });
1212
4defdb73
FG
1213 my $snapshots = $config->{snapshots};
1214 if ($include_snapshots && $snapshots) {
1215 foreach my $snap (keys %$snapshots) {
1216 $used ||= is_volume_in_use($snapshots->{$snap}, $volid);
1217 }
1218 }
1219
12e95ae4
FG
1220 return $used;
1221}
1222
69202f71
WB
1223sub add_unused_volume {
1224 my ($config, $volid) = @_;
1225
1226 my $key;
1227 for (my $ind = $MAX_UNUSED_DISKS - 1; $ind >= 0; $ind--) {
1228 my $test = "unused$ind";
1229 if (my $vid = $config->{$test}) {
1230 return if $vid eq $volid; # do not add duplicates
1231 } else {
1232 $key = $test;
1233 }
1234 }
1235
c31ad455 1236 die "Too many unused volumes - please delete them first.\n" if !$key;
69202f71
WB
1237
1238 $config->{$key} = $volid;
1239
1240 return $key;
1241}
1242
27916659 1243sub update_pct_config {
93285df8
DM
1244 my ($vmid, $conf, $running, $param, $delete) = @_;
1245
bf0b8c43
AD
1246 my @nohotplug;
1247
7b49dfe0 1248 my $new_disks = 0;
69202f71 1249 my @deleted_volumes;
4fee75fd 1250
cbb03fea
DM
1251 my $rootdir;
1252 if ($running) {
bedeaaf1 1253 my $pid = find_lxc_pid($vmid);
cbb03fea 1254 $rootdir = "/proc/$pid/root";
bedeaaf1
AD
1255 }
1256
7a168607
DM
1257 my $hotplug_error = sub {
1258 if ($running) {
a6a77cfa
WB
1259 push @nohotplug, @_;
1260 return 1;
7a168607
DM
1261 } else {
1262 return 0;
a6a77cfa 1263 }
7a168607 1264 };
a6a77cfa 1265
93285df8
DM
1266 if (defined($delete)) {
1267 foreach my $opt (@$delete) {
a61a5448
WB
1268 if (!exists($conf->{$opt})) {
1269 warn "no such option: $opt\n";
1270 next;
1271 }
1272
27916659 1273 if ($opt eq 'hostname' || $opt eq 'memory' || $opt eq 'rootfs') {
93285df8
DM
1274 die "unable to delete required option '$opt'\n";
1275 } elsif ($opt eq 'swap') {
27916659 1276 delete $conf->{$opt};
bf0b8c43 1277 write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", -1);
40603eb3 1278 } elsif ($opt eq 'description' || $opt eq 'onboot' || $opt eq 'startup') {
27916659 1279 delete $conf->{$opt};
4f958489 1280 } elsif ($opt eq 'nameserver' || $opt eq 'searchdomain' ||
40603eb3 1281 $opt eq 'tty' || $opt eq 'console' || $opt eq 'cmode') {
a6a77cfa 1282 next if $hotplug_error->($opt);
27916659 1283 delete $conf->{$opt};
68fba17b 1284 } elsif ($opt =~ m/^net(\d)$/) {
93285df8 1285 delete $conf->{$opt};
68fba17b
AD
1286 next if !$running;
1287 my $netid = $1;
18862537 1288 PVE::Network::veth_delete("veth${vmid}i$netid");
7e806596
AG
1289 } elsif ($opt eq 'protection') {
1290 delete $conf->{$opt};
69202f71 1291 } elsif ($opt =~ m/^unused(\d+)$/) {
a6a77cfa 1292 next if $hotplug_error->($opt);
69202f71
WB
1293 check_protection($conf, "can't remove CT $vmid drive '$opt'");
1294 push @deleted_volumes, $conf->{$opt};
1295 delete $conf->{$opt};
4fee75fd 1296 } elsif ($opt =~ m/^mp(\d+)$/) {
a6a77cfa 1297 next if $hotplug_error->($opt);
e22af68f 1298 check_protection($conf, "can't remove CT $vmid drive '$opt'");
12e95ae4 1299 my $mp = parse_ct_mountpoint($conf->{$opt});
4fee75fd 1300 delete $conf->{$opt};
12e95ae4
FG
1301 if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
1302 add_unused_volume($conf, $mp->{volume});
1303 }
425b62cb
WB
1304 } elsif ($opt eq 'unprivileged') {
1305 die "unable to delete read-only option: '$opt'\n";
93285df8 1306 } else {
9a7a910b 1307 die "implement me (delete: $opt)"
93285df8 1308 }
706c9791 1309 write_config($vmid, $conf) if $running;
93285df8
DM
1310 }
1311 }
1312
be6383d7
WB
1313 # There's no separate swap size to configure, there's memory and "total"
1314 # memory (iow. memory+swap). This means we have to change them together.
27916659
DM
1315 my $wanted_memory = PVE::Tools::extract_param($param, 'memory');
1316 my $wanted_swap = PVE::Tools::extract_param($param, 'swap');
be6383d7 1317 if (defined($wanted_memory) || defined($wanted_swap)) {
27916659 1318
a2c57b0c
WB
1319 my $old_memory = ($conf->{memory} || 512);
1320 my $old_swap = ($conf->{swap} || 0);
1321
1322 $wanted_memory //= $old_memory;
1323 $wanted_swap //= $old_swap;
27916659
DM
1324
1325 my $total = $wanted_memory + $wanted_swap;
1326 if ($running) {
a2c57b0c
WB
1327 my $old_total = $old_memory + $old_swap;
1328 if ($total > $old_total) {
1329 write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", int($total*1024*1024));
1330 write_cgroup_value("memory", $vmid, "memory.limit_in_bytes", int($wanted_memory*1024*1024));
1331 } else {
1332 write_cgroup_value("memory", $vmid, "memory.limit_in_bytes", int($wanted_memory*1024*1024));
1333 write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", int($total*1024*1024));
1334 }
be6383d7 1335 }
27916659
DM
1336 $conf->{memory} = $wanted_memory;
1337 $conf->{swap} = $wanted_swap;
1338
706c9791 1339 write_config($vmid, $conf) if $running;
be6383d7
WB
1340 }
1341
dfab6edb
WB
1342 my $used_volids = {};
1343
93285df8
DM
1344 foreach my $opt (keys %$param) {
1345 my $value = $param->{$opt};
1346 if ($opt eq 'hostname') {
27916659 1347 $conf->{$opt} = $value;
a99b3509 1348 } elsif ($opt eq 'onboot') {
27916659 1349 $conf->{$opt} = $value ? 1 : 0;
a3249355 1350 } elsif ($opt eq 'startup') {
27916659 1351 $conf->{$opt} = $value;
40603eb3 1352 } elsif ($opt eq 'tty' || $opt eq 'console' || $opt eq 'cmode') {
a6a77cfa 1353 next if $hotplug_error->($opt);
e576f689 1354 $conf->{$opt} = $value;
ffa1d001 1355 } elsif ($opt eq 'nameserver') {
a6a77cfa 1356 next if $hotplug_error->($opt);
117636e5 1357 my $list = verify_nameserver_list($value);
27916659 1358 $conf->{$opt} = $list;
ffa1d001 1359 } elsif ($opt eq 'searchdomain') {
a6a77cfa 1360 next if $hotplug_error->($opt);
117636e5 1361 my $list = verify_searchdomain_list($value);
27916659 1362 $conf->{$opt} = $list;
45573f7c 1363 } elsif ($opt eq 'cpulimit') {
a6a77cfa 1364 next if $hotplug_error->($opt); # FIXME: hotplug
27916659 1365 $conf->{$opt} = $value;
b80dd50a 1366 } elsif ($opt eq 'cpuunits') {
27916659 1367 $conf->{$opt} = $value;
bf0b8c43 1368 write_cgroup_value("cpu", $vmid, "cpu.shares", $value);
93285df8 1369 } elsif ($opt eq 'description') {
27916659 1370 $conf->{$opt} = PVE::Tools::encode_text($value);
93285df8
DM
1371 } elsif ($opt =~ m/^net(\d+)$/) {
1372 my $netid = $1;
a16d94c8 1373 my $net = parse_lxc_network($value);
27916659
DM
1374 if (!$running) {
1375 $conf->{$opt} = print_lxc_network($net);
cbb03fea 1376 } else {
bedeaaf1
AD
1377 update_net($vmid, $conf, $opt, $net, $netid, $rootdir);
1378 }
7e806596
AG
1379 } elsif ($opt eq 'protection') {
1380 $conf->{$opt} = $value ? 1 : 0;
4fee75fd 1381 } elsif ($opt =~ m/^mp(\d+)$/) {
a6a77cfa 1382 next if $hotplug_error->($opt);
e22af68f 1383 check_protection($conf, "can't update CT $vmid drive '$opt'");
12e95ae4 1384 my $old = $conf->{$opt};
4fee75fd 1385 $conf->{$opt} = $value;
12e95ae4
FG
1386 if (defined($old)) {
1387 my $mp = parse_ct_mountpoint($old);
1388 if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
1389 add_unused_volume($conf, $mp->{volume});
1390 }
1391 }
7b49dfe0 1392 $new_disks = 1;
dfab6edb
WB
1393 my $mp = parse_ct_mountpoint($value);
1394 $used_volids->{$mp->{volume}} = 1;
4fee75fd 1395 } elsif ($opt eq 'rootfs') {
55ce8db8 1396 next if $hotplug_error->($opt);
e22af68f 1397 check_protection($conf, "can't update CT $vmid drive '$opt'");
12e95ae4 1398 my $old = $conf->{$opt};
55ce8db8 1399 $conf->{$opt} = $value;
12e95ae4
FG
1400 if (defined($old)) {
1401 my $mp = parse_ct_rootfs($old);
1402 if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
1403 add_unused_volume($conf, $mp->{volume});
1404 }
1405 }
dfab6edb
WB
1406 my $mp = parse_ct_rootfs($value);
1407 $used_volids->{$mp->{volume}} = 1;
425b62cb
WB
1408 } elsif ($opt eq 'unprivileged') {
1409 die "unable to modify read-only option: '$opt'\n";
238b7e3e
DM
1410 } elsif ($opt eq 'ostype') {
1411 next if $hotplug_error->($opt);
1412 $conf->{$opt} = $value;
93285df8 1413 } else {
a92f66c9 1414 die "implement me: $opt";
93285df8 1415 }
706c9791 1416 write_config($vmid, $conf) if $running;
93285df8 1417 }
bf0b8c43 1418
dfab6edb
WB
1419 # Cleanup config:
1420
1421 # Remove unused disks after re-adding
1422 foreach my $key (keys %$conf) {
1423 next if $key !~ /^unused\d+/;
1424 my $volid = $conf->{$key};
1425 if ($used_volids->{$volid}) {
1426 delete $conf->{$key};
1427 }
1428 }
1429
1430 # Apply deletions and creations of new volumes
69202f71
WB
1431 if (@deleted_volumes) {
1432 my $storage_cfg = PVE::Storage::config();
1433 foreach my $volume (@deleted_volumes) {
dfab6edb 1434 next if $used_volids->{$volume}; # could have been re-added, too
4defdb73
FG
1435 # also check for references in snapshots
1436 next if is_volume_in_use($conf, $volume, 1);
69202f71
WB
1437 delete_mountpoint_volume($storage_cfg, $vmid, $volume);
1438 }
1439 }
1440
7b49dfe0 1441 if ($new_disks) {
4fee75fd 1442 my $storage_cfg = PVE::Storage::config();
6c871c36 1443 create_disks($storage_cfg, $vmid, $conf, $conf);
4fee75fd 1444 }
694c25df
WB
1445
1446 # This should be the last thing we do here
1447 if ($running && scalar(@nohotplug)) {
1448 die "unable to modify " . join(',', @nohotplug) . " while container is running\n";
1449 }
93285df8 1450}
c325b32f 1451
6f035afe
DM
1452sub has_dev_console {
1453 my ($conf) = @_;
1454
1455 return !(defined($conf->{console}) && !$conf->{console});
1456}
1457
0d0ca400
DM
1458sub get_tty_count {
1459 my ($conf) = @_;
1460
1461 return $conf->{tty} // $confdesc->{tty}->{default};
1462}
1463
aca816ad
DM
1464sub get_cmode {
1465 my ($conf) = @_;
1466
1467 return $conf->{cmode} // $confdesc->{cmode}->{default};
1468}
1469
1470sub get_console_command {
1471 my ($vmid, $conf) = @_;
1472
1473 my $cmode = get_cmode($conf);
1474
1475 if ($cmode eq 'console') {
1476 return ['lxc-console', '-n', $vmid, '-t', 0];
1477 } elsif ($cmode eq 'tty') {
1478 return ['lxc-console', '-n', $vmid];
1479 } elsif ($cmode eq 'shell') {
1480 return ['lxc-attach', '--clear-env', '-n', $vmid];
1481 } else {
1482 die "internal error";
1483 }
1484}
1485
c325b32f
DM
1486sub get_primary_ips {
1487 my ($conf) = @_;
1488
1489 # return data from net0
cbb03fea 1490
27916659 1491 return undef if !defined($conf->{net0});
a16d94c8 1492 my $net = parse_lxc_network($conf->{net0});
c325b32f
DM
1493
1494 my $ipv4 = $net->{ip};
db78a181
WB
1495 if ($ipv4) {
1496 if ($ipv4 =~ /^(dhcp|manual)$/) {
1497 $ipv4 = undef
1498 } else {
1499 $ipv4 =~ s!/\d+$!!;
1500 }
1501 }
65e5eaa3 1502 my $ipv6 = $net->{ip6};
db78a181 1503 if ($ipv6) {
5f291c7d 1504 if ($ipv6 =~ /^(auto|dhcp|manual)$/) {
db78a181
WB
1505 $ipv6 = undef;
1506 } else {
1507 $ipv6 =~ s!/\d+$!!;
1508 }
1509 }
cbb03fea 1510
c325b32f
DM
1511 return ($ipv4, $ipv6);
1512}
148d1cb4 1513
b407293b
WB
1514sub delete_mountpoint_volume {
1515 my ($storage_cfg, $vmid, $volume) = @_;
1516
7c921c80 1517 return if classify_mountpoint($volume) ne 'volume';
b407293b
WB
1518
1519 my ($vtype, $name, $owner) = PVE::Storage::parse_volname($storage_cfg, $volume);
1520 PVE::Storage::vdisk_free($storage_cfg, $volume) if $vmid == $owner;
1521}
ef241384 1522
27916659 1523sub destroy_lxc_container {
148d1cb4
DM
1524 my ($storage_cfg, $vmid, $conf) = @_;
1525
db8989e1
WB
1526 foreach_mountpoint($conf, sub {
1527 my ($ms, $mountpoint) = @_;
b407293b 1528 delete_mountpoint_volume($storage_cfg, $vmid, $mountpoint->{volume});
db8989e1
WB
1529 });
1530
27916659
DM
1531 rmdir "/var/lib/lxc/$vmid/rootfs";
1532 unlink "/var/lib/lxc/$vmid/config";
1533 rmdir "/var/lib/lxc/$vmid";
1534 destroy_config($vmid);
1535
1536 #my $cmd = ['lxc-destroy', '-n', $vmid ];
1537 #PVE::Tools::run_command($cmd);
148d1cb4 1538}
68fba17b 1539
ef241384 1540sub vm_stop_cleanup {
5fa890f0 1541 my ($storage_cfg, $vmid, $conf, $keepActive) = @_;
ef241384
DM
1542
1543 eval {
1544 if (!$keepActive) {
bf9d912c 1545
09aa32fd 1546 my $vollist = get_vm_volumes($conf);
a8b6b8a7 1547 PVE::Storage::deactivate_volumes($storage_cfg, $vollist);
ef241384
DM
1548 }
1549 };
1550 warn $@ if $@; # avoid errors - just warn
1551}
1552
93cdbbfb
AD
1553my $safe_num_ne = sub {
1554 my ($a, $b) = @_;
1555
1556 return 0 if !defined($a) && !defined($b);
1557 return 1 if !defined($a);
1558 return 1 if !defined($b);
1559
1560 return $a != $b;
1561};
1562
1563my $safe_string_ne = sub {
1564 my ($a, $b) = @_;
1565
1566 return 0 if !defined($a) && !defined($b);
1567 return 1 if !defined($a);
1568 return 1 if !defined($b);
1569
1570 return $a ne $b;
1571};
1572
1573sub update_net {
bedeaaf1 1574 my ($vmid, $conf, $opt, $newnet, $netid, $rootdir) = @_;
93cdbbfb 1575
18862537
WB
1576 if ($newnet->{type} ne 'veth') {
1577 # for when there are physical interfaces
1578 die "cannot update interface of type $newnet->{type}";
1579 }
1580
1581 my $veth = "veth${vmid}i${netid}";
93cdbbfb
AD
1582 my $eth = $newnet->{name};
1583
18862537
WB
1584 if (my $oldnetcfg = $conf->{$opt}) {
1585 my $oldnet = parse_lxc_network($oldnetcfg);
1586
1587 if (&$safe_string_ne($oldnet->{hwaddr}, $newnet->{hwaddr}) ||
1588 &$safe_string_ne($oldnet->{name}, $newnet->{name})) {
93cdbbfb 1589
18862537 1590 PVE::Network::veth_delete($veth);
bedeaaf1 1591 delete $conf->{$opt};
706c9791 1592 write_config($vmid, $conf);
93cdbbfb 1593
18862537 1594 hotplug_net($vmid, $conf, $opt, $newnet, $netid);
bedeaaf1 1595
18862537
WB
1596 } elsif (&$safe_string_ne($oldnet->{bridge}, $newnet->{bridge}) ||
1597 &$safe_num_ne($oldnet->{tag}, $newnet->{tag}) ||
1598 &$safe_num_ne($oldnet->{firewall}, $newnet->{firewall})) {
bedeaaf1 1599
18862537 1600 if ($oldnet->{bridge}) {
bedeaaf1 1601 PVE::Network::tap_unplug($veth);
18862537
WB
1602 foreach (qw(bridge tag firewall)) {
1603 delete $oldnet->{$_};
1604 }
1605 $conf->{$opt} = print_lxc_network($oldnet);
706c9791 1606 write_config($vmid, $conf);
bedeaaf1 1607 }
93cdbbfb 1608
23eb2244 1609 PVE::Network::tap_plug($veth, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks});
18862537
WB
1610 foreach (qw(bridge tag firewall)) {
1611 $oldnet->{$_} = $newnet->{$_} if $newnet->{$_};
1612 }
1613 $conf->{$opt} = print_lxc_network($oldnet);
706c9791 1614 write_config($vmid, $conf);
93cdbbfb
AD
1615 }
1616 } else {
18862537 1617 hotplug_net($vmid, $conf, $opt, $newnet, $netid);
93cdbbfb
AD
1618 }
1619
bedeaaf1 1620 update_ipconfig($vmid, $conf, $opt, $eth, $newnet, $rootdir);
93cdbbfb
AD
1621}
1622
1623sub hotplug_net {
18862537 1624 my ($vmid, $conf, $opt, $newnet, $netid) = @_;
93cdbbfb 1625
18862537 1626 my $veth = "veth${vmid}i${netid}";
cbb03fea 1627 my $vethpeer = $veth . "p";
93cdbbfb
AD
1628 my $eth = $newnet->{name};
1629
1630 PVE::Network::veth_create($veth, $vethpeer, $newnet->{bridge}, $newnet->{hwaddr});
23eb2244 1631 PVE::Network::tap_plug($veth, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks});
93cdbbfb 1632
cbb03fea 1633 # attach peer in container
93cdbbfb
AD
1634 my $cmd = ['lxc-device', '-n', $vmid, 'add', $vethpeer, "$eth" ];
1635 PVE::Tools::run_command($cmd);
1636
cbb03fea 1637 # link up peer in container
93cdbbfb
AD
1638 $cmd = ['lxc-attach', '-n', $vmid, '-s', 'NETWORK', '--', '/sbin/ip', 'link', 'set', $eth ,'up' ];
1639 PVE::Tools::run_command($cmd);
bedeaaf1 1640
18862537
WB
1641 my $done = { type => 'veth' };
1642 foreach (qw(bridge tag firewall hwaddr name)) {
1643 $done->{$_} = $newnet->{$_} if $newnet->{$_};
1644 }
1645 $conf->{$opt} = print_lxc_network($done);
bedeaaf1 1646
706c9791 1647 write_config($vmid, $conf);
93cdbbfb
AD
1648}
1649
68a05bb3 1650sub update_ipconfig {
bedeaaf1
AD
1651 my ($vmid, $conf, $opt, $eth, $newnet, $rootdir) = @_;
1652
f2104b80 1653 my $lxc_setup = PVE::LXC::Setup->new($conf, $rootdir);
bedeaaf1 1654
18862537 1655 my $optdata = parse_lxc_network($conf->{$opt});
84e0c123
WB
1656 my $deleted = [];
1657 my $added = [];
8d723477
WB
1658 my $nscmd = sub {
1659 my $cmdargs = shift;
1660 PVE::Tools::run_command(['lxc-attach', '-n', $vmid, '-s', 'NETWORK', '--', @_], %$cmdargs);
84e0c123 1661 };
8d723477 1662 my $ipcmd = sub { &$nscmd({}, '/sbin/ip', @_) };
2bfd1615 1663
84e0c123 1664 my $change_ip_config = sub {
f39002a6
DM
1665 my ($ipversion) = @_;
1666
1667 my $family_opt = "-$ipversion";
1668 my $suffix = $ipversion == 4 ? '' : $ipversion;
84e0c123
WB
1669 my $gw= "gw$suffix";
1670 my $ip= "ip$suffix";
bedeaaf1 1671
6178b0dd
WB
1672 my $newip = $newnet->{$ip};
1673 my $newgw = $newnet->{$gw};
1674 my $oldip = $optdata->{$ip};
1675
1676 my $change_ip = &$safe_string_ne($oldip, $newip);
1677 my $change_gw = &$safe_string_ne($optdata->{$gw}, $newgw);
bedeaaf1 1678
84e0c123 1679 return if !$change_ip && !$change_gw;
68a05bb3 1680
84e0c123 1681 # step 1: add new IP, if this fails we cancel
292aff54
WB
1682 my $is_real_ip = ($newip && $newip !~ /^(?:auto|dhcp|manual)$/);
1683 if ($change_ip && $is_real_ip) {
8d723477 1684 eval { &$ipcmd($family_opt, 'addr', 'add', $newip, 'dev', $eth); };
84e0c123
WB
1685 if (my $err = $@) {
1686 warn $err;
1687 return;
1688 }
bedeaaf1 1689 }
bedeaaf1 1690
84e0c123
WB
1691 # step 2: replace gateway
1692 # If this fails we delete the added IP and cancel.
1693 # If it succeeds we save the config and delete the old IP, ignoring
1694 # errors. The config is then saved.
1695 # Note: 'ip route replace' can add
1696 if ($change_gw) {
6178b0dd 1697 if ($newgw) {
292aff54
WB
1698 eval {
1699 if ($is_real_ip && !PVE::Network::is_ip_in_cidr($newgw, $newip, $ipversion)) {
1700 &$ipcmd($family_opt, 'route', 'add', $newgw, 'dev', $eth);
1701 }
1702 &$ipcmd($family_opt, 'route', 'replace', 'default', 'via', $newgw);
1703 };
84e0c123
WB
1704 if (my $err = $@) {
1705 warn $err;
1706 # the route was not replaced, the old IP is still available
1707 # rollback (delete new IP) and cancel
1708 if ($change_ip) {
8d723477 1709 eval { &$ipcmd($family_opt, 'addr', 'del', $newip, 'dev', $eth); };
84e0c123
WB
1710 warn $@ if $@; # no need to die here
1711 }
1712 return;
1713 }
1714 } else {
8d723477 1715 eval { &$ipcmd($family_opt, 'route', 'del', 'default'); };
84e0c123
WB
1716 # if the route was not deleted, the guest might have deleted it manually
1717 # warn and continue
1718 warn $@ if $@;
1719 }
2bfd1615 1720 }
2bfd1615 1721
6178b0dd 1722 # from this point on we save the configuration
84e0c123 1723 # step 3: delete old IP ignoring errors
6178b0dd 1724 if ($change_ip && $oldip && $oldip !~ /^(?:auto|dhcp)$/) {
8d723477
WB
1725 # We need to enable promote_secondaries, otherwise our newly added
1726 # address will be removed along with the old one.
1727 my $promote = 0;
1728 eval {
1729 if ($ipversion == 4) {
1730 &$nscmd({ outfunc => sub { $promote = int(shift) } },
1731 'cat', "/proc/sys/net/ipv4/conf/$eth/promote_secondaries");
1732 &$nscmd({}, 'sysctl', "net.ipv4.conf.$eth.promote_secondaries=1");
1733 }
1734 &$ipcmd($family_opt, 'addr', 'del', $oldip, 'dev', $eth);
1735 };
84e0c123 1736 warn $@ if $@; # no need to die here
8d723477
WB
1737
1738 if ($ipversion == 4) {
1739 &$nscmd({}, 'sysctl', "net.ipv4.conf.$eth.promote_secondaries=$promote");
1740 }
bedeaaf1
AD
1741 }
1742
84e0c123
WB
1743 foreach my $property ($ip, $gw) {
1744 if ($newnet->{$property}) {
1745 $optdata->{$property} = $newnet->{$property};
1746 } else {
1747 delete $optdata->{$property};
1748 }
bedeaaf1 1749 }
18862537 1750 $conf->{$opt} = print_lxc_network($optdata);
706c9791 1751 write_config($vmid, $conf);
84e0c123
WB
1752 $lxc_setup->setup_network($conf);
1753 };
bedeaaf1 1754
f39002a6
DM
1755 &$change_ip_config(4);
1756 &$change_ip_config(6);
489e960d
WL
1757
1758}
1759
a92f66c9
WL
1760# Internal snapshots
1761
1762# NOTE: Snapshot create/delete involves several non-atomic
c31ad455
FG
1763# actions, and can take a long time.
1764# So we try to avoid locking the file and use the 'lock' variable
a92f66c9
WL
1765# inside the config file instead.
1766
1767my $snapshot_copy_config = sub {
1768 my ($source, $dest) = @_;
1769
1770 foreach my $k (keys %$source) {
1771 next if $k eq 'snapshots';
09d3ec42
DM
1772 next if $k eq 'snapstate';
1773 next if $k eq 'snaptime';
1774 next if $k eq 'vmstate';
1775 next if $k eq 'lock';
a92f66c9 1776 next if $k eq 'digest';
09d3ec42 1777 next if $k eq 'description';
0f8b9438 1778 next if $k =~ m/^unused\d+$/;
a92f66c9
WL
1779
1780 $dest->{$k} = $source->{$k};
1781 }
1782};
1783
0f8b9438
FG
1784my $snapshot_apply_config = sub {
1785 my ($conf, $snap) = @_;
1786
1787 # copy snapshot list
1788 my $newconf = {
1789 snapshots => $conf->{snapshots},
1790 };
1791
1792 # keep description and list of unused disks
1793 foreach my $k (keys %$conf) {
1794 next if !($k =~ m/^unused\d+$/ || $k eq 'description');
1795 $newconf->{$k} = $conf->{$k};
1796 }
1797
1798 &$snapshot_copy_config($snap, $newconf);
1799
1800 return $newconf;
1801};
1802
4e8b04cd 1803sub snapshot_save_vmstate {
0f8b9438 1804 die "implement me - snapshot_save_vmstate\n";
4e8b04cd 1805}
0f8b9438 1806
0bfffef4
FG
1807sub snapshot_prepare {
1808 my ($vmid, $snapname, $save_vmstate, $comment) = @_;
a92f66c9
WL
1809
1810 my $snap;
1811
1812 my $updatefn = sub {
1813
1814 my $conf = load_config($vmid);
1815
bb1ac2de
DM
1816 die "you can't take a snapshot if it's a template\n"
1817 if is_template($conf);
1818
a92f66c9
WL
1819 check_lock($conf);
1820
09d3ec42 1821 $conf->{lock} = 'snapshot';
a92f66c9
WL
1822
1823 die "snapshot name '$snapname' already used\n"
1824 if defined($conf->{snapshots}->{$snapname});
1825
1826 my $storecfg = PVE::Storage::config();
41f044fb
FG
1827 die "snapshot feature is not available\n"
1828 if !has_feature('snapshot', $conf, $storecfg, undef, undef, $snapname eq 'vzdump');
a92f66c9
WL
1829
1830 $snap = $conf->{snapshots}->{$snapname} = {};
1831
0f8b9438 1832 if ($save_vmstate && check_running($vmid)) {
4e8b04cd 1833 snapshot_save_vmstate($vmid, $conf, $snapname, $storecfg);
0f8b9438
FG
1834 }
1835
a92f66c9
WL
1836 &$snapshot_copy_config($conf, $snap);
1837
0f8b9438
FG
1838 $snap->{snapstate} = "prepare";
1839 $snap->{snaptime} = time();
1840 $snap->{description} = $comment if $comment;
a92f66c9 1841
706c9791 1842 write_config($vmid, $conf);
a92f66c9
WL
1843 };
1844
3cc56749 1845 lock_config($vmid, $updatefn);
a92f66c9
WL
1846
1847 return $snap;
0bfffef4 1848}
a92f66c9 1849
0bfffef4 1850sub snapshot_commit {
a92f66c9
WL
1851 my ($vmid, $snapname) = @_;
1852
1853 my $updatefn = sub {
1854
1855 my $conf = load_config($vmid);
1856
1857 die "missing snapshot lock\n"
09d3ec42 1858 if !($conf->{lock} && $conf->{lock} eq 'snapshot');
a92f66c9 1859
0f8b9438
FG
1860 my $snap = $conf->{snapshots}->{$snapname};
1861 die "snapshot '$snapname' does not exist\n" if !defined($snap);
a92f66c9
WL
1862
1863 die "wrong snapshot state\n"
0f8b9438 1864 if !($snap->{snapstate} && $snap->{snapstate} eq "prepare");
a92f66c9 1865
0f8b9438 1866 delete $snap->{snapstate};
09d3ec42 1867 delete $conf->{lock};
a92f66c9 1868
0f8b9438
FG
1869 my $newconf = &$snapshot_apply_config($conf, $snap);
1870
1871 $newconf->{parent} = $snapname;
1872
1873 write_config($vmid, $newconf);
a92f66c9
WL
1874 };
1875
0bfffef4
FG
1876 lock_config($vmid, $updatefn);
1877}
a92f66c9
WL
1878
1879sub has_feature {
41f044fb 1880 my ($feature, $conf, $storecfg, $snapname, $running, $backup_only) = @_;
09d3ec42 1881
a92f66c9 1882 my $err;
09d3ec42 1883
8bf50651
DM
1884 foreach_mountpoint($conf, sub {
1885 my ($ms, $mountpoint) = @_;
1886
2c3ed8c4 1887 return if $err; # skip further test
41f044fb 1888 return if $backup_only && $ms ne 'rootfs' && !$mountpoint->{backup};
2c3ed8c4 1889
41f044fb 1890 $err = 1 if !PVE::Storage::volume_has_feature($storecfg, $feature, $mountpoint->{volume}, $snapname, $running);
8bf50651 1891 });
a92f66c9
WL
1892
1893 return $err ? 0 : 1;
1894}
1895
34fdb3d7
WB
1896my $enter_namespace = sub {
1897 my ($vmid, $pid, $which, $type) = @_;
1898 sysopen my $fd, "/proc/$pid/ns/$which", O_RDONLY
1899 or die "failed to open $which namespace of container $vmid: $!\n";
1900 PVE::Tools::setns(fileno($fd), $type)
1901 or die "failed to enter $which namespace of container $vmid: $!\n";
1902 close $fd;
1903};
1904
1905my $do_syncfs = sub {
1906 my ($vmid, $pid, $socket) = @_;
1907
1908 &$enter_namespace($vmid, $pid, 'mnt', PVE::Tools::CLONE_NEWNS);
1909
1910 # Tell the parent process to start reading our /proc/mounts
1911 print {$socket} "go\n";
1912 $socket->flush();
1913
1914 # Receive /proc/self/mounts
1915 my $mountdata = do { local $/ = undef; <$socket> };
1916 close $socket;
1917
1918 # Now sync all mountpoints...
1919 my $mounts = PVE::ProcFSTools::parse_mounts($mountdata);
1920 foreach my $mp (@$mounts) {
1921 my ($what, $dir, $fs) = @$mp;
1922 next if $fs eq 'fuse.lxcfs';
1923 eval { PVE::Tools::sync_mountpoint($dir); };
1924 warn $@ if $@;
1925 }
1926};
1927
1928sub sync_container_namespace {
1929 my ($vmid) = @_;
1930 my $pid = find_lxc_pid($vmid);
1931
1932 # SOCK_DGRAM is nicer for barriers but cannot be slurped
1933 socketpair my $pfd, my $cfd, AF_UNIX, SOCK_STREAM, PF_UNSPEC
1934 or die "failed to create socketpair: $!\n";
1935
1936 my $child = fork();
1937 die "fork failed: $!\n" if !defined($child);
1938
1939 if (!$child) {
1940 eval {
1941 close $pfd;
1942 &$do_syncfs($vmid, $pid, $cfd);
1943 };
1944 if (my $err = $@) {
1945 warn $err;
1946 POSIX::_exit(1);
1947 }
1948 POSIX::_exit(0);
1949 }
1950 close $cfd;
1951 my $go = <$pfd>;
1952 die "failed to enter container namespace\n" if $go ne "go\n";
1953
1954 open my $mounts, '<', "/proc/$child/mounts"
1955 or die "failed to open container's /proc/mounts: $!\n";
1956 my $mountdata = do { local $/ = undef; <$mounts> };
1957 close $mounts;
1958 print {$pfd} $mountdata;
1959 close $pfd;
1960
1961 while (waitpid($child, 0) != $child) {}
1962 die "failed to sync container namespace\n" if $? != 0;
1963}
1964
5040d81c
FG
1965sub check_freeze_needed {
1966 my ($vmid, $config, $save_vmstate) = @_;
1967
1968 my $ret = check_running($vmid);
1969 return ($ret, $ret);
1970}
1971
489e960d 1972sub snapshot_create {
0bfffef4 1973 my ($vmid, $snapname, $save_vmstate, $comment) = @_;
489e960d 1974
0bfffef4 1975 my $snap = snapshot_prepare($vmid, $snapname, $save_vmstate, $comment);
a92f66c9 1976
5040d81c
FG
1977 $save_vmstate = 0 if !$snap->{vmstate};
1978
09d3ec42 1979 my $conf = load_config($vmid);
a92f66c9 1980
5040d81c 1981 my ($running, $freezefs) = check_freeze_needed($vmid, $conf, $snap->{vmstate});
74bf6d37
FG
1982
1983 my $drivehash = {};
1984
a92f66c9 1985 eval {
5040d81c 1986 if ($freezefs) {
74bf6d37 1987 PVE::Tools::run_command(['/usr/bin/lxc-freeze', '-n', $vmid]);
34fdb3d7 1988 sync_container_namespace($vmid);
5040d81c 1989 }
a92f66c9
WL
1990
1991 my $storecfg = PVE::Storage::config();
5040d81c
FG
1992 foreach_mountpoint($conf, sub {
1993 my ($ms, $mountpoint) = @_;
a92f66c9 1994
5040d81c
FG
1995 return if $snapname eq 'vzdump' && $ms ne 'rootfs' && !$mountpoint->{backup};
1996 PVE::Storage::volume_snapshot($storecfg, $mountpoint->{volume}, $snapname);
1997 $drivehash->{$ms} = 1;
1998 });
a92f66c9 1999 };
2477a7f1
DM
2000 my $err = $@;
2001
5040d81c
FG
2002 if ($running) {
2003 if ($freezefs) {
2004 eval { PVE::Tools::run_command(['/usr/bin/lxc-unfreeze', '-n', $vmid]); };
2005 warn $@ if $@;
2006 }
2477a7f1
DM
2007 }
2008
2009 if ($err) {
5040d81c 2010 warn "snapshot create failed: starting cleanup\n";
74bf6d37 2011 eval { snapshot_delete($vmid, $snapname, 1, $drivehash); };
5040d81c 2012 warn "$@" if $@;
a92f66c9
WL
2013 die "$err\n";
2014 }
74bf6d37 2015
0bfffef4 2016 snapshot_commit($vmid, $snapname);
68a05bb3
AD
2017}
2018
74bf6d37 2019# Note: $drivehash is only set when called from snapshot_create.
57ccb3f8 2020sub snapshot_delete {
74bf6d37 2021 my ($vmid, $snapname, $force, $drivehash) = @_;
57ccb3f8 2022
4de963d4 2023 my $prepare = 1;
31429832 2024
4de963d4 2025 my $snap;
5040d81c 2026 my $unused = [];
31429832 2027
7b2eb379 2028 my $unlink_parent = sub {
7b2eb379 2029 my ($confref, $new_parent) = @_;
31429832 2030
7b2eb379
FG
2031 if ($confref->{parent} && $confref->{parent} eq $snapname) {
2032 if ($new_parent) {
2033 $confref->{parent} = $new_parent;
31429832 2034 } else {
7b2eb379 2035 delete $confref->{parent};
31429832
WL
2036 }
2037 }
7b2eb379
FG
2038 };
2039
4de963d4
FG
2040 my $updatefn = sub {
2041 my ($remove_drive) = @_;
7b2eb379 2042
4de963d4 2043 my $conf = load_config($vmid);
74bf6d37 2044
4de963d4 2045 if (!$drivehash) {
74bf6d37 2046 check_lock($conf);
4de963d4
FG
2047 die "you can't delete a snapshot if vm is a template\n"
2048 if is_template($conf);
74bf6d37 2049 }
7b2eb379 2050
4de963d4
FG
2051 $snap = $conf->{snapshots}->{$snapname};
2052
2053 die "snapshot '$snapname' does not exist\n" if !defined($snap);
2054
2055 # remove parent refs
2056 if (!$prepare) {
2057 &$unlink_parent($conf, $snap->{parent});
2058 foreach my $sn (keys %{$conf->{snapshots}}) {
2059 next if $sn eq $snapname;
2060 &$unlink_parent($conf->{snapshots}->{$sn}, $snap->{parent});
2061 }
7b2eb379
FG
2062 }
2063
4de963d4
FG
2064 if ($remove_drive) {
2065 if ($remove_drive eq 'vmstate') {
2066 die "implement me - saving vmstate\n";
2067 } else {
5040d81c
FG
2068 my $value = $snap->{$remove_drive};
2069 my $mountpoint = $remove_drive eq 'rootfs' ? parse_ct_rootfs($value, 1) : parse_ct_mountpoint($value, 1);
2070 delete $snap->{$remove_drive};
2071 add_unused_volume($snap, $mountpoint->{volume})
2072 if (!is_volume_in_use($snap, $mountpoint->{volume}));
4de963d4
FG
2073 }
2074 }
31429832 2075
4de963d4
FG
2076 if ($prepare) {
2077 $snap->{snapstate} = 'delete';
2078 } else {
2079 delete $conf->{snapshots}->{$snapname};
2080 delete $conf->{lock} if $drivehash;
5040d81c
FG
2081 foreach my $volid (@$unused) {
2082 add_unused_volume($conf, $volid)
2083 if (!is_volume_in_use($conf, $volid));
2084 }
4de963d4 2085 }
31429832 2086
706c9791 2087 write_config($vmid, $conf);
31429832
WL
2088 };
2089
4de963d4
FG
2090 lock_config($vmid, $updatefn);
2091
2092 # now remove vmstate file
2093 # never set for LXC!
2094 my $storecfg = PVE::Storage::config();
2095
2096 if ($snap->{vmstate}) {
2097 die "implement me - saving vmstate\n";
2098 };
31429832 2099
4de963d4 2100 # now remove all volume snapshots
5040d81c
FG
2101 foreach_mountpoint($snap, sub {
2102 my ($ms, $mountpoint) = @_;
2103
2104 return if $snapname eq 'vzdump' && $ms ne 'rootfs' && !$mountpoint->{backup};
2105 if (!$drivehash || $drivehash->{$ms}) {
2106 eval { PVE::Storage::volume_snapshot_delete($storecfg, $mountpoint->{volume}, $snapname); };
2107 if (my $err = $@) {
2108 die $err if !$force;
2109 warn $err;
2110 }
2111 }
2112
2113 # save changes (remove mp from snapshot)
2114 lock_config($vmid, $updatefn, $ms) if !$force;
2115 push @$unused, $mountpoint->{volume};
2116 });
4de963d4
FG
2117
2118 # now cleanup config
2119 $prepare = 0;
2120 lock_config($vmid, $updatefn);
57ccb3f8
WL
2121}
2122
723157f6
WL
2123sub snapshot_rollback {
2124 my ($vmid, $snapname) = @_;
2125
20e5d106
FG
2126 my $prepare = 1;
2127
6860ba0c
WL
2128 my $storecfg = PVE::Storage::config();
2129
2130 my $conf = load_config($vmid);
2131
20e5d106 2132 my $get_snapshot_config = sub {
bb1ac2de 2133
20e5d106 2134 die "you can't rollback if vm is a template\n" if is_template($conf);
6860ba0c 2135
20e5d106 2136 my $res = $conf->{snapshots}->{$snapname};
6860ba0c 2137
20e5d106
FG
2138 die "snapshot '$snapname' does not exist\n" if !defined($res);
2139
2140 return $res;
2141 };
2142
2143 my $snap = &$get_snapshot_config();
2144
5040d81c
FG
2145 foreach_mountpoint($snap, sub {
2146 my ($ms, $mountpoint) = @_;
09d3ec42 2147
5040d81c
FG
2148 PVE::Storage::volume_rollback_is_possible($storecfg, $mountpoint->{volume}, $snapname);
2149 });
6860ba0c
WL
2150
2151 my $updatefn = sub {
2152
20e5d106 2153 $conf = load_config($vmid);
6860ba0c 2154
20e5d106
FG
2155 $snap = &$get_snapshot_config();
2156
2157 die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
2158 if $snap->{snapstate};
6860ba0c 2159
20e5d106
FG
2160 if ($prepare) {
2161 check_lock($conf);
69d4afc7
FG
2162 PVE::Tools::run_command(['/usr/bin/lxc-stop', '-n', $vmid, '--kill'])
2163 if check_running($vmid);
20e5d106 2164 }
6860ba0c
WL
2165
2166 die "unable to rollback vm $vmid: vm is running\n"
2167 if check_running($vmid);
2168
20e5d106
FG
2169 if ($prepare) {
2170 $conf->{lock} = 'rollback';
2171 } else {
2172 die "got wrong lock\n" if !($conf->{lock} && $conf->{lock} eq 'rollback');
2173 delete $conf->{lock};
2174 }
6860ba0c
WL
2175
2176 my $forcemachine;
2177
20e5d106
FG
2178 if (!$prepare) {
2179 # copy snapshot config to current config
2180 $conf = &$snapshot_apply_config($conf, $snap);
2181 $conf->{parent} = $snapname;
2182 }
6860ba0c 2183
706c9791 2184 write_config($vmid, $conf);
6860ba0c 2185
20e5d106 2186 if (!$prepare && $snap->{vmstate}) {
19d36a45 2187 die "implement me - save vmstate\n";
20e5d106 2188 }
6860ba0c
WL
2189 };
2190
3cc56749 2191 lock_config($vmid, $updatefn);
6860ba0c 2192
5040d81c
FG
2193 foreach_mountpoint($snap, sub {
2194 my ($ms, $mountpoint) = @_;
2195
2196 PVE::Storage::volume_snapshot_rollback($storecfg, $mountpoint->{volume}, $snapname);
2197 });
6860ba0c 2198
20e5d106
FG
2199 $prepare = 0;
2200 lock_config($vmid, $updatefn);
723157f6 2201}
b935932a 2202
bb1ac2de
DM
2203sub template_create {
2204 my ($vmid, $conf) = @_;
2205
2206 my $storecfg = PVE::Storage::config();
2207
44a9face 2208 my $rootinfo = parse_ct_rootfs($conf->{rootfs});
bb1ac2de
DM
2209 my $volid = $rootinfo->{volume};
2210
2211 die "Template feature is not available for '$volid'\n"
2212 if !PVE::Storage::volume_has_feature($storecfg, 'template', $volid);
2213
2214 PVE::Storage::activate_volumes($storecfg, [$volid]);
2215
2216 my $template_volid = PVE::Storage::vdisk_create_base($storecfg, $volid);
2217 $rootinfo->{volume} = $template_volid;
4fee75fd 2218 $conf->{rootfs} = print_ct_mountpoint($rootinfo, 1);
bb1ac2de
DM
2219
2220 write_config($vmid, $conf);
2221}
2222
2223sub is_template {
2224 my ($conf) = @_;
2225
2226 return 1 if defined $conf->{template} && $conf->{template} == 1;
2227}
2228
9622e848
DM
2229sub mountpoint_names {
2230 my ($reverse) = @_;
ced7fddb 2231
9622e848 2232 my @names = ('rootfs');
eaebef36
DM
2233
2234 for (my $i = 0; $i < $MAX_MOUNT_POINTS; $i++) {
9622e848
DM
2235 push @names, "mp$i";
2236 }
2237
2238 return $reverse ? reverse @names : @names;
2239}
2240
3c9dbfa9 2241
9622e848
DM
2242sub foreach_mountpoint_full {
2243 my ($conf, $reverse, $func) = @_;
2244
2245 foreach my $key (mountpoint_names($reverse)) {
2246 my $value = $conf->{$key};
2247 next if !defined($value);
44a9face 2248 my $mountpoint = $key eq 'rootfs' ? parse_ct_rootfs($value, 1) : parse_ct_mountpoint($value, 1);
ca7feb1a 2249 next if !defined($mountpoint);
3c9dbfa9 2250
eaebef36 2251 &$func($key, $mountpoint);
ced7fddb
AD
2252 }
2253}
2254
9622e848
DM
2255sub foreach_mountpoint {
2256 my ($conf, $func) = @_;
2257
2258 foreach_mountpoint_full($conf, 0, $func);
2259}
2260
2261sub foreach_mountpoint_reverse {
2262 my ($conf, $func) = @_;
2263
2264 foreach_mountpoint_full($conf, 1, $func);
2265}
2266
52389a07 2267sub check_ct_modify_config_perm {
f1ba1a4b 2268 my ($rpcenv, $authuser, $vmid, $pool, $newconf, $delete) = @_;
52389a07 2269
c81f19d1 2270 return 1 if $authuser eq 'root@pam';
52389a07 2271
f1ba1a4b
WB
2272 my $check = sub {
2273 my ($opt, $delete) = @_;
52389a07
DM
2274 if ($opt eq 'cpus' || $opt eq 'cpuunits' || $opt eq 'cpulimit') {
2275 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.CPU']);
e59a61ed 2276 } elsif ($opt eq 'rootfs' || $opt =~ /^mp\d+$/) {
52389a07 2277 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Disk']);
f1ba1a4b
WB
2278 return if $delete;
2279 my $data = $opt eq 'rootfs' ? parse_ct_rootfs($newconf->{$opt})
2280 : parse_ct_mountpoint($newconf->{$opt});
2281 raise_perm_exc("mountpoint type $data->{type}") if $data->{type} ne 'volume';
52389a07
DM
2282 } elsif ($opt eq 'memory' || $opt eq 'swap') {
2283 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Memory']);
2284 } elsif ($opt =~ m/^net\d+$/ || $opt eq 'nameserver' ||
2285 $opt eq 'searchdomain' || $opt eq 'hostname') {
2286 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Network']);
2287 } else {
2288 $rpcenv->check_vm_perm($authuser, $vmid, $pool, ['VM.Config.Options']);
2289 }
f1ba1a4b
WB
2290 };
2291
2292 foreach my $opt (keys %$newconf) {
2293 &$check($opt, 0);
2294 }
2295 foreach my $opt (@$delete) {
2296 &$check($opt, 1);
52389a07
DM
2297 }
2298
2299 return 1;
2300}
2301
9622e848 2302sub umount_all {
da629848 2303 my ($vmid, $storage_cfg, $conf, $noerr) = @_;
9622e848
DM
2304
2305 my $rootdir = "/var/lib/lxc/$vmid/rootfs";
2306 my $volid_list = get_vm_volumes($conf);
2307
2308 foreach_mountpoint_reverse($conf, sub {
2309 my ($ms, $mountpoint) = @_;
2310
2311 my $volid = $mountpoint->{volume};
2312 my $mount = $mountpoint->{mp};
2313
2314 return if !$volid || !$mount;
2315
d18f96b4 2316 my $mount_path = "$rootdir/$mount";
f845a93d 2317 $mount_path =~ s!/+!/!g;
9622e848 2318
228a5a1d
WL
2319 return if !PVE::ProcFSTools::is_mounted($mount_path);
2320
9622e848 2321 eval {
d18f96b4 2322 PVE::Tools::run_command(['umount', '-d', $mount_path]);
9622e848
DM
2323 };
2324 if (my $err = $@) {
2325 if ($noerr) {
2326 warn $err;
2327 } else {
2328 die $err;
2329 }
2330 }
2331 });
9622e848
DM
2332}
2333
2334sub mount_all {
7b49dfe0 2335 my ($vmid, $storage_cfg, $conf) = @_;
9622e848
DM
2336
2337 my $rootdir = "/var/lib/lxc/$vmid/rootfs";
1adc7e53 2338 File::Path::make_path($rootdir);
9622e848
DM
2339
2340 my $volid_list = get_vm_volumes($conf);
2341 PVE::Storage::activate_volumes($storage_cfg, $volid_list);
2342
2343 eval {
9622e848
DM
2344 foreach_mountpoint($conf, sub {
2345 my ($ms, $mountpoint) = @_;
2346
da629848 2347 mountpoint_mount($mountpoint, $rootdir, $storage_cfg);
9622e848
DM
2348 });
2349 };
2350 if (my $err = $@) {
e2007ac2 2351 warn "mounting container failed\n";
9622e848 2352 umount_all($vmid, $storage_cfg, $conf, 1);
e2007ac2 2353 die $err;
9622e848
DM
2354 }
2355
da629848 2356 return $rootdir;
9622e848
DM
2357}
2358
2359
b15c75fc 2360sub mountpoint_mount_path {
da629848 2361 my ($mountpoint, $storage_cfg, $snapname) = @_;
b15c75fc 2362
da629848 2363 return mountpoint_mount($mountpoint, undef, $storage_cfg, $snapname);
b15c75fc 2364}
cc6b0307 2365
2cfae16e
WB
2366my $check_mount_path = sub {
2367 my ($path) = @_;
2368 $path = File::Spec->canonpath($path);
2369 my $real = Cwd::realpath($path);
2370 if ($real ne $path) {
2371 die "mount path modified by symlink: $path != $real";
2372 }
2373};
2374
21f292ff
WB
2375sub query_loopdev {
2376 my ($path) = @_;
2377 my $found;
2378 my $parser = sub {
2379 my $line = shift;
2380 if ($line =~ m@^(/dev/loop\d+):@) {
2381 $found = $1;
2382 }
2383 };
2384 my $cmd = ['losetup', '--associated', $path];
2385 PVE::Tools::run_command($cmd, outfunc => $parser);
2386 return $found;
2387}
2388
50df544c
WB
2389# Run a function with a file attached to a loop device.
2390# The loop device is always detached afterwards (or set to autoclear).
2391# Returns the loop device.
2392sub run_with_loopdev {
2393 my ($func, $file) = @_;
2394 my $device;
2395 my $parser = sub {
2396 my $line = shift;
2397 if ($line =~ m@^(/dev/loop\d+)$@) {
2398 $device = $1;
2399 }
2400 };
2401 PVE::Tools::run_command(['losetup', '--show', '-f', $file], outfunc => $parser);
2402 die "failed to setup loop device for $file\n" if !$device;
2403 eval { &$func($device); };
2404 my $err = $@;
2405 PVE::Tools::run_command(['losetup', '-d', $device]);
2406 die $err if $err;
2407 return $device;
2408}
2409
c2744c97
WB
2410sub bindmount {
2411 my ($dir, $dest, $ro, @extra_opts) = @_;
2412 PVE::Tools::run_command(['mount', '-o', 'bind', @extra_opts, $dir, $dest]);
2413 if ($ro) {
2414 eval { PVE::Tools::run_command(['mount', '-o', 'bind,remount,ro', $dest]); };
2415 if (my $err = $@) {
2416 warn "bindmount error\n";
2417 # don't leave writable bind-mounts behind...
2418 PVE::Tools::run_command(['umount', $dest]);
2419 die $err;
2420 }
2421 }
2422}
2423
b15c75fc 2424# use $rootdir = undef to just return the corresponding mount path
cc6b0307 2425sub mountpoint_mount {
da629848 2426 my ($mountpoint, $rootdir, $storage_cfg, $snapname) = @_;
cc6b0307
AD
2427
2428 my $volid = $mountpoint->{volume};
2429 my $mount = $mountpoint->{mp};
7c921c80 2430 my $type = $mountpoint->{type};
50df544c
WB
2431 my $quota = !$snapname && !$mountpoint->{ro} && $mountpoint->{quota};
2432 my $mounted_dev;
b15c75fc 2433
cc6b0307
AD
2434 return if !$volid || !$mount;
2435
b15c75fc
DM
2436 my $mount_path;
2437
2438 if (defined($rootdir)) {
2439 $rootdir =~ s!/+$!!;
2440 $mount_path = "$rootdir/$mount";
f845a93d 2441 $mount_path =~ s!/+!/!g;
2cfae16e 2442 &$check_mount_path($mount_path);
b15c75fc 2443 File::Path::mkpath($mount_path);
116ce06f 2444 }
b15c75fc
DM
2445
2446 my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);
cc6b0307 2447
b15c75fc 2448 die "unknown snapshot path for '$volid'" if !$storage && defined($snapname);
cc6b0307 2449
471dd315
WB
2450 my $optstring = '';
2451 if (defined($mountpoint->{acl})) {
2452 $optstring .= ($mountpoint->{acl} ? 'acl' : 'noacl');
2453 }
c2744c97 2454 my $readonly = $mountpoint->{ro};
471dd315
WB
2455
2456 my @extra_opts = ('-o', $optstring);
2457
b15c75fc
DM
2458 if ($storage) {
2459
2460 my $scfg = PVE::Storage::storage_config($storage_cfg, $storage);
2461 my $path = PVE::Storage::path($storage_cfg, $volid, $snapname);
2462
2463 my ($vtype, undef, undef, undef, undef, $isBase, $format) =
2464 PVE::Storage::parse_volname($storage_cfg, $volid);
2465
c87b9dd8
DM
2466 $format = 'iso' if $vtype eq 'iso'; # allow to handle iso files
2467
b15c75fc 2468 if ($format eq 'subvol') {
30de33be
DM
2469 if ($mount_path) {
2470 if ($snapname) {
e84f7f5d
DM
2471 if ($scfg->{type} eq 'zfspool') {
2472 my $path_arg = $path;
2473 $path_arg =~ s!^/+!!;
471dd315 2474 PVE::Tools::run_command(['mount', '-o', 'ro', @extra_opts, '-t', 'zfs', $path_arg, $mount_path]);
e84f7f5d 2475 } else {
30de33be
DM
2476 die "cannot mount subvol snapshots for storage type '$scfg->{type}'\n";
2477 }
e84f7f5d 2478 } else {
c2744c97 2479 bindmount($path, $mount_path, $readonly, @extra_opts);
50df544c 2480 warn "cannot enable quota control for bind mounted subvolumes\n" if $quota;
30de33be 2481 }
b15c75fc 2482 }
50df544c 2483 return wantarray ? ($path, 0, $mounted_dev) : $path;
c87b9dd8 2484 } elsif ($format eq 'raw' || $format eq 'iso') {
50df544c
WB
2485 my $domount = sub {
2486 my ($path) = @_;
2487 if ($mount_path) {
2488 if ($format eq 'iso') {
2489 PVE::Tools::run_command(['mount', '-o', 'ro', @extra_opts, $path, $mount_path]);
2490 } elsif ($isBase || defined($snapname)) {
2491 PVE::Tools::run_command(['mount', '-o', 'ro,noload', @extra_opts, $path, $mount_path]);
2492 } else {
2493 if ($quota) {
2494 push @extra_opts, '-o', 'usrjquota=aquota.user,grpjquota=aquota.group,jqfmt=vfsv0';
2495 }
c2744c97 2496 push @extra_opts, '-o', 'ro' if $readonly;
50df544c
WB
2497 PVE::Tools::run_command(['mount', @extra_opts, $path, $mount_path]);
2498 }
2499 }
2500 };
30de33be 2501 my $use_loopdev = 0;
b15c75fc 2502 if ($scfg->{path}) {
50df544c 2503 $mounted_dev = run_with_loopdev($domount, $path);
30de33be 2504 $use_loopdev = 1;
2e879877
DM
2505 } elsif ($scfg->{type} eq 'drbd' || $scfg->{type} eq 'lvm' ||
2506 $scfg->{type} eq 'rbd' || $scfg->{type} eq 'lvmthin') {
50df544c
WB
2507 $mounted_dev = $path;
2508 &$domount($path);
b15c75fc
DM
2509 } else {
2510 die "unsupported storage type '$scfg->{type}'\n";
2511 }
50df544c 2512 return wantarray ? ($path, $use_loopdev, $mounted_dev) : $path;
b15c75fc
DM
2513 } else {
2514 die "unsupported image format '$format'\n";
2515 }
7c921c80 2516 } elsif ($type eq 'device') {
c2744c97 2517 push @extra_opts, '-o', 'ro' if $readonly;
471dd315 2518 PVE::Tools::run_command(['mount', @extra_opts, $volid, $mount_path]) if $mount_path;
50df544c 2519 return wantarray ? ($volid, 0, $volid) : $volid;
e2007ac2
DM
2520 } elsif ($type eq 'bind') {
2521 die "directory '$volid' does not exist\n" if ! -d $volid;
2cfae16e 2522 &$check_mount_path($volid);
c2744c97 2523 bindmount($volid, $mount_path, $readonly, @extra_opts) if $mount_path;
50df544c
WB
2524 warn "cannot enable quota control for bind mounts\n" if $quota;
2525 return wantarray ? ($volid, 0, undef) : $volid;
b15c75fc
DM
2526 }
2527
2528 die "unsupported storage";
cc6b0307
AD
2529}
2530
9205e9d0
AD
2531sub get_vm_volumes {
2532 my ($conf, $excludes) = @_;
2533
2534 my $vollist = [];
2535
706c9791 2536 foreach_mountpoint($conf, sub {
9205e9d0
AD
2537 my ($ms, $mountpoint) = @_;
2538
2539 return if $excludes && $ms eq $excludes;
2540
2541 my $volid = $mountpoint->{volume};
2542
7c921c80 2543 return if !$volid || $mountpoint->{type} ne 'volume';
9205e9d0
AD
2544
2545 my ($sid, $volname) = PVE::Storage::parse_volume_id($volid, 1);
2546 return if !$sid;
2547
2548 push @$vollist, $volid;
2549 });
2550
2551 return $vollist;
2552}
2553
6c871c36 2554sub mkfs {
d216e891 2555 my ($dev, $rootuid, $rootgid) = @_;
6c871c36 2556
d216e891
WB
2557 PVE::Tools::run_command(['mkfs.ext4', '-O', 'mmp',
2558 '-E', "root_owner=$rootuid:$rootgid",
2559 $dev]);
6c871c36
DM
2560}
2561
2562sub format_disk {
d216e891 2563 my ($storage_cfg, $volid, $rootuid, $rootgid) = @_;
6c871c36
DM
2564
2565 if ($volid =~ m!^/dev/.+!) {
2566 mkfs($volid);
2567 return;
2568 }
2569
2570 my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);
2571
2572 die "cannot format volume '$volid' with no storage\n" if !$storage;
2573
08ca136d
DM
2574 PVE::Storage::activate_volumes($storage_cfg, [$volid]);
2575
6c871c36
DM
2576 my $path = PVE::Storage::path($storage_cfg, $volid);
2577
2578 my ($vtype, undef, undef, undef, undef, $isBase, $format) =
2579 PVE::Storage::parse_volname($storage_cfg, $volid);
2580
2581 die "cannot format volume '$volid' (format == $format)\n"
2582 if $format ne 'raw';
2583
d216e891 2584 mkfs($path, $rootuid, $rootgid);
6c871c36
DM
2585}
2586
2587sub destroy_disks {
2588 my ($storecfg, $vollist) = @_;
2589
2590 foreach my $volid (@$vollist) {
2591 eval { PVE::Storage::vdisk_free($storecfg, $volid); };
2592 warn $@ if $@;
2593 }
2594}
2595
2596sub create_disks {
2597 my ($storecfg, $vmid, $settings, $conf) = @_;
2598
2599 my $vollist = [];
2600
2601 eval {
d216e891
WB
2602 my (undef, $rootuid, $rootgid) = PVE::LXC::parse_id_maps($conf);
2603 my $chown_vollist = [];
2604
6c871c36
DM
2605 foreach_mountpoint($settings, sub {
2606 my ($ms, $mountpoint) = @_;
2607
2608 my $volid = $mountpoint->{volume};
2609 my $mp = $mountpoint->{mp};
2610
2611 my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);
2612
e2007ac2 2613 if ($storage && ($volid =~ m/^([^:\s]+):(\d+(\.\d+)?)$/)) {
8ed5ff9d 2614 my ($storeid, $size_gb) = ($1, $2);
6c871c36 2615
8ed5ff9d 2616 my $size_kb = int(${size_gb}*1024) * 1024;
6c871c36
DM
2617
2618 my $scfg = PVE::Storage::storage_config($storecfg, $storage);
2619 # fixme: use better naming ct-$vmid-disk-X.raw?
2620
2621 if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs') {
8ed5ff9d 2622 if ($size_kb > 0) {
6c871c36 2623 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'raw',
8ed5ff9d 2624 undef, $size_kb);
d216e891 2625 format_disk($storecfg, $volid, $rootuid, $rootgid);
6c871c36
DM
2626 } else {
2627 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'subvol',
2628 undef, 0);
d216e891 2629 push @$chown_vollist, $volid;
6c871c36
DM
2630 }
2631 } elsif ($scfg->{type} eq 'zfspool') {
2632
2633 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'subvol',
8ed5ff9d 2634 undef, $size_kb);
d216e891 2635 push @$chown_vollist, $volid;
2e879877 2636 } elsif ($scfg->{type} eq 'drbd' || $scfg->{type} eq 'lvm' || $scfg->{type} eq 'lvmthin') {
6c871c36 2637
8ed5ff9d 2638 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'raw', undef, $size_kb);
d216e891 2639 format_disk($storecfg, $volid, $rootuid, $rootgid);
6c871c36
DM
2640
2641 } elsif ($scfg->{type} eq 'rbd') {
2642
2643 die "krbd option must be enabled on storage type '$scfg->{type}'\n" if !$scfg->{krbd};
8ed5ff9d 2644 $volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, 'raw', undef, $size_kb);
d216e891 2645 format_disk($storecfg, $volid, $rootuid, $rootgid);
6c871c36
DM
2646 } else {
2647 die "unable to create containers on storage type '$scfg->{type}'\n";
2648 }
2649 push @$vollist, $volid;
71c780b9
WB
2650 $mountpoint->{volume} = $volid;
2651 $mountpoint->{size} = $size_kb * 1024;
2652 $conf->{$ms} = print_ct_mountpoint($mountpoint, $ms eq 'rootfs');
6c871c36 2653 } else {
e2007ac2
DM
2654 # use specified/existing volid/dir/device
2655 $conf->{$ms} = print_ct_mountpoint($mountpoint, $ms eq 'rootfs');
6c871c36
DM
2656 }
2657 });
d216e891
WB
2658
2659 PVE::Storage::activate_volumes($storecfg, $chown_vollist, undef);
2660 foreach my $volid (@$chown_vollist) {
2661 my $path = PVE::Storage::path($storecfg, $volid, undef);
2662 chown($rootuid, $rootgid, $path);
2663 }
2664 PVE::Storage::deactivate_volumes($storecfg, $chown_vollist, undef);
6c871c36
DM
2665 };
2666 # free allocated images on error
2667 if (my $err = $@) {
2668 destroy_disks($storecfg, $vollist);
2669 die $err;
2670 }
2671 return $vollist;
2672}
2673
68e8f3c5
DM
2674# bash completion helper
2675
2676sub complete_os_templates {
2677 my ($cmdname, $pname, $cvalue) = @_;
2678
2679 my $cfg = PVE::Storage::config();
2680
9e9bc3a6 2681 my $storeid;
68e8f3c5
DM
2682
2683 if ($cvalue =~ m/^([^:]+):/) {
2684 $storeid = $1;
2685 }
2686
2687 my $vtype = $cmdname eq 'restore' ? 'backup' : 'vztmpl';
2688 my $data = PVE::Storage::template_list($cfg, $storeid, $vtype);
2689
2690 my $res = [];
2691 foreach my $id (keys %$data) {
2692 foreach my $item (@{$data->{$id}}) {
2693 push @$res, $item->{volid} if defined($item->{volid});
2694 }
2695 }
2696
2697 return $res;
2698}
2699
68e8f3c5
DM
2700my $complete_ctid_full = sub {
2701 my ($running) = @_;
2702
2703 my $idlist = vmstatus();
2704
2705 my $active_hash = list_active_containers();
2706
2707 my $res = [];
2708
2709 foreach my $id (keys %$idlist) {
2710 my $d = $idlist->{$id};
2711 if (defined($running)) {
2712 next if $d->{template};
2713 next if $running && !$active_hash->{$id};
2714 next if !$running && $active_hash->{$id};
2715 }
2716 push @$res, $id;
2717
2718 }
2719 return $res;
2720};
2721
2722sub complete_ctid {
2723 return &$complete_ctid_full();
2724}
2725
2726sub complete_ctid_stopped {
2727 return &$complete_ctid_full(0);
2728}
2729
2730sub complete_ctid_running {
2731 return &$complete_ctid_full(1);
2732}
2733
c6a605f9
WB
2734sub parse_id_maps {
2735 my ($conf) = @_;
2736
2737 my $id_map = [];
2738 my $rootuid = 0;
2739 my $rootgid = 0;
2740
2741 my $lxc = $conf->{lxc};
2742 foreach my $entry (@$lxc) {
2743 my ($key, $value) = @$entry;
2744 next if $key ne 'lxc.id_map';
2745 if ($value =~ /^([ug])\s+(\d+)\s+(\d+)\s+(\d+)\s*$/) {
2746 my ($type, $ct, $host, $length) = ($1, $2, $3, $4);
2747 push @$id_map, [$type, $ct, $host, $length];
2748 if ($ct == 0) {
2749 $rootuid = $host if $type eq 'u';
2750 $rootgid = $host if $type eq 'g';
2751 }
2752 } else {
2753 die "failed to parse id_map: $value\n";
2754 }
2755 }
2756
2757 if (!@$id_map && $conf->{unprivileged}) {
2758 # Should we read them from /etc/subuid?
2759 $id_map = [ ['u', '0', '100000', '65536'],
2760 ['g', '0', '100000', '65536'] ];
2761 $rootuid = $rootgid = 100000;
2762 }
2763
2764 return ($id_map, $rootuid, $rootgid);
2765}
2766
01dce99b
WB
2767sub userns_command {
2768 my ($id_map) = @_;
2769 if (@$id_map) {
2770 return ['lxc-usernsexec', (map { ('-m', join(':', @$_)) } @$id_map), '--'];
2771 }
2772 return [];
2773}
2774
f76a2828 27751;