]> git.proxmox.com Git - pve-container.git/blame - src/PVE/LXC.pm
pct enter: check if container runs before lxc-attach
[pve-container.git] / src / PVE / LXC.pm
CommitLineData
f76a2828
DM
1package PVE::LXC;
2
3use strict;
4use warnings;
d14a9a1b 5use POSIX qw(EINTR);
f76a2828 6
34fdb3d7
WB
7use Socket;
8
f76a2828 9use File::Path;
2cfae16e
WB
10use File::Spec;
11use Cwd qw();
3cc56749 12use Fcntl qw(O_RDONLY);
f76a2828
DM
13
14use PVE::Cluster qw(cfs_register_file cfs_read_file);
f1ba1a4b 15use PVE::Exception qw(raise_perm_exc);
c65e0a6d 16use PVE::Storage;
f76a2828
DM
17use PVE::SafeSyslog;
18use PVE::INotify;
a3249355 19use PVE::JSONSchema qw(get_standard_option);
1bfe8728 20use PVE::Tools qw($IPV6RE $IPV4RE dir_glob_foreach lock_file lock_file_full);
68fba17b 21use PVE::Network;
52389a07 22use PVE::AccessControl;
228a5a1d 23use PVE::ProcFSTools;
688afc63 24use Time::HiRes qw (gettimeofday);
f76a2828
DM
25
26use Data::Dumper;
27
27916659
DM
# Name of the local cluster node, resolved once at module load time.
my $nodename = PVE::INotify::nodename();

# CPU information of the host as returned by PVE::ProcFSTools::read_cpuinfo()
# (vmstatus reads the 'cpus' and 'user_hz' entries).
my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();

# Shared list of tar command line flags, exported as a package variable.
our $COMMON_TAR_FLAGS = [
    '--sparse',
    '--numeric-owner',
    '--acls',
    '--xattrs',
    '--xattrs-include=user.*',
    '--xattrs-include=security.capability',
    '--warning=no-xattr-write',
];

# Register parser and writer for the container configuration files.
cfs_register_file('/lxc/', \&parse_pct_config, \&write_pct_config);
f76a2828 39
769fbfab
WB
# Property-string schema describing the container root file system.
# The 'volume' entry is marked as default_key.
my $rootfs_desc = {
    volume => {
        description => 'Volume, device or directory to mount into the container.',
        format_description => 'volume',
        format => 'pve-lxc-mp-string',
        default_key => 1,
        type => 'string',
    },
    backup => {
        description => 'Whether to include the mountpoint in backups.',
        format_description => '[1|0]',
        optional => 1,
        type => 'boolean',
    },
    size => {
        description => 'Volume size (read only value).',
        format_description => 'DiskSize',
        format => 'disk-size',
        optional => 1,
        type => 'string',
    },
    acl => {
        description => 'Explicitly enable or disable ACL support.',
        format_description => 'acl',
        optional => 1,
        type => 'boolean',
    },
    ro => {
        description => 'Read-only mountpoint (not supported with bind mounts)',
        format_description => 'ro',
        optional => 1,
        type => 'boolean',
    },
    quota => {
        description => 'Enable user quotas inside the container (not supported with zfs subvolumes)',
        format_description => '[0|1]',
        optional => 1,
        type => 'boolean',
    },
};
822de0c3 80
# Standard option for the container root file system; its value is a
# property string validated against $rootfs_desc.
PVE::JSONSchema::register_standard_option(
    'pve-ct-rootfs',
    {
        description => "Use volume as container root.",
        type => 'string',
        format => $rootfs_desc,
        optional => 1,
    },
);

# Standard option for snapshot names.
PVE::JSONSchema::register_standard_option(
    'pve-lxc-snapshot-name',
    {
        description => "The name of the snapshot.",
        type => 'string',
        format => 'pve-configid',
        maxLength => 40,
    },
);
92
# Schema of all options allowed in a container configuration file.
# check_type() validates values against it and json_config_properties()
# copies its entries into API property lists. The netN, mpN and unusedN
# entries are added further down in this file.
my $confdesc = {
    lock => {
        optional => 1,
        type => 'string',
        description => "Lock/unlock the VM.",
        enum => [qw(migrate backup snapshot rollback)],
    },
    onboot => {
        optional => 1,
        type => 'boolean',
        description => "Specifies whether a VM will be started during system bootup.",
        default => 0,
    },
    startup => get_standard_option('pve-startup-order'),
    template => {
        optional => 1,
        type => 'boolean',
        description => "Enable/disable Template.",
        default => 0,
    },
    arch => {
        optional => 1,
        type => 'string',
        enum => ['amd64', 'i386'],
        description => "OS architecture type.",
        default => 'amd64',
    },
    ostype => {
        optional => 1,
        type => 'string',
        enum => ['debian', 'ubuntu', 'centos', 'fedora', 'opensuse', 'archlinux', 'alpine', 'unmanaged'],
        description => "OS type. This is used to setup configuration inside the container, and corresponds to lxc setup scripts in /usr/share/lxc/config/<ostype>.common.conf. Value 'unmanaged' can be used to skip any OS specific setup.",
    },
    console => {
        optional => 1,
        type => 'boolean',
        description => "Attach a console device (/dev/console) to the container.",
        default => 1,
    },
    tty => {
        optional => 1,
        type => 'integer',
        description => "Specify the number of tty available to the container",
        minimum => 0,
        maximum => 6,
        default => 2,
    },
    cpulimit => {
        optional => 1,
        type => 'number',
        description => "Limit of CPU usage. Note if the computer has 2 CPUs, it has a total of '2' CPU time. Value '0' indicates no CPU limit.",
        minimum => 0,
        maximum => 128,
        default => 0,
    },
    cpuunits => {
        optional => 1,
        type => 'integer',
        description => "CPU weight for a VM. Argument is used in the kernel fair scheduler. The larger the number is, the more CPU time this VM gets. Number is relative to the weights of all the other running VMs.\n\nNOTE: You can disable fair-scheduler configuration by setting this to 0.",
        minimum => 0,
        maximum => 500000,
        default => 1024,
    },
    memory => {
        optional => 1,
        type => 'integer',
        description => "Amount of RAM for the VM in MB.",
        minimum => 16,
        default => 512,
    },
    swap => {
        optional => 1,
        type => 'integer',
        description => "Amount of SWAP for the VM in MB.",
        minimum => 0,
        default => 512,
    },
    hostname => {
        optional => 1,
        description => "Set a host name for the container.",
        type => 'string', format => 'dns-name',
        maxLength => 255,
    },
    description => {
        optional => 1,
        type => 'string',
        description => "Container description. Only used on the configuration web interface.",
    },
    searchdomain => {
        optional => 1,
        type => 'string', format => 'dns-name-list',
        description => "Sets DNS search domains for a container. Create will automatically use the setting from the host if you neither set searchdomain nor nameserver.",
    },
    nameserver => {
        optional => 1,
        type => 'string', format => 'address-list',
        description => "Sets DNS server IP address for a container. Create will automatically use the setting from the host if you neither set searchdomain nor nameserver.",
    },
    rootfs => get_standard_option('pve-ct-rootfs'),
    # 'parent' and 'snaptime' are snapshot bookkeeping; they are skipped by
    # json_config_properties().
    parent => {
        optional => 1,
        type => 'string', format => 'pve-configid',
        maxLength => 40,
        description => "Parent snapshot name. This is used internally, and should not be modified.",
    },
    snaptime => {
        optional => 1,
        description => "Timestamp for snapshots.",
        type => 'integer',
        minimum => 0,
    },
    cmode => {
        optional => 1,
        description => "Console mode. By default, the console command tries to open a connection to one of the available tty devices. By setting cmode to 'console' it tries to attach to /dev/console instead. If you set cmode to 'shell', it simply invokes a shell inside the container (no login).",
        type => 'string',
        enum => ['shell', 'console', 'tty'],
        default => 'tty',
    },
    protection => {
        optional => 1,
        type => 'boolean',
        description => "Sets the protection flag of the container. This will prevent the CT or CT's disk remove/update operation.",
        default => 0,
    },
    unprivileged => {
        optional => 1,
        type => 'boolean',
        description => "Makes the container run as unprivileged user. (Should not be modified manually.)",
        default => 0,
    },
};
224
e576f689
DM
# Raw 'lxc.*' keys that may appear in a container configuration file.
# A value of 1 means the key is passed through unchanged; any other true
# value is a message that parse_pct_config() prints as a warning while
# dropping the entry. Keys below 'lxc.cgroup.' are not listed here; the
# parser accepts them by prefix.
my $valid_lxc_conf_keys = {
    (map { $_ => 1 } qw(
        lxc.include
        lxc.arch
        lxc.utsname
        lxc.haltsignal
        lxc.rebootsignal
        lxc.stopsignal
        lxc.init_cmd
        lxc.network.type
        lxc.network.flags
        lxc.network.link
        lxc.network.mtu
        lxc.network.name
        lxc.network.hwaddr
        lxc.network.ipv4
        lxc.network.ipv4.gateway
        lxc.network.ipv6
        lxc.network.ipv6.gateway
        lxc.network.script.up
        lxc.network.script.down
        lxc.pts
        lxc.console.logfile
        lxc.console
        lxc.tty
        lxc.devttydir
        lxc.hook.autodev
        lxc.autodev
        lxc.kmsg
        lxc.mount
        lxc.mount.entry
        lxc.mount.auto
        lxc.rootfs.mount
        lxc.cap.drop
        lxc.cap.keep
        lxc.aa_profile
        lxc.aa_allow_incomplete
        lxc.se_context
        lxc.seccomp
        lxc.id_map
        lxc.hook.pre-start
        lxc.hook.pre-mount
        lxc.hook.mount
        lxc.hook.start
        lxc.hook.stop
        lxc.hook.post-stop
        lxc.hook.clone
        lxc.hook.destroy
        lxc.loglevel
        lxc.logfile
        lxc.start.auto
        lxc.start.delay
        lxc.start.order
        lxc.group
        lxc.environment
    )),
    # keys that are recognized but rejected with an explanation
    'lxc.rootfs' => 'lxc.rootfs is auto generated from rootfs',
    'lxc.rootfs.options' =>
        'lxc.rootfs.options is not supported, please use mountpoint options in the "rootfs" key',
};
284
769fbfab
WB
# Property-string schema for a single container network interface (netN).
# Also registered as the named format 'pve-lxc-network'.
my $netconf_desc = {
    type => {
        type => 'string',
        optional => 1,
        description => "Network interface type.",
        enum => [qw(veth)],
    },
    name => {
        type => 'string',
        format_description => 'String',
        description => 'Name of the network device as seen from inside the container. (lxc.network.name)',
        pattern => '[-_.\w\d]+',
    },
    bridge => {
        type => 'string',
        format_description => 'vmbr<Number>',
        description => 'Bridge to attach the network device to.',
        pattern => '[-_.\w\d]+',
        optional => 1,
    },
    hwaddr => {
        type => 'string',
        format_description => 'MAC',
        # this text used to be a copy of the 'bridge' description
        description => 'MAC address of the network device. (lxc.network.hwaddr)',
        pattern => qr/(?:[a-f0-9]{2}:){5}[a-f0-9]{2}/i,
        optional => 1,
    },
    mtu => {
        type => 'integer',
        format_description => 'Number',
        description => 'Maximum transfer unit of the interface. (lxc.network.mtu)',
        minimum => 64, # minimum ethernet frame is 64 bytes
        optional => 1,
    },
    ip => {
        type => 'string',
        format => 'pve-ipv4-config',
        format_description => 'IPv4Format/CIDR',
        description => 'IPv4 address in CIDR format.',
        optional => 1,
    },
    gw => {
        type => 'string',
        format => 'ipv4',
        format_description => 'GatewayIPv4',
        description => 'Default gateway for IPv4 traffic.',
        optional => 1,
    },
    ip6 => {
        type => 'string',
        format => 'pve-ipv6-config',
        format_description => 'IPv6Format/CIDR',
        description => 'IPv6 address in CIDR format.',
        optional => 1,
    },
    gw6 => {
        type => 'string',
        format => 'ipv6',
        format_description => 'GatewayIPv6',
        description => 'Default gateway for IPv6 traffic.',
        optional => 1,
    },
    firewall => {
        type => 'boolean',
        format_description => '[1|0]',
        description => "Controls whether this interface's firewall rules should be used.",
        optional => 1,
    },
    tag => {
        type => 'integer',
        format_description => 'VlanNo',
        minimum => '2',
        maximum => '4094',
        description => "VLAN tag for this interface.",
        optional => 1,
    },
    trunks => {
        type => 'string',
        pattern => qr/\d+(?:;\d+)*/,
        format_description => 'vlanid[;vlanid...]',
        description => "VLAN ids to pass through the interface",
        optional => 1,
    },
};
PVE::JSONSchema::register_format('pve-lxc-network', $netconf_desc);
370
27916659
DM
# Add the options net0 .. net9 to the configuration schema. Each option gets
# its own description hash whose value format is the network property string.
my $MAX_LXC_NETWORKS = 10;
foreach my $idx (0 .. $MAX_LXC_NETWORKS - 1) {
    my %netopt = (
        description => "Specifies network interfaces for the container.",
        type => 'string',
        format => $netconf_desc,
        optional => 1,
    );
    $confdesc->{"net$idx"} = \%netopt;
}

# Named format used by the 'volume' and 'mp' keys of mount point strings.
PVE::JSONSchema::register_format('pve-lxc-mp-string', \&verify_lxc_mp_string);
# Format verifier for mount point strings.
#
# Rejects strings that contain '/./' or '/../', that end in '/.' or '/..',
# or that start with '../'.
#
# Parameters: $mp - string to check, $noerr - return undef instead of dying.
# Returns the unchanged string when it is acceptable.
sub verify_lxc_mp_string {
    my ($mp, $noerr) = @_;

    my @forbidden = (
        qr@/\.\.?/@,   # '/./' or '/../' anywhere
        qr@/\.\.?$@,   # '/.' or '/..' at the end
        qr@^\.\./@,    # '../' at the beginning
    );

    foreach my $re (@forbidden) {
        next if $mp !~ $re;
        return undef if $noerr;
        die "$mp contains illegal character sequences\n";
    }

    return $mp;
}
397
769fbfab
WB
# Property-string schema for additional mount points: all keys of the
# rootfs schema plus the mandatory 'mp' key. Also registered as the named
# format 'pve-ct-mountpoint'.
my $mp_desc = { %$rootfs_desc };
$mp_desc->{mp} = {
    description => 'Path to the mountpoint as seen from inside the container.',
    format_description => 'Path',
    format => 'pve-lxc-mp-string',
    type => 'string',
};
PVE::JSONSchema::register_format('pve-ct-mountpoint', $mp_desc);
408
69202f71
WB
# Description shared by all unusedN options.
my $unuseddesc = {
    optional => 1,
    type => 'string', format => 'pve-volume-id',
    description => "Reference to unused volumes.",
};

# Add the options mp0 .. mp9 to the configuration schema. Each option gets
# its own description hash ('optional' used to be listed twice here).
my $MAX_MOUNT_POINTS = 10;
for (my $i = 0; $i < $MAX_MOUNT_POINTS; $i++) {
    $confdesc->{"mp$i"} = {
        optional => 1,
        type => 'string', format => $mp_desc,
        description => "Use volume as container mount point (experimental feature).",
    };
}

# Add the options unused0 .. unused9; they all share $unuseddesc. The loop is
# bounded by its own constant, which has the same value as $MAX_MOUNT_POINTS.
my $MAX_UNUSED_DISKS = $MAX_MOUNT_POINTS;
for (my $i = 0; $i < $MAX_UNUSED_DISKS; $i++) {
    $confdesc->{"unused$i"} = $unuseddesc;
}
429
27916659
DM
# Serialize a container configuration hash into the text of a config file.
#
# Parameters:
#   $filename - not used by this function
#   $conf     - configuration hash; its 'snapstate' key is deleted
#
# Returns the file content: the description as '#' comment lines, then the
# sorted 'key: value' lines, then the raw lxc entries, followed by one
# '[name]' section per snapshot in the same layout.
#
# Dies if a property value or a raw lxc entry contains a newline, because
# that would inject additional lines into the file.
sub write_pct_config {
    my ($filename, $conf) = @_;

    delete $conf->{snapstate}; # just to be sure

    # keys that are not written as plain 'key: value' lines
    my %skip = map { $_ => 1 } qw(digest description pending snapshots snapname lxc);

    my $generate_raw_config = sub {
        my ($section) = @_;

        my $raw = '';

        # add description as comment to top of file
        my $descr = $section->{description} || '';
        foreach my $cl (split(/\n/, $descr)) {
            $raw .= '#' . PVE::Tools::encode_text($cl) . "\n";
        }

        foreach my $key (sort keys %$section) {
            next if $skip{$key};
            my $value = $section->{$key};
            die "detected invalid newline inside property '$key'\n" if $value =~ m/\n/;
            $raw .= "$key: $value\n";
        }

        if (my $lxcconf = $section->{lxc}) {
            foreach my $entry (@$lxcconf) {
                my ($k, $v) = @$entry;
                # same protection as for the regular properties above
                die "detected invalid newline inside property '$k'\n"
                    if grep { defined($_) && m/\n/ } ($k, $v);
                $raw .= "$k: $v\n";
            }
        }

        return $raw;
    };

    my $raw = $generate_raw_config->($conf);

    foreach my $snapname (sort keys %{$conf->{snapshots}}) {
        $raw .= "\n[$snapname]\n";
        $raw .= $generate_raw_config->($conf->{snapshots}->{$snapname});
    }

    return $raw;
}
473
27916659
DM
# Validate and normalize a single configuration value.
#
# Parameters: $key - option name (must exist in $confdesc), $value - raw value.
# Returns the normalized value: 1/0 for booleans, an integer for integers
# and the unchanged value for numbers and strings (strings with a format
# are passed to PVE::JSONSchema::check_format first).
# Dies on unknown keys, undefined values, values containing a line break
# and values that do not match the type of the option.
sub check_type {
    my ($key, $value) = @_;

    my $desc = $confdesc->{$key};
    die "unknown setting '$key'\n" if !$desc;

    my $type = $desc->{type};

    die "got undefined value\n" if !defined($value);
    die "property contains a line feed\n" if $value =~ m/[\n\r]/;

    if ($type eq 'boolean') {
        return 1 if $value eq '1' || $value =~ m/^(on|yes|true)$/i;
        return 0 if $value eq '0' || $value =~ m/^(off|no|false)$/i;
        die "type check ('boolean') failed - got '$value'\n";
    }

    if ($type eq 'integer') {
        return int($1) if $value =~ m/^(\d+)$/;
        die "type check ('integer') failed - got '$value'\n";
    }

    if ($type eq 'number') {
        return $value if $value =~ m/^(\d+)(\.\d+)?$/;
        die "type check ('number') failed - got '$value'\n";
    }

    if ($type eq 'string') {
        my $fmt = $confdesc->{$key}->{format};
        PVE::JSONSchema::check_format($fmt, $value) if $fmt;
        return $value;
    }

    die "internal error"
}
509
# Parse the text of a container configuration file.
#
# Parameters:
#   $filename - path of the file; must end in '/lxc/<vmid>.conf', the vmid
#               is only used in warning messages
#   $raw      - file content, or undef
#
# Returns undef if $raw is undefined. Otherwise returns a hash with the
# options of the current configuration, a 'digest' (SHA1 hex of $raw) and a
# 'snapshots' hash holding one option hash per '[name]' section.
# Lines that cannot be parsed only produce a warning. Dies if the file name
# does not have the expected form.
sub parse_pct_config {
    my ($filename, $raw) = @_;

    return undef if !defined($raw);

    my $res = {
        digest => Digest::SHA::sha1_hex($raw),
        snapshots => {},
    };

    # the dot is escaped so that only a literal '.conf' suffix is accepted
    $filename =~ m|/lxc/(\d+)\.conf$|
        || die "got strange filename '$filename'";

    my $vmid = $1;

    my $conf = $res;   # section currently being filled
    my $descr = '';    # description collected for the current section
    my $section = '';

    my @lines = split(/\n/, $raw);
    foreach my $line (@lines) {
        next if $line =~ m/^\s*$/;

        # start of a snapshot section: store the pending description and
        # switch to a fresh hash for the snapshot
        if ($line =~ m/^\[([a-z][a-z0-9_\-]+)\]\s*$/i) {
            $section = $1;
            $conf->{description} = $descr if $descr;
            $descr = '';
            $conf = $res->{snapshots}->{$section} = {};
            next;
        }

        # comment lines make up the description
        if ($line =~ m/^\#(.*)\s*$/) {
            $descr .= PVE::Tools::decode_text($1) . "\n";
            next;
        }

        if ($line =~ m/^(lxc\.[a-z0-9_\-\.]+)(:|\s*=)\s*(.*?)\s*$/) {
            my $key = $1;
            my $value = $3;
            # 1 => allowed, other true value => message explaining the rejection
            my $validity = $valid_lxc_conf_keys->{$key} || 0;
            if ($validity eq 1 || $key =~ m/^lxc\.cgroup\./) {
                push @{$conf->{lxc}}, [$key, $value];
            } elsif (my $errmsg = $validity) {
                warn "vm $vmid - $key: $errmsg\n";
            } else {
                warn "vm $vmid - unable to parse config: $line\n";
            }
        } elsif ($line =~ m/^(description):\s*(.*\S)\s*$/) {
            $descr .= PVE::Tools::decode_text($2);
        } elsif ($line =~ m/^snapstate:\s*(prepare|delete)\s*$/) {
            # anchored at the start of the line, so keys that merely end in
            # 'snapstate' are not mistaken for it
            $conf->{snapstate} = $1;
        } elsif ($line =~ m/^([a-z][a-z_]*\d*):\s*(\S.*)\s*$/) {
            my $key = $1;
            my $value = $2;
            eval { $value = check_type($key, $value); };
            warn "vm $vmid - unable to parse value of '$key' - $@" if $@;
            # the raw value is stored even if the type check failed
            $conf->{$key} = $value;
        } else {
            warn "vm $vmid - unable to parse config: $line\n";
        }
    }

    $conf->{description} = $descr if $descr;

    delete $res->{snapstate}; # just to be sure

    return $res;
}
578
# List the containers of the local node.
#
# Returns a hash mapping each vmid from the cluster wide guest list whose
# node is the local node and whose type is 'lxc' to { type => 'lxc' }.
sub config_list {
    my $vmlist = PVE::Cluster::get_vmlist();

    my $ids = $vmlist ? $vmlist->{ids} : undef;
    return {} if !$ids;

    my %found;
    while (my ($vmid, $entry) = each %$ids) {
        next if !$vmid; # skip CT0
        my $node = $entry->{node};
        my $type = $entry->{type};
        next unless $node && $node eq $nodename;
        next unless $type && $type eq 'lxc';
        $found{$vmid} = { type => 'lxc' };
    }

    return \%found;
}
594
# Build the cluster file system path of a container configuration.
# $node defaults to the local node when it is not given (or false).
sub cfs_config_path {
    my ($vmid, $node) = @_;

    $node ||= $nodename;

    return 'nodes/' . $node . '/lxc/' . $vmid . '.conf';
}
601
9c2d4ce9
DM
# Return the absolute path below /etc/pve of a container configuration file.
sub config_file {
    my ($vmid, $node) = @_;

    return '/etc/pve/' . cfs_config_path($vmid, $node);
}
608
# Read the configuration of container $vmid through the cluster file system.
# $node defaults to the local node. Dies if no configuration is returned.
sub load_config {
    my ($vmid, $node) = @_;

    my $cfspath = cfs_config_path($vmid, $node || $nodename);
    my $conf = PVE::Cluster::cfs_read_file($cfspath);

    defined($conf)
        or die "container $vmid does not exist\n";

    return $conf;
}
620
5b4657d0
DM
# Write the configuration of a new container on the local node. The result
# of the directory creation attempt is not checked.
sub create_config {
    my ($vmid, $conf) = @_;

    mkdir "/etc/pve/nodes/$nodename/lxc";

    return write_config($vmid, $conf);
}
629
# Remove the configuration file of container $vmid on the local node.
# Returns the result of unlink.
sub destroy_config {
    my ($vmid) = @_;

    my $path = config_file($vmid, $nodename);

    return unlink $path;
}
635
f76a2828
DM
# Store $conf as the configuration of container $vmid on the local node.
sub write_config {
    my ($vmid, $conf) = @_;

    return PVE::Cluster::cfs_write_file(cfs_config_path($vmid), $conf);
}
643
# flock: we use one file handle per process, so lock file
# can be called multiple times and will succeed for the same process.

my $lock_handles = {};
my $lockdir = "/run/lock/lxc";

# Return the path of the lock file guarding the configuration of $vmid.
sub config_file_lock {
    my ($vmid) = @_;

    return $lockdir . '/pve-config-' . $vmid . '.lock';
}
655
# Run $code->(@param) while holding the configuration lock of $vmid.
#
# $timeout is handed to lock_file(). The lock directory is created when it
# is missing. Errors reported through $@ are re-thrown; otherwise the
# result of lock_file() is returned.
sub lock_config_full {
    my ($vmid, $timeout, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    -d $lockdir or mkdir $lockdir;

    my $result = lock_file($lockfile, $timeout, $code, @param);

    if ($@) {
        die $@;
    }

    return $result;
}
669
# Same as lock_config_full(), but passes the additional $shared flag on to
# lock_file_full().
sub lock_config_mode {
    my ($vmid, $timeout, $shared, $code, @param) = @_;

    my $lockfile = config_file_lock($vmid);

    -d $lockdir or mkdir $lockdir;

    my $result = lock_file_full($lockfile, $timeout, $shared, $code, @param);

    if ($@) {
        die $@;
    }

    return $result;
}
683
3cc56749
FG
# Run $code->(@param) under the configuration lock of $vmid, using a
# timeout value of 10.
sub lock_config {
    my ($vmid, $code, @param) = @_;

    my $timeout = 10;

    return lock_config_full($vmid, $timeout, $code, @param);
}
689
ec52ac21
DM
# Tell whether $name is a known configuration option.
sub option_exists {
    my ($name) = @_;

    my $desc = $confdesc->{$name};

    return defined($desc);
}
f76a2828
DM
695
# Add the JSON properties of all configuration options to $prop (used for
# the create and set functions). 'parent' and 'snaptime' are left out, and
# entries that already have a true value in $prop are kept.
# Returns $prop.
sub json_config_properties {
    my $prop = shift;

    my %internal = (parent => 1, snaptime => 1);

    for my $opt (grep { !$internal{$_} } keys %$confdesc) {
        $prop->{$opt} = $confdesc->{$opt} if !$prop->{$opt};
    }

    return $prop;
}
708
822de0c3
DM
# container status helpers

# Collect the ids of all containers that have a command socket listed in
# /proc/net/unix (a similar test is used by lxccontainers.c:
# list_active_containers).
#
# Returns a hash { vmid => 1 }; it is empty when the file cannot be opened.
sub list_active_containers {
    my $active = {};

    my $fh = IO::File->new("/proc/net/unix", "r");
    return $active if !$fh;

    while (defined(my $line = <$fh>)) {
        # the socket path is the last column of the line
        next if $line !~ m/^[a-f0-9]+:\s\S+\s\S+\s\S+\s\S+\s\S+\s\d+\s(\S+)$/;
        my $path = $1;

        if (my ($vmid) = $path =~ m!^@/var/lib/lxc/(\d+)/command$!) {
            $active->{$vmid} = 1;
        }
    }

    close($fh);

    return $active;
}
f76a2828 734
5c752bbf
DM
# Return 1 if container $vmid is listed as active, undef otherwise.
# warning: this is slow
sub check_running {
    my ($vmid) = @_;

    my $active = list_active_containers();

    return defined($active->{$vmid}) ? 1 : undef;
}
745
# Return the result of PVE::Tools::df() for the root directory of process
# $pid (/proc/$pid/root/). $vmid is not used.
sub get_container_disk_usage {
    my ($vmid, $pid) = @_;

    my $rootdir = "/proc/$pid/root/";

    return PVE::Tools::df($rootdir, 1);
}
751
688afc63
WL
# Per container CPU sample (time, used, cpu) remembered between calls of
# vmstatus().
my $last_proc_vmid_stat;

# Read cpuacct.stat of container $vmid and return a hash with 'utime' and
# 'stime'. The hash is empty if the content does not start with the
# expected 'user N' / 'system N' lines.
my $parse_cpuacct_stat = sub {
    my ($vmid) = @_;

    my $raw = read_cgroup_value('cpuacct', $vmid, 'cpuacct.stat', 1);

    if (my ($user, $system) = $raw =~ m/^user (\d+)\nsystem (\d+)\n/) {
        return { utime => $user, stime => $system };
    }

    return {};
};
770
f76a2828
DM
# Collect status information about containers.
#
# Parameters:
#   $opt_vmid - optional; restrict the result to this container, otherwise
#               all containers returned by config_list() are used
#
# Returns a hash { vmid => { ... } } with the keys type, pid (only if one
# was found), status, name, cpus, disk, maxdisk, mem, maxmem, swap, maxswap,
# uptime, cpu, netin, netout, diskread, diskwrite and template.
# The 'cpu' value is derived from the difference to the sample remembered
# in $last_proc_vmid_stat, so the first call for a container reports 0.
sub vmstatus {
    my ($opt_vmid) = @_;

    my $list = $opt_vmid ? { $opt_vmid => { type => 'lxc' }} : config_list();

    my $active_hash = list_active_containers();

    my $cpucount = $cpuinfo->{cpus} || 1;

    my $cdtime = gettimeofday;

    # first pass: static data from the configuration, defaults for counters
    foreach my $vmid (keys %$list) {
        my $d = $list->{$vmid};

        eval { $d->{pid} = find_lxc_pid($vmid) if defined($active_hash->{$vmid}); };
        warn $@ if $@; # ignore errors (consider them stopped)

        $d->{status} = $d->{pid} ? 'running' : 'stopped';

        my $cfspath = cfs_config_path($vmid);
        my $conf = PVE::Cluster::cfs_read_file($cfspath) || {};

        $d->{name} = $conf->{'hostname'} || "CT$vmid";
        $d->{name} =~ s/[\s]//g;

        $d->{cpus} = $conf->{cpulimit} || $cpucount;

        if ($d->{pid}) {
            my $res = get_container_disk_usage($vmid, $d->{pid});
            $d->{disk} = $res->{used};
            $d->{maxdisk} = $res->{total};
        } else {
            $d->{disk} = 0;
            # use 4GB by default ??
            if (my $rootfs = $conf->{rootfs}) {
                my $rootinfo = parse_ct_rootfs($rootfs);
                # NOTE(review): this treats the parsed size as a number of GB -
                # confirm against the unit returned by parse_size()
                $d->{maxdisk} = int(($rootinfo->{size} || 4)*1024*1024)*1024;
            } else {
                $d->{maxdisk} = 4*1024*1024*1024;
            }
        }

        $d->{mem} = 0;
        $d->{swap} = 0;
        $d->{maxmem} = ($conf->{memory}||512)*1024*1024;
        $d->{maxswap} = ($conf->{swap}//0)*1024*1024;

        $d->{uptime} = 0;
        $d->{cpu} = 0;

        $d->{netout} = 0;
        $d->{netin} = 0;

        $d->{diskread} = 0;
        $d->{diskwrite} = 0;

        $d->{template} = is_template($conf);
    }

    # second pass: runtime counters of running containers
    foreach my $vmid (keys %$list) {
        my $d = $list->{$vmid};
        my $pid = $d->{pid};

        next if !$pid; # skip stopped CTs

        my $ctime = (stat("/proc/$pid"))[10]; # 10 = ctime
        # the method lxcfs uses; stat returns nothing if the process is
        # already gone, in which case the default of 0 is kept
        $d->{uptime} = time - $ctime if defined($ctime);

        $d->{mem} = read_cgroup_value('memory', $vmid, 'memory.usage_in_bytes');
        $d->{swap} = read_cgroup_value('memory', $vmid, 'memory.memsw.usage_in_bytes') - $d->{mem};

        my $blkio_bytes = read_cgroup_value('blkio', $vmid, 'blkio.throttle.io_service_bytes', 1);
        foreach my $byte (split(/\n/, $blkio_bytes)) {
            if (my ($key, $value) = $byte =~ /(Read|Write)\s+(\d+)/) {
                $d->{diskread} = $value if $key eq 'Read';
                $d->{diskwrite} = $value if $key eq 'Write';
            }
        }

        my $pstat = $parse_cpuacct_stat->($vmid);

        # the hash is empty if cpuacct.stat could not be parsed
        my $used = ($pstat->{utime} // 0) + ($pstat->{stime} // 0);

        my $old = $last_proc_vmid_stat->{$vmid};
        if (!$old) {
            # first sample for this container, nothing to compare with yet
            $last_proc_vmid_stat->{$vmid} = {
                time => $cdtime,
                used => $used,
                cpu => 0,
            };
            next;
        }

        my $dtime = ($cdtime - $old->{time}) * $cpucount * $cpuinfo->{user_hz};

        if ($dtime > 1000) {
            my $dutime = $used - $old->{used};

            $d->{cpu} = (($dutime/$dtime)* $cpucount) / $d->{cpus};
            $last_proc_vmid_stat->{$vmid} = {
                time => $cdtime,
                used => $used,
                cpu => $d->{cpu},
            };
        } else {
            # interval too short for a new sample, report the previous value
            $d->{cpu} = $old->{cpu};
        }
    }

    my $netdev = PVE::ProcFSTools::read_proc_net_dev();

    foreach my $dev (keys %$netdev) {
        next if $dev !~ m/^veth([1-9]\d*)i/;
        my $vmid = $1;
        my $d = $list->{$vmid};

        next if !$d;

        # NOTE(review): 'receive' is added to netout and 'transmit' to netin -
        # presumably because the counters belong to the host side of the
        # device; confirm before changing
        $d->{netout} += $netdev->{$dev}->{receive};
        $d->{netin} += $netdev->{$dev}->{transmit};
    }

    return $list;
}
899
7c921c80
WB
# Classify the 'volume' part of a mount point:
#   'device' - path below /dev/
#   'bind'   - any other path starting with '/'
#   'volume' - everything else
sub classify_mountpoint {
    my ($vol) = @_;

    return 'volume' if $vol !~ m!^/!;

    return $vol =~ m!^/dev/! ? 'device' : 'bind';
}
908
44a9face
DM
# Parse a mount point property string according to schema $desc.
#
# Parameters:
#   $desc  - property string schema ($rootfs_desc or $mp_desc)
#   $data  - property string, undef is treated as ''
#   $noerr - return undef instead of dying on invalid input
#
# Returns the parsed hash; 'size' is replaced by the result of
# PVE::JSONSchema::parse_size() and 'type' is set by classify_mountpoint().
my $parse_ct_mountpoint_full = sub {
    my ($desc, $data, $noerr) = @_;

    $data //= '';

    my $res;
    eval { $res = PVE::JSONSchema::parse_property_string($desc, $data) };
    if ($@) {
        return undef if $noerr;
        die $@;
    }

    if (defined(my $size = $res->{size})) {
        # keep the original text so that the error message can show it
        my $parsed = PVE::JSONSchema::parse_size($size);
        if (!defined($parsed)) {
            return undef if $noerr;
            die "invalid size: $size\n";
        }
        $res->{size} = $parsed;
    }

    $res->{type} = classify_mountpoint($res->{volume});

    return $res;
};
934
# Parse a 'rootfs' property string. The mount path 'mp' of the result is
# always '/'. With $noerr set, undef is returned for invalid input.
sub parse_ct_rootfs {
    my ($data, $noerr) = @_;

    my $rootfs = $parse_ct_mountpoint_full->($rootfs_desc, $data, $noerr);

    if (defined($rootfs)) {
        $rootfs->{mp} = '/';
    }

    return $rootfs;
}
944
# Parse an 'mpN' property string. With $noerr set, undef is returned for
# invalid input.
sub parse_ct_mountpoint {
    my ($data, $noerr) = @_;

    return $parse_ct_mountpoint_full->($mp_desc, $data, $noerr);
}
7dfc49cc 950
# Turn a parsed mount point back into a property string. The 'type' key is
# always left out; 'mp' is left out as well when $nomp is set.
sub print_ct_mountpoint {
    my ($info, $nomp) = @_;

    my @skip = ('type', $nomp ? 'mp' : ());

    return PVE::JSONSchema::print_property_string($info, $mp_desc, \@skip);
}
957
# Turn a parsed network configuration back into a property string.
sub print_lxc_network {
    my ($net) = @_;

    return PVE::JSONSchema::print_property_string($net, $netconf_desc);
}
962
7dfc49cc
DM
# Parse a 'netN' property string.
#
# Returns an empty hash for empty input. Otherwise the parsed hash is
# returned with 'type' set to 'veth' and, if no 'hwaddr' was given, a
# randomly generated one.
sub parse_lxc_network {
    my ($data) = @_;

    return {} if !$data;

    my $net = PVE::JSONSchema::parse_property_string($netconf_desc, $data);

    $net->{type} = 'veth';
    if (!$net->{hwaddr}) {
        $net->{hwaddr} = PVE::Tools::random_ether_addr();
    }

    return $net;
}
f76a2828 977
238a56cb
DM
# Read the cgroup file $name of container $vmid in controller $group.
# Returns the whole file content if $full is set, else only the first line.
sub read_cgroup_value {
    my ($group, $vmid, $name, $full) = @_;

    my $path = "/sys/fs/cgroup/$group/lxc/$vmid/$name";

    return $full
        ? PVE::Tools::file_get_contents($path)
        : PVE::Tools::file_read_firstline($path);
}
987
bf0b8c43
AD
# Write $value to the cgroup file $name of container $vmid in controller
# $group. Nothing is written if the file does not exist.
sub write_cgroup_value {
    my ($group, $vmid, $name, $value) = @_;

    my $path = "/sys/fs/cgroup/$group/lxc/$vmid/$name";

    if (-e $path) {
        PVE::ProcFSTools::write_proc_entry($path, $value);
    }
}
995
52f1d76b
DM
# Find running 'lxc-console -n <vmid>' processes by scanning /proc.
#
# Returns a hash { vmid => [ pid, ... ] }.
sub find_lxc_console_pids {
    my $consoles = {};

    PVE::Tools::dir_glob_foreach('/proc', '\d+', sub {
        my ($pid) = @_;

        my $cmdline = PVE::Tools::file_read_firstline("/proc/$pid/cmdline");
        return if !$cmdline;

        # search for lxc-console -n <vmid>: exactly three arguments
        my ($cmd, $flag, $vmid, @extra) = split(/\0/, $cmdline);
        return if @extra || !defined($vmid);

        return if $flag ne '-n';
        return if $vmid !~ m/^\d+$/;
        return if $cmd !~ m|^(/usr/bin/)?lxc-console$|;

        push @{$consoles->{$vmid}}, $pid;
    });

    return $consoles;
}
1021
bedeaaf1
AD
# Return the PID reported by 'lxc-info -n <vmid> -p'.
# Dies if the output contains no 'PID:' line with a non-zero value.
sub find_lxc_pid {
    my ($vmid) = @_;

    my $pid;

    PVE::Tools::run_command(
        ['lxc-info', '-n', $vmid, '-p'],
        outfunc => sub {
            my ($line) = @_;
            $pid = $1 if $line =~ m/^PID:\s+(\d+)$/;
        },
    );

    die "unable to get PID for CT $vmid (not running?)\n" if !$pid;

    return $pid;
}
1036
# Split an IPv4 address in CIDR notation into address and netmask.
# Note: we cannot use Net::IP, because that only allows strict
# CIDR networks
#
# Accepts prefix lengths from 8 to 32. Returns { address, netmask }; on
# invalid input it dies, or returns undef if $noerr is set.
sub parse_ipv4_cidr {
    my ($cidr, $noerr) = @_;

    my ($address, $bits) = $cidr =~ m!^($IPV4RE)(?:/(\d+))$!;

    if (defined($bits) && $bits > 7 && $bits <= 32) {
        return {
            address => $address,
            netmask => $PVE::Network::ipv4_reverse_mask->[$bits],
        };
    }

    return undef if $noerr;

    die "unable to parse ipv4 address/mask\n";
}
93285df8 1050
a12a36e0
WL
# Die if the configuration $conf carries a lock; the message names the lock.
sub check_lock {
    my ($conf) = @_;

    my $lock = $conf->{'lock'};

    die "VM is locked ($lock)\n" if $lock;
}
1056
e22af68f
AG
# Die with "$err_msg - protection mode enabled" if the protection flag of
# the configuration $vm_conf is set.
sub check_protection {
    my ($vm_conf, $err_msg) = @_;

    return if !$vm_conf->{protection};

    die "$err_msg - protection mode enabled\n";
}
1064
# Generate the native LXC configuration file /var/lib/lxc/$vmid/config from
# the PVE container config $conf.
#
# For templates the config file is removed instead and nothing is written.
# Dies if 'arch' or 'ostype' is missing or the ostype is not handled here.
# $storage_cfg is accepted but not used in this function.
sub update_lxc_config {
    my ($storage_cfg, $vmid, $conf) = @_;

    my $dir = "/var/lib/lxc/$vmid";

    if ($conf->{template}) {
        unlink "$dir/config";
        return;
    }

    my $raw = '';

    die "missing 'arch' - internal error" if !$conf->{arch};
    $raw .= "lxc.arch = $conf->{arch}\n";

    my $unprivileged = $conf->{unprivileged};
    # number of user supplied raw 'lxc.id_map' entries
    my $custom_idmap = grep { $_->[0] eq 'lxc.id_map' } @{$conf->{lxc}};

    my $ostype = $conf->{ostype} || die "missing 'ostype' - internal error";
    if ($ostype =~ /^(?:debian | ubuntu | centos | fedora | opensuse | archlinux | alpine | unmanaged)$/x) {
        # prefer the distribution specific include, fall back to the generic one
        my $inc ="/usr/share/lxc/config/$ostype.common.conf";
        $inc ="/usr/share/lxc/config/common.conf" if !-f $inc;
        $raw .= "lxc.include = $inc\n";
        if ($unprivileged || $custom_idmap) {
            $inc = "/usr/share/lxc/config/$ostype.userns.conf";
            $inc = "/usr/share/lxc/config/userns.conf" if !-f $inc;
            $raw .= "lxc.include = $inc\n"
        }
    } else {
        die "implement me (ostype $ostype)";
    }

    # WARNING: DO NOT REMOVE this without making sure that loop device nodes
    # cannot be exposed to the container with r/w access (cgroup perms).
    # When this is enabled mounts will still remain in the monitor's namespace
    # after the container unmounted them and thus will not detach from their
    # files while the container is running!
    $raw .= "lxc.monitor.unshare = 1\n";

    # Should we read them from /etc/subuid?
    if ($unprivileged && !$custom_idmap) {
        $raw .= "lxc.id_map = u 0 100000 65536\n";
        $raw .= "lxc.id_map = g 0 100000 65536\n";
    }

    if (!has_dev_console($conf)) {
        $raw .= "lxc.console = none\n";
        $raw .= "lxc.cgroup.devices.deny = c 5:1 rwm\n";
    }

    my $ttycount = get_tty_count($conf);
    $raw .= "lxc.tty = $ttycount\n";

    # some init scripts expect a linux terminal (turnkey).
    $raw .= "lxc.environment = TERM=linux\n";

    my $utsname = $conf->{hostname} || "CT$vmid";
    $raw .= "lxc.utsname = $utsname\n";

    my $memory = $conf->{memory} || 512;
    my $swap = $conf->{swap} // 0;

    my $lxcmem = int($memory*1024*1024);
    $raw .= "lxc.cgroup.memory.limit_in_bytes = $lxcmem\n";

    # memsw limit covers memory and swap together
    my $lxcswap = int(($memory + $swap)*1024*1024);
    $raw .= "lxc.cgroup.memory.memsw.limit_in_bytes = $lxcswap\n";

    if (my $cpulimit = $conf->{cpulimit}) {
        $raw .= "lxc.cgroup.cpu.cfs_period_us = 100000\n";
        my $value = int(100000*$cpulimit);
        $raw .= "lxc.cgroup.cpu.cfs_quota_us = $value\n";
    }

    my $shares = $conf->{cpuunits} || 1024;
    $raw .= "lxc.cgroup.cpu.shares = $shares\n";

    # NOTE(review): the parsed result is not used below; presumably this call
    # is kept so an unparsable rootfs entry is noticed here - confirm.
    my $mountpoint = parse_ct_rootfs($conf->{rootfs});

    $raw .= "lxc.rootfs = $dir/rootfs\n";

    # Emit the netN sections in numeric index order so the generated file does
    # not depend on Perl's (unstable) hash key order.
    my @netids = sort { $a <=> $b } map { m/^net(\d+)$/ ? $1 : () } keys %$conf;

    my $netcount = 0;
    foreach my $ind (@netids) {
        my $d = parse_lxc_network($conf->{"net$ind"});
        $netcount++;
        $raw .= "lxc.network.type = veth\n";
        $raw .= "lxc.network.veth.pair = veth${vmid}i${ind}\n";
        $raw .= "lxc.network.hwaddr = $d->{hwaddr}\n" if defined($d->{hwaddr});
        $raw .= "lxc.network.name = $d->{name}\n" if defined($d->{name});
        $raw .= "lxc.network.mtu = $d->{mtu}\n" if defined($d->{mtu});
    }

    # raw lxc.* entries are appended verbatim, in their stored order
    if (my $lxcconf = $conf->{lxc}) {
        foreach my $entry (@$lxcconf) {
            my ($k, $v) = @$entry;
            $netcount++ if $k eq 'lxc.network.type';
            $raw .= "$k = $v\n";
        }
    }

    $raw .= "lxc.network.type = empty\n" if !$netcount;

    File::Path::mkpath("$dir/rootfs");

    PVE::Tools::file_set_contents("$dir/config", $raw);
}
1175
117636e5
DM
# verify and cleanup nameserver list (replace \0 with ' ')
#
# Every entry is checked with PVE::JSONSchema::pve_verify_ip; the entries are
# returned joined by single spaces.
sub verify_nameserver_list {
    my ($nameserver_list) = @_;

    my @servers = PVE::Tools::split_list($nameserver_list);
    foreach my $ip (@servers) {
        PVE::JSONSchema::pve_verify_ip($ip);
    }

    return join(' ', @servers);
}
1188
# Split a search domain list and return its entries joined by single spaces.
sub verify_searchdomain_list {
    my ($searchdomain_list) = @_;

    # todo: should we add checks for valid dns domains?
    my @domains = PVE::Tools::split_list($searchdomain_list);

    return join(' ', @domains);
}
1200
12e95ae4
FG
# Return 1 if any mountpoint of $config is of type 'volume' and refers to
# $volid, 0 otherwise.
sub is_volume_in_use {
    my ($config, $volid) = @_;

    my $in_use = 0;

    my $check = sub {
        my ($ms, $mountpoint) = @_;
        return if $in_use; # already found, nothing more to check
        return if $mountpoint->{type} ne 'volume';
        $in_use = 1 if $mountpoint->{volume} eq $volid;
    };
    foreach_mountpoint($config, $check);

    return $in_use;
}
1215
69202f71
WB
# Record $volid under the lowest free "unusedN" key of $config and return
# that key. Returns nothing if the volume is already listed as unused; dies
# if all $MAX_UNUSED_DISKS slots are taken.
sub add_unused_volume {
    my ($config, $volid) = @_;

    my $key;
    foreach my $ind (0 .. $MAX_UNUSED_DISKS - 1) {
        my $slot = "unused$ind";
        my $vid = $config->{$slot};
        if ($vid) {
            return if $vid eq $volid; # do not add duplicates
        } else {
            $key //= $slot; # remember only the first (lowest) free slot
        }
    }

    die "Too many unused volumes - please delete them first.\n" if !$key;

    $config->{$key} = $volid;

    return $key;
}
1235
# Apply option deletions ($delete, array ref of option names) and option
# changes ($param, hash ref) to the container config $conf.
#
# When $running is true, changes that can be applied live are applied and the
# config is written after each handled option; options that cannot be changed
# on a running container are collected and reported with a die at the very
# end. When $running is false only $conf is modified (plus volume
# deletion/creation at the end).
sub update_pct_config {
    my ($vmid, $conf, $running, $param, $delete) = @_;

    my @nohotplug;

    my $new_disks = 0;
    my @deleted_volumes;

    my $rootdir;
    if ($running) {
        my $pid = find_lxc_pid($vmid);
        $rootdir = "/proc/$pid/root";
    }

    # Returns 1 (and remembers the option names) if the container is running,
    # i.e. the caller must skip the option; returns 0 otherwise.
    my $hotplug_error = sub {
        if ($running) {
            push @nohotplug, @_;
            return 1;
        } else {
            return 0;
        }
    };

    if (defined($delete)) {
        foreach my $opt (@$delete) {
            if (!exists($conf->{$opt})) {
                warn "no such option: $opt\n";
                next;
            }

            if ($opt eq 'hostname' || $opt eq 'memory' || $opt eq 'rootfs') {
                die "unable to delete required option '$opt'\n";
            } elsif ($opt eq 'swap') {
                delete $conf->{$opt};
                write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", -1);
            } elsif ($opt eq 'description' || $opt eq 'onboot' || $opt eq 'startup') {
                delete $conf->{$opt};
            } elsif ($opt eq 'nameserver' || $opt eq 'searchdomain' ||
                     $opt eq 'tty' || $opt eq 'console' || $opt eq 'cmode') {
                next if $hotplug_error->($opt);
                delete $conf->{$opt};
            } elsif ($opt =~ m/^net(\d+)$/) {
                # \d+ (not \d) so multi-digit interfaces match, consistent
                # with the 'netN' handling in the update loop below
                my $netid = $1;
                delete $conf->{$opt};
                next if !$running;
                PVE::Network::veth_delete("veth${vmid}i$netid");
            } elsif ($opt eq 'protection') {
                delete $conf->{$opt};
            } elsif ($opt =~ m/^unused(\d+)$/) {
                next if $hotplug_error->($opt);
                check_protection($conf, "can't remove CT $vmid drive '$opt'");
                push @deleted_volumes, $conf->{$opt};
                delete $conf->{$opt};
            } elsif ($opt =~ m/^mp(\d+)$/) {
                next if $hotplug_error->($opt);
                check_protection($conf, "can't remove CT $vmid drive '$opt'");
                my $mp = parse_ct_mountpoint($conf->{$opt});
                delete $conf->{$opt};
                # keep a reference to the volume unless something else uses it
                if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
                    add_unused_volume($conf, $mp->{volume});
                }
            } elsif ($opt eq 'unprivileged') {
                die "unable to delete read-only option: '$opt'\n";
            } else {
                die "implement me (delete: $opt)"
            }
            write_config($vmid, $conf) if $running;
        }
    }

    # There's no separate swap size to configure, there's memory and "total"
    # memory (iow. memory+swap). This means we have to change them together.
    my $wanted_memory = PVE::Tools::extract_param($param, 'memory');
    my $wanted_swap = PVE::Tools::extract_param($param, 'swap');
    if (defined($wanted_memory) || defined($wanted_swap)) {

        my $old_memory = ($conf->{memory} || 512);
        my $old_swap = ($conf->{swap} || 0);

        $wanted_memory //= $old_memory;
        $wanted_swap //= $old_swap;

        my $total = $wanted_memory + $wanted_swap;
        if ($running) {
            my $old_total = $old_memory + $old_swap;
            # The write order of the two limits depends on whether the total
            # grows or shrinks.
            if ($total > $old_total) {
                write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", int($total*1024*1024));
                write_cgroup_value("memory", $vmid, "memory.limit_in_bytes", int($wanted_memory*1024*1024));
            } else {
                write_cgroup_value("memory", $vmid, "memory.limit_in_bytes", int($wanted_memory*1024*1024));
                write_cgroup_value("memory", $vmid, "memory.memsw.limit_in_bytes", int($total*1024*1024));
            }
        }
        $conf->{memory} = $wanted_memory;
        $conf->{swap} = $wanted_swap;

        write_config($vmid, $conf) if $running;
    }

    # volume IDs referenced by mountpoints/rootfs set in this call
    my $used_volids = {};

    foreach my $opt (keys %$param) {
        my $value = $param->{$opt};
        if ($opt eq 'hostname') {
            $conf->{$opt} = $value;
        } elsif ($opt eq 'onboot') {
            $conf->{$opt} = $value ? 1 : 0;
        } elsif ($opt eq 'startup') {
            $conf->{$opt} = $value;
        } elsif ($opt eq 'tty' || $opt eq 'console' || $opt eq 'cmode') {
            next if $hotplug_error->($opt);
            $conf->{$opt} = $value;
        } elsif ($opt eq 'nameserver') {
            next if $hotplug_error->($opt);
            my $list = verify_nameserver_list($value);
            $conf->{$opt} = $list;
        } elsif ($opt eq 'searchdomain') {
            next if $hotplug_error->($opt);
            my $list = verify_searchdomain_list($value);
            $conf->{$opt} = $list;
        } elsif ($opt eq 'cpulimit') {
            next if $hotplug_error->($opt); # FIXME: hotplug
            $conf->{$opt} = $value;
        } elsif ($opt eq 'cpuunits') {
            $conf->{$opt} = $value;
            write_cgroup_value("cpu", $vmid, "cpu.shares", $value);
        } elsif ($opt eq 'description') {
            $conf->{$opt} = PVE::Tools::encode_text($value);
        } elsif ($opt =~ m/^net(\d+)$/) {
            my $netid = $1;
            my $net = parse_lxc_network($value);
            if (!$running) {
                $conf->{$opt} = print_lxc_network($net);
            } else {
                update_net($vmid, $conf, $opt, $net, $netid, $rootdir);
            }
        } elsif ($opt eq 'protection') {
            $conf->{$opt} = $value ? 1 : 0;
        } elsif ($opt =~ m/^mp(\d+)$/) {
            next if $hotplug_error->($opt);
            check_protection($conf, "can't update CT $vmid drive '$opt'");
            my $old = $conf->{$opt};
            $conf->{$opt} = $value;
            if (defined($old)) {
                my $mp = parse_ct_mountpoint($old);
                if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
                    add_unused_volume($conf, $mp->{volume});
                }
            }
            $new_disks = 1;
            my $mp = parse_ct_mountpoint($value);
            $used_volids->{$mp->{volume}} = 1;
        } elsif ($opt eq 'rootfs') {
            next if $hotplug_error->($opt);
            check_protection($conf, "can't update CT $vmid drive '$opt'");
            my $old = $conf->{$opt};
            $conf->{$opt} = $value;
            if (defined($old)) {
                my $mp = parse_ct_rootfs($old);
                if ($mp->{type} eq 'volume' && !is_volume_in_use($conf, $mp->{volume})) {
                    add_unused_volume($conf, $mp->{volume});
                }
            }
            my $mp = parse_ct_rootfs($value);
            $used_volids->{$mp->{volume}} = 1;
        } elsif ($opt eq 'unprivileged') {
            die "unable to modify read-only option: '$opt'\n";
        } elsif ($opt eq 'ostype') {
            next if $hotplug_error->($opt);
            $conf->{$opt} = $value;
        } else {
            die "implement me: $opt";
        }
        write_config($vmid, $conf) if $running;
    }

    # Cleanup config:

    # Remove unused disks after re-adding
    foreach my $key (keys %$conf) {
        next if $key !~ /^unused\d+$/;
        my $volid = $conf->{$key};
        if ($used_volids->{$volid}) {
            delete $conf->{$key};
        }
    }

    # Apply deletions and creations of new volumes
    if (@deleted_volumes) {
        my $storage_cfg = PVE::Storage::config();
        foreach my $volume (@deleted_volumes) {
            next if $used_volids->{$volume}; # could have been re-added, too
            delete_mountpoint_volume($storage_cfg, $vmid, $volume);
        }
    }

    if ($new_disks) {
        my $storage_cfg = PVE::Storage::config();
        create_disks($storage_cfg, $vmid, $conf, $conf);
    }

    # This should be the last thing we do here
    if ($running && scalar(@nohotplug)) {
        die "unable to modify " . join(',', @nohotplug) . " while container is running\n";
    }
}
c325b32f 1442
6f035afe
DM
# True unless 'console' is explicitly set to a false value in the config.
sub has_dev_console {
    my ($conf) = @_;

    return !defined($conf->{console}) || !!$conf->{console};
}
1448
0d0ca400
DM
# Configured 'tty' value, or the schema default when it is not defined.
sub get_tty_count {
    my ($conf) = @_;

    my $count = $conf->{tty};

    return defined($count) ? $count : $confdesc->{tty}->{default};
}
1454
aca816ad
DM
# Configured 'cmode' value, or the schema default when it is not defined.
sub get_cmode {
    my ($conf) = @_;

    my $cmode = $conf->{cmode};

    return defined($cmode) ? $cmode : $confdesc->{cmode}->{default};
}
1460
# Build the command (array ref) used to open a console for the container,
# depending on its console mode ('console', 'tty' or 'shell').
sub get_console_command {
    my ($vmid, $conf) = @_;

    my $cmode = get_cmode($conf);

    return ['lxc-console', '-n', $vmid, '-t', 0] if $cmode eq 'console';
    return ['lxc-console', '-n', $vmid] if $cmode eq 'tty';
    return ['lxc-attach', '--clear-env', '-n', $vmid] if $cmode eq 'shell';

    die "internal error";
}
1476
c325b32f
DM
# Return ($ipv4, $ipv6) taken from the net0 entry of the config, with any
# trailing "/prefixlen" removed. Keyword values (dhcp, manual, and auto for
# IPv6) yield undef. Returns undef if there is no net0 entry.
sub get_primary_ips {
    my ($conf) = @_;

    # return data from net0

    return undef if !defined($conf->{net0});
    my $net = parse_lxc_network($conf->{net0});

    # Falsy values pass through untouched, keywords become undef, everything
    # else loses its prefix length.
    my $plain_address = sub {
        my ($addr, $keywords) = @_;
        return $addr if !$addr;
        return undef if $addr =~ $keywords;
        $addr =~ s!/\d+$!!;
        return $addr;
    };

    my $ipv4 = $plain_address->($net->{ip}, qr/^(dhcp|manual)$/);
    my $ipv6 = $plain_address->($net->{ip6}, qr/^(auto|dhcp|manual)$/);

    return ($ipv4, $ipv6);
}
148d1cb4 1504
b407293b
WB
# Free the storage volume behind a mountpoint, but only if the mountpoint is
# classified as a 'volume' and the volume is owned by container $vmid.
sub delete_mountpoint_volume {
    my ($storage_cfg, $vmid, $volume) = @_;

    return if classify_mountpoint($volume) ne 'volume';

    my ($vtype, $name, $owner) = PVE::Storage::parse_volname($storage_cfg, $volume);

    # A volume without owner information is never ours; checking defined()
    # avoids a numeric comparison against undef.
    return if !defined($owner);

    PVE::Storage::vdisk_free($storage_cfg, $volume) if $vmid == $owner;
}
ef241384 1513
# Remove a container: free the volumes of all its mountpoints, remove the
# /var/lib/lxc/$vmid directory contents created for it, and destroy its config.
sub destroy_lxc_container {
    my ($storage_cfg, $vmid, $conf) = @_;

    my $free_volume = sub {
        my ($ms, $mountpoint) = @_;
        delete_mountpoint_volume($storage_cfg, $vmid, $mountpoint->{volume});
    };
    foreach_mountpoint($conf, $free_volume);

    my $ctdir = "/var/lib/lxc/$vmid";
    rmdir "$ctdir/rootfs";
    unlink "$ctdir/config";
    rmdir $ctdir;
    destroy_config($vmid);

    #my $cmd = ['lxc-destroy', '-n', $vmid ];
    #PVE::Tools::run_command($cmd);
}
68fba17b 1530
# After a container stopped: deactivate its volumes unless $keepActive is set.
# Errors are only reported as warnings.
sub vm_stop_cleanup {
    my ($storage_cfg, $vmid, $conf, $keepActive) = @_;

    eval {
        return if $keepActive; # leaves the eval block only

        my $vollist = get_vm_volumes($conf);
        PVE::Storage::deactivate_volumes($storage_cfg, $vollist);
    };
    warn $@ if $@; # avoid errors - just warn
}
1543
93cdbbfb
AD
# Numeric "not equal" that tolerates undef: two undefs are equal, undef and a
# defined value differ.
my $safe_num_ne = sub {
    my ($left, $right) = @_;

    if (defined($left) && defined($right)) {
        return $left != $right;
    }

    return (defined($left) || defined($right)) ? 1 : 0;
};
1553
# String "not equal" that tolerates undef: two undefs are equal, undef and a
# defined value differ.
my $safe_string_ne = sub {
    my ($left, $right) = @_;

    if (defined($left) && defined($right)) {
        return $left ne $right;
    }

    return (defined($left) || defined($right)) ? 1 : 0;
};
1563
# Apply a changed network interface definition ($newnet) for option $opt to a
# running container, then update its IP configuration.
#
# - no previous entry, or hwaddr/name changed: (re)create the veth pair
# - only bridge/tag/firewall changed: re-plug the existing veth device
# Only interfaces of type 'veth' are supported.
sub update_net {
    my ($vmid, $conf, $opt, $newnet, $netid, $rootdir) = @_;

    # for when there are physical interfaces
    die "cannot update interface of type $newnet->{type}"
        if $newnet->{type} ne 'veth';

    my $veth = "veth${vmid}i${netid}";
    my $eth = $newnet->{name};

    my @plug_props = qw(bridge tag firewall);

    my $oldnetcfg = $conf->{$opt};
    if (!$oldnetcfg) {
        hotplug_net($vmid, $conf, $opt, $newnet, $netid);
    } else {
        my $oldnet = parse_lxc_network($oldnetcfg);

        my $recreate = $safe_string_ne->($oldnet->{hwaddr}, $newnet->{hwaddr})
            || $safe_string_ne->($oldnet->{name}, $newnet->{name});

        if ($recreate) {
            PVE::Network::veth_delete($veth);
            delete $conf->{$opt};
            write_config($vmid, $conf);

            hotplug_net($vmid, $conf, $opt, $newnet, $netid);
        } elsif ($safe_string_ne->($oldnet->{bridge}, $newnet->{bridge})
            || $safe_num_ne->($oldnet->{tag}, $newnet->{tag})
            || $safe_num_ne->($oldnet->{firewall}, $newnet->{firewall})) {

            if ($oldnet->{bridge}) {
                PVE::Network::tap_unplug($veth);
                # persist the intermediate (unplugged) state
                foreach my $prop (@plug_props) {
                    delete $oldnet->{$prop};
                }
                $conf->{$opt} = print_lxc_network($oldnet);
                write_config($vmid, $conf);
            }

            PVE::Network::tap_plug($veth, $newnet->{bridge}, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks});
            foreach my $prop (@plug_props) {
                $oldnet->{$prop} = $newnet->{$prop} if $newnet->{$prop};
            }
            $conf->{$opt} = print_lxc_network($oldnet);
            write_config($vmid, $conf);
        }
    }

    update_ipconfig($vmid, $conf, $opt, $eth, $newnet, $rootdir);
}
1613
# Create a veth pair for interface $netid, plug the host side into the
# configured bridge, move the peer into the running container and bring it
# up. Afterwards the link-level properties are stored in $conf->{$opt} and
# the config is written.
sub hotplug_net {
    my ($vmid, $conf, $opt, $newnet, $netid) = @_;

    my $veth = "veth${vmid}i${netid}";
    my $vethpeer = $veth . "p";
    my $eth = $newnet->{name};

    my ($bridge, $hwaddr) = ($newnet->{bridge}, $newnet->{hwaddr});
    PVE::Network::veth_create($veth, $vethpeer, $bridge, $hwaddr);
    PVE::Network::tap_plug($veth, $bridge, $newnet->{tag}, $newnet->{firewall}, $newnet->{trunks});

    # attach peer in container
    PVE::Tools::run_command(['lxc-device', '-n', $vmid, 'add', $vethpeer, "$eth"]);

    # link up peer in container
    PVE::Tools::run_command(
        ['lxc-attach', '-n', $vmid, '-s', 'NETWORK', '--', '/sbin/ip', 'link', 'set', $eth, 'up']);

    # only the properties applied above are recorded; true values only
    my $done = { type => 'veth' };
    foreach my $prop (qw(bridge tag firewall hwaddr name)) {
        $done->{$prop} = $newnet->{$prop} if $newnet->{$prop};
    }
    $conf->{$opt} = print_lxc_network($done);

    write_config($vmid, $conf);
}
1640
# Apply changed IP address / gateway settings of interface $eth (config
# option $opt) inside a running container, for IPv4 and then IPv6.
#
# For each address family: add the new address, replace (or delete) the
# default route, delete the old address, then store the new ip/gw values in
# $conf->{$opt}, write the config and let PVE::LXC::Setup update the
# container's network setup. If adding the address or replacing the route
# fails, a warning is emitted and that address family is left unchanged.
sub update_ipconfig {
    my ($vmid, $conf, $opt, $eth, $newnet, $rootdir) = @_;

    my $lxc_setup = PVE::LXC::Setup->new($conf, $rootdir);

    my $optdata = parse_lxc_network($conf->{$opt});

    # run a command inside the container's network namespace
    my $nscmd = sub {
        my $cmdargs = shift;
        PVE::Tools::run_command(['lxc-attach', '-n', $vmid, '-s', 'NETWORK', '--', @_], %$cmdargs);
    };
    my $ipcmd = sub { $nscmd->({}, '/sbin/ip', @_) };

    # values of the ip/ip6 properties that are keywords, not addresses
    my $ip_keyword_re = qr/^(?:auto|dhcp|manual)$/;

    my $change_ip_config = sub {
        my ($ipversion) = @_;

        my $family_opt = "-$ipversion";
        my $suffix = $ipversion == 4 ? '' : $ipversion;
        my $gw= "gw$suffix";
        my $ip= "ip$suffix";

        my $newip = $newnet->{$ip};
        my $newgw = $newnet->{$gw};
        my $oldip = $optdata->{$ip};

        my $change_ip = $safe_string_ne->($oldip, $newip);
        my $change_gw = $safe_string_ne->($optdata->{$gw}, $newgw);

        return if !$change_ip && !$change_gw;

        # step 1: add new IP, if this fails we cancel
        my $is_real_ip = ($newip && $newip !~ $ip_keyword_re);
        my $added_ip = $change_ip && $is_real_ip;
        if ($added_ip) {
            eval { $ipcmd->($family_opt, 'addr', 'add', $newip, 'dev', $eth); };
            if (my $err = $@) {
                warn $err;
                return;
            }
        }

        # step 2: replace gateway
        # If this fails we delete the added IP and cancel.
        # If it succeeds we save the config and delete the old IP, ignoring
        # errors. The config is then saved.
        # Note: 'ip route replace' can add
        if ($change_gw) {
            if ($newgw) {
                eval {
                    # gateway outside the new subnet needs an explicit device route
                    if ($is_real_ip && !PVE::Network::is_ip_in_cidr($newgw, $newip, $ipversion)) {
                        $ipcmd->($family_opt, 'route', 'add', $newgw, 'dev', $eth);
                    }
                    $ipcmd->($family_opt, 'route', 'replace', 'default', 'via', $newgw);
                };
                if (my $err = $@) {
                    warn $err;
                    # the route was not replaced, the old IP is still available
                    # rollback (delete new IP) and cancel; only undo what
                    # step 1 actually added
                    if ($added_ip) {
                        eval { $ipcmd->($family_opt, 'addr', 'del', $newip, 'dev', $eth); };
                        warn $@ if $@; # no need to die here
                    }
                    return;
                }
            } else {
                eval { $ipcmd->($family_opt, 'route', 'del', 'default'); };
                # if the route was not deleted, the guest might have deleted it manually
                # warn and continue
                warn $@ if $@;
            }
        }

        # from this point on we save the configuration
        # step 3: delete old IP ignoring errors
        # (keyword values such as 'manual' are not addresses and are skipped)
        if ($change_ip && $oldip && $oldip !~ $ip_keyword_re) {
            # We need to enable promote_secondaries, otherwise our newly added
            # address will be removed along with the old one.
            my $promote = 0;
            eval {
                if ($ipversion == 4) {
                    $nscmd->({ outfunc => sub { $promote = int(shift) } },
                        'cat', "/proc/sys/net/ipv4/conf/$eth/promote_secondaries");
                    $nscmd->({}, 'sysctl', "net.ipv4.conf.$eth.promote_secondaries=1");
                }
                $ipcmd->($family_opt, 'addr', 'del', $oldip, 'dev', $eth);
            };
            warn $@ if $@; # no need to die here

            # restore the previous promote_secondaries setting
            if ($ipversion == 4) {
                $nscmd->({}, 'sysctl', "net.ipv4.conf.$eth.promote_secondaries=$promote");
            }
        }

        foreach my $property ($ip, $gw) {
            if ($newnet->{$property}) {
                $optdata->{$property} = $newnet->{$property};
            } else {
                delete $optdata->{$property};
            }
        }
        $conf->{$opt} = print_lxc_network($optdata);
        write_config($vmid, $conf);
        $lxc_setup->setup_network($conf);
    };

    $change_ip_config->(4);
    $change_ip_config->(6);

}
1750
a92f66c9
WL
1751# Internal snapshots
1752
1753# NOTE: Snapshot create/delete involves several non-atomic
c31ad455
FG
1754# actions, and can take a long time.
1755# So we try to avoid locking the file and use the 'lock' variable
a92f66c9
WL
1756# inside the config file instead.
1757
# Copy all entries of $source into $dest, except snapshot bookkeeping keys,
# 'lock', 'digest', 'description' and the unusedN entries.
my $snapshot_copy_config = sub {
    my ($source, $dest) = @_;

    my %skip = map { $_ => 1 }
        qw(snapshots snapstate snaptime vmstate lock digest description);

    foreach my $k (keys %$source) {
        next if $skip{$k} || $k =~ m/^unused\d+$/;

        $dest->{$k} = $source->{$k};
    }
};
1774
0f8b9438
FG
# Build a new config from snapshot $snap: the snapshot list, description and
# unusedN entries are taken from the current $conf, everything else is copied
# from the snapshot. Returns the new config hash.
my $snapshot_apply_config = sub {
    my ($conf, $snap) = @_;

    # copy snapshot list
    my $merged = { snapshots => $conf->{snapshots} };

    # keep description and list of unused disks
    my @kept = grep { $_ eq 'description' || m/^unused\d+$/ } keys %$conf;
    foreach my $k (@kept) {
        $merged->{$k} = $conf->{$k};
    }

    $snapshot_copy_config->($snap, $merged);

    return $merged;
};
1793
# Placeholder: saving the runtime state is not implemented, so this always dies.
my $snapshot_save_vmstate = sub {
    die("implement me - snapshot_save_vmstate\n");
};
1797
0bfffef4
FG
# First phase of taking a snapshot, done under the config lock: set the
# 'snapshot' lock in the config and add a snapshot entry in state "prepare"
# holding a copy of the current config. Returns the new snapshot entry.
#
# Dies for templates, locked configs, already used snapshot names, or when
# has_feature() reports the needed feature as unavailable.
sub snapshot_prepare {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap;

    my $prepare = sub {
        my $conf = load_config($vmid);

        if (is_template($conf)) {
            die "you can't take a snapshot if it's a template\n";
        }

        check_lock($conf);

        $conf->{lock} = 'snapshot';

        if (defined($conf->{snapshots}->{$snapname})) {
            die "snapshot name '$snapname' already used\n";
        }

        my $storecfg = PVE::Storage::config();

        # workaround until mp snapshots are implemented
        my $feature = 'snapshot';
        $feature = 'vzdump' if $snapname eq 'vzdump';
        if (!has_feature($feature, $conf, $storecfg)) {
            die "snapshot feature is not available\n";
        }

        $snap = {};
        $conf->{snapshots}->{$snapname} = $snap;

        if ($save_vmstate && check_running($vmid)) {
            $snapshot_save_vmstate->($vmid, $conf, $snapname, $storecfg);
        }

        $snapshot_copy_config->($conf, $snap);

        $snap->{snapstate} = "prepare";
        $snap->{snaptime} = time();
        $snap->{description} = $comment if $comment;

        write_config($vmid, $conf);
    };

    lock_config($vmid, $prepare);

    return $snap;
}
a92f66c9 1842
# Final phase of taking a snapshot, done under the config lock: verify that
# the config holds the 'snapshot' lock and the snapshot is in state
# "prepare", clear both, and write a config whose 'parent' is the snapshot.
sub snapshot_commit {
    my ($vmid, $snapname) = @_;

    my $commit = sub {
        my $conf = load_config($vmid);

        my $lock = $conf->{lock};
        if (!($lock && $lock eq 'snapshot')) {
            die "missing snapshot lock\n";
        }

        my $snap = $conf->{snapshots}->{$snapname};
        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        my $state = $snap->{snapstate};
        if (!($state && $state eq "prepare")) {
            die "wrong snapshot state\n";
        }

        delete $snap->{snapstate};
        delete $conf->{lock};

        my $newconf = $snapshot_apply_config->($conf, $snap);
        $newconf->{parent} = $snapname;

        write_config($vmid, $newconf);
    };

    lock_config($vmid, $commit);
}
a92f66c9
WL
1871
# Return 1 if every relevant mountpoint volume supports $feature according to
# PVE::Storage::volume_has_feature, 0 otherwise.
#
# The pseudo feature 'vzdump' is checked as 'snapshot', but skips non-rootfs
# mountpoints that are not flagged for backup. Dies for any other checked
# mountpoint that is not 'rootfs'.
sub has_feature {
    my ($feature, $conf, $storecfg, $snapname) = @_;

    my $unsupported;
    my $vzdump = $feature eq 'vzdump';
    if ($vzdump) {
        $feature = 'snapshot';
    }

    my $check_mountpoint = sub {
        my ($ms, $mountpoint) = @_;

        return if $unsupported; # skip further test
        return if $vzdump && $ms ne 'rootfs' && !$mountpoint->{backup};

        my $ok = PVE::Storage::volume_has_feature($storecfg, $feature, $mountpoint->{volume}, $snapname);
        $unsupported = 1 if !$ok;

        # TODO: implement support for mountpoints
        if ($ms ne 'rootfs') {
            die "unable to handle mountpoint '$ms' - feature not implemented\n";
        }
    };
    foreach_mountpoint($conf, $check_mountpoint);

    return $unsupported ? 0 : 1;
}
1894
34fdb3d7
WB
# Switch the current process into namespace $which (file name below
# /proc/$pid/ns, with matching $type flag) of process $pid.
my $enter_namespace = sub {
    my ($vmid, $pid, $which, $type) = @_;

    my $nsfile = "/proc/$pid/ns/$which";
    sysopen(my $fd, $nsfile, O_RDONLY)
        or die "failed to open $which namespace of container $vmid: $!\n";

    PVE::Tools::setns(fileno($fd), $type)
        or die "failed to enter $which namespace of container $vmid: $!\n";

    close $fd;
};
1903
# Child side of sync_container_namespace: enter the mount namespace of $pid,
# signal the parent with "go", read the mount table the parent sends back
# over $socket, and sync every listed mountpoint except lxcfs ones.
my $do_syncfs = sub {
    my ($vmid, $pid, $socket) = @_;

    $enter_namespace->($vmid, $pid, 'mnt', PVE::Tools::CLONE_NEWNS);

    # Tell the parent process to start reading our /proc/mounts
    print {$socket} "go\n";
    $socket->flush();

    # Receive /proc/self/mounts
    my $mountdata;
    {
        local $/ = undef;
        $mountdata = <$socket>;
    }
    close $socket;

    # Now sync all mountpoints...
    my $mounts = PVE::ProcFSTools::parse_mounts($mountdata);
    foreach my $entry (@$mounts) {
        my ($what, $dir, $fs) = @$entry;
        if ($fs ne 'fuse.lxcfs') {
            eval { PVE::Tools::sync_mountpoint($dir); };
            warn $@ if $@;
        }
    }
};
1926
# Sync all filesystems mounted inside the mount namespace of container $vmid.
#
# A child process is forked which enters the container's mount namespace;
# the parent reads that child's /proc/<pid>/mounts and sends the content back
# over a socket pair, so the child knows which mountpoints to sync.
# Dies if the child cannot enter the namespace or exits with an error.
sub sync_container_namespace {
    my ($vmid) = @_;
    my $pid = find_lxc_pid($vmid);

    # SOCK_DGRAM is nicer for barriers but cannot be slurped
    socketpair my $pfd, my $cfd, AF_UNIX, SOCK_STREAM, PF_UNSPEC
        or die "failed to create socketpair: $!\n";

    my $child = fork();
    die "fork failed: $!\n" if !defined($child);

    if (!$child) {
        eval {
            close $pfd;
            &$do_syncfs($vmid, $pid, $cfd);
        };
        if (my $err = $@) {
            warn $err;
            POSIX::_exit(1);
        }
        POSIX::_exit(0);
    }
    close $cfd;

    eval {
        # undef means the child closed the socket without sending anything
        my $go = <$pfd>;
        die "failed to enter container namespace\n"
            if !defined($go) || $go ne "go\n";

        open my $mounts, '<', "/proc/$child/mounts"
            or die "failed to open container's /proc/mounts: $!\n";
        my $mountdata = do { local $/ = undef; <$mounts> };
        close $mounts;
        print {$pfd} $mountdata;
    };
    my $err = $@;

    # Closing our end gives the child EOF; always reap it, even on errors, so
    # no zombie process is left behind.
    close $pfd;
    while (waitpid($child, 0) != $child) {}
    my $status = $?;

    die $err if $err;
    die "failed to sync container namespace\n" if $status != 0;
}
1963
# Take snapshot $snapname of container $vmid: prepare the snapshot config
# entry, freeze and sync the container if it is running, snapshot the rootfs
# volume, unfreeze, and commit. On error the prepared snapshot is deleted
# again (errors of that cleanup are only warned about) and the error is
# rethrown.
sub snapshot_create {
    my ($vmid, $snapname, $save_vmstate, $comment) = @_;

    my $snap = snapshot_prepare($vmid, $snapname, $save_vmstate, $comment);

    my $conf = load_config($vmid);
    my $running = check_running($vmid);

    my $frozen = 0;
    my $drivehash = {};

    my $take_snapshot = sub {
        if ($running) {
            # set first, so the container is unfrozen even if freezing fails
            $frozen = 1;
            PVE::Tools::run_command(['/usr/bin/lxc-freeze', '-n', $vmid]);
            sync_container_namespace($vmid);
        }

        my $storecfg = PVE::Storage::config();
        my $rootinfo = parse_ct_rootfs($conf->{rootfs});

        PVE::Storage::volume_snapshot($storecfg, $rootinfo->{volume}, $snapname);
        $drivehash->{rootfs} = 1;
    };

    eval { $take_snapshot->(); };
    my $err = $@;

    if ($frozen) {
        eval { PVE::Tools::run_command(['/usr/bin/lxc-unfreeze', '-n', $vmid]); };
        warn $@ if $@;
    }

    if ($err) {
        eval { snapshot_delete($vmid, $snapname, 1, $drivehash); };
        warn "$@\n" if $@;
        die "$err\n";
    }

    snapshot_commit($vmid, $snapname);
}
2006
74bf6d37 2007# Note: $drivehash is only set when called from snapshot_create.
# Delete snapshot $snapname of container $vmid in three steps:
#   1. under the config lock, mark the snapshot with snapstate 'delete'
#   2. remove the storage snapshot of the rootfs volume
#   3. under the config lock, drop the snapshot section and re-link parents
# With $force set, a failure in step 2 is downgraded to a warning.
# When $drivehash is passed, the lock/template checks are skipped and the
# config lock entry is removed in step 3.
sub snapshot_delete {
    my ($vmid, $snapname, $force, $drivehash) = @_;

    # Shared state for the two invocations of $update_config below.
    my $preparing = 1;
    my $snap;

    # Re-point (or remove) a 'parent' reference that names the deleted snapshot.
    my $relink_parent = sub {
        my ($section, $new_parent) = @_;

        return if !($section->{parent} && $section->{parent} eq $snapname);

        if ($new_parent) {
            $section->{parent} = $new_parent;
        } else {
            delete $section->{parent};
        }
    };

    my $update_config = sub {
        my ($remove_drive) = @_;

        my $conf = load_config($vmid);

        if (!$drivehash) {
            check_lock($conf);
            die "you can't delete a snapshot if vm is a template\n"
                if is_template($conf);
        }

        $snap = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($snap);

        # remove parent refs
        if (!$preparing) {
            my $grandparent = $snap->{parent};
            $relink_parent->($conf, $grandparent);
            for my $other (keys %{$conf->{snapshots}}) {
                next if $other eq $snapname;
                $relink_parent->($conf->{snapshots}->{$other}, $snap->{parent});
            }
        }

        if ($remove_drive) {
            die "implement me - saving vmstate\n" if $remove_drive eq 'vmstate';
            die "implement me - remove drive\n";
        }

        if ($preparing) {
            $snap->{snapstate} = 'delete';
        } else {
            delete $conf->{snapshots}->{$snapname};
            delete $conf->{lock} if $drivehash;
        }

        write_config($vmid, $conf);
    };

    lock_config($vmid, $update_config);

    # now remove vmstate file
    # never set for LXC!
    my $storecfg = PVE::Storage::config();

    die "implement me - saving vmstate\n" if $snap->{vmstate};

    # now remove all volume snapshots
    # only rootfs for now!
    eval {
        my $rootinfo = parse_ct_rootfs($snap->{rootfs});
        PVE::Storage::volume_snapshot_delete($storecfg, $rootinfo->{volume}, $snapname);
    };
    if (my $err = $@) {
        die $err if !$force;
        warn $err;
    }

    # now cleanup config
    $preparing = 0;
    lock_config($vmid, $update_config);
}
2096
723157f6
WL
# Roll container $vmid back to snapshot $snapname.
#
# Phase 1 (under the config lock): validate, stop the container if it is
# running and set the 'rollback' lock. Then the rootfs volume is rolled back
# on the storage. Phase 2 (under the config lock again): verify the lock,
# apply the snapshot's config and record the snapshot as parent.
sub snapshot_rollback {
    my ($vmid, $snapname) = @_;

    my $preparing = 1;

    my $storecfg = PVE::Storage::config();

    my $conf = load_config($vmid);

    # Looks up the snapshot section in the *current* value of $conf.
    my $lookup_snapshot = sub {
        die "you can't rollback if vm is a template\n" if is_template($conf);

        my $section = $conf->{snapshots}->{$snapname};

        die "snapshot '$snapname' does not exist\n" if !defined($section);

        return $section;
    };

    my $snap = $lookup_snapshot->();

    # only for rootfs for now!
    my $rootinfo = parse_ct_rootfs($snap->{rootfs});
    my $volid = $rootinfo->{volume};

    PVE::Storage::volume_rollback_is_possible($storecfg, $volid, $snapname);

    my $update_config = sub {
        # Re-read config and snapshot while holding the lock.
        $conf = load_config($vmid);
        $snap = $lookup_snapshot->();

        die "unable to rollback to incomplete snapshot (snapstate = $snap->{snapstate})\n"
            if $snap->{snapstate};

        if ($preparing) {
            check_lock($conf);
            if (check_running($vmid)) {
                PVE::Tools::run_command(['/usr/bin/lxc-stop', '-n', $vmid, '--kill']);
            }
        }

        die "unable to rollback vm $vmid: vm is running\n"
            if check_running($vmid);

        if ($preparing) {
            $conf->{lock} = 'rollback';
        } else {
            my $has_rollback_lock = $conf->{lock} && $conf->{lock} eq 'rollback';
            die "got wrong lock\n" if !$has_rollback_lock;
            delete $conf->{lock};

            # copy snapshot config to current config
            $conf = &$snapshot_apply_config($conf, $snap);
            $conf->{parent} = $snapname;
        }

        write_config($vmid, $conf);

        die "implement me - save vmstate\n"
            if !$preparing && $snap->{vmstate};
    };

    lock_config($vmid, $update_config);

    # only rootfs for now!
    PVE::Storage::volume_snapshot_rollback($storecfg, $volid, $snapname);

    $preparing = 0;
    lock_config($vmid, $update_config);
}
b935932a 2174
bb1ac2de
DM
# Convert the rootfs volume of container $vmid into a base (template) volume
# and store the resulting volume id in $conf, which is then written out.
# Dies if the storage does not offer the 'template' feature for the volume.
sub template_create {
    my ($vmid, $conf) = @_;

    my $storecfg = PVE::Storage::config();

    my $rootinfo = parse_ct_rootfs($conf->{rootfs});
    my $volid = $rootinfo->{volume};

    my $can_template = PVE::Storage::volume_has_feature($storecfg, 'template', $volid);
    if (!$can_template) {
        die "Template feature is not available for '$volid'\n";
    }

    PVE::Storage::activate_volumes($storecfg, [$volid]);

    # The base volume gets a new volume id; keep all other rootfs properties.
    $rootinfo->{volume} = PVE::Storage::vdisk_create_base($storecfg, $volid);
    $conf->{rootfs} = print_ct_mountpoint($rootinfo, 1);

    write_config($vmid, $conf);
}
2194
# Return 1 if the config has 'template' set to 1, a false value otherwise.
sub is_template {
    my ($conf) = @_;

    my $flag = $conf->{template};
    return 1 if defined($flag) && $flag == 1;

    # Perl's canonical false value (empty string / numeric 0).
    return !1;
}
2200
9622e848
DM
# List all possible mount point config keys: 'rootfs' first, followed by
# mp0 .. mp($MAX_MOUNT_POINTS - 1). With $reverse set the order is reversed.
sub mountpoint_names {
    my ($reverse) = @_;

    my @names = ('rootfs', map { "mp$_" } 0 .. $MAX_MOUNT_POINTS - 1);

    return $reverse ? reverse @names : @names;
}
2212
3c9dbfa9 2213
9622e848
DM
# Call $func->($key, $mountpoint) for every mount point key that is set in
# $conf and whose value can be parsed. Keys are visited in the order given
# by mountpoint_names($reverse); unparsable entries are silently skipped.
sub foreach_mountpoint_full {
    my ($conf, $reverse, $func) = @_;

    for my $name (mountpoint_names($reverse)) {
        my $raw = $conf->{$name};
        next if !defined($raw);

        # rootfs uses its own parser; both are called in "no error" mode.
        my $parsed;
        if ($name eq 'rootfs') {
            $parsed = parse_ct_rootfs($raw, 1);
        } else {
            $parsed = parse_ct_mountpoint($raw, 1);
        }
        next if !defined($parsed);

        $func->($name, $parsed);
    }
}
2226
9622e848
DM
# Iterate over the configured mount points in forward order (rootfs first).
sub foreach_mountpoint {
    my ($conf, $func) = @_;

    my $reverse = 0;
    return foreach_mountpoint_full($conf, $reverse, $func);
}
2232
# Iterate over the configured mount points in reverse order (rootfs last).
sub foreach_mountpoint_reverse {
    my ($conf, $func) = @_;

    my $reverse = 1;
    return foreach_mountpoint_full($conf, $reverse, $func);
}
2238
# Verify that $authuser may set every option in $newconf and remove every
# option listed in $delete. Each option maps to one VM.Config.* privilege
# which is checked through $rpcenv->check_vm_perm. 'root@pam' skips all
# checks. Returns 1 when nothing was refused.
sub check_ct_modify_config_perm {
    my ($rpcenv, $authuser, $vmid, $pool, $newconf, $delete) = @_;

    return 1 if $authuser eq 'root@pam';

    my $require_priv = sub {
        my ($priv) = @_;
        $rpcenv->check_vm_perm($authuser, $vmid, $pool, [$priv]);
    };

    my $check_option = sub {
        my ($opt, $removing) = @_;

        if ($opt eq 'cpus' || $opt eq 'cpuunits' || $opt eq 'cpulimit') {
            $require_priv->('VM.Config.CPU');
            return;
        }

        if ($opt eq 'rootfs' || $opt =~ /^mp\d+$/) {
            $require_priv->('VM.Config.Disk');
            return if $removing;

            # Setting anything but a storage-backed volume is refused here.
            my $data = $opt eq 'rootfs'
                ? parse_ct_rootfs($newconf->{$opt})
                : parse_ct_mountpoint($newconf->{$opt});
            raise_perm_exc("mountpoint type $data->{type}") if $data->{type} ne 'volume';
            return;
        }

        if ($opt eq 'memory' || $opt eq 'swap') {
            $require_priv->('VM.Config.Memory');
            return;
        }

        if ($opt =~ m/^net\d+$/ || $opt eq 'nameserver' ||
            $opt eq 'searchdomain' || $opt eq 'hostname') {
            $require_priv->('VM.Config.Network');
            return;
        }

        $require_priv->('VM.Config.Options');
        return;
    };

    for my $opt (keys %$newconf) {
        $check_option->($opt, 0);
    }
    for my $opt (@$delete) {
        $check_option->($opt, 1);
    }

    return 1;
}
2273
# Unmount all mount points of container $vmid below its rootfs directory,
# in reverse order so nested mounts go first.
#
# Entries without volume or mount path, and paths that are not currently
# mounted, are skipped. With $noerr set, umount failures are only warned
# about; otherwise the first failure is fatal.
# $storage_cfg is accepted for interface compatibility but not used here.
sub umount_all {
    my ($vmid, $storage_cfg, $conf, $noerr) = @_;

    my $rootdir = "/var/lib/lxc/$vmid/rootfs";

    foreach_mountpoint_reverse($conf, sub {
        my ($ms, $mountpoint) = @_;

        my $volid = $mountpoint->{volume};
        my $mount = $mountpoint->{mp};

        return if !$volid || !$mount;

        # Collapse duplicate slashes so the path matches what is_mounted sees.
        my $mount_path = "$rootdir/$mount";
        $mount_path =~ s!/+!/!g;

        return if !PVE::ProcFSTools::is_mounted($mount_path);

        eval {
            PVE::Tools::run_command(['umount', '-d', $mount_path]);
        };
        if (my $err = $@) {
            die $err if !$noerr;
            warn $err;
        }
    });
}
2305
# Activate all storage volumes of container $vmid and mount every configured
# mount point below /var/lib/lxc/$vmid/rootfs. If any mount fails, everything
# mounted so far is unmounted again (best effort) and the error is re-raised.
# Returns the rootfs directory.
sub mount_all {
    my ($vmid, $storage_cfg, $conf) = @_;

    my $rootdir = "/var/lib/lxc/$vmid/rootfs";
    File::Path::make_path($rootdir);

    PVE::Storage::activate_volumes($storage_cfg, get_vm_volumes($conf));

    my $mount_one = sub {
        my ($ms, $mountpoint) = @_;

        mountpoint_mount($mountpoint, $rootdir, $storage_cfg);
    };

    eval { foreach_mountpoint($conf, $mount_one); };

    my $err = $@;
    if ($err) {
        warn "mounting container failed\n";
        umount_all($vmid, $storage_cfg, $conf, 1);
        die $err;
    }

    return $rootdir;
}
2330
2331
# Resolve the source path of a mount point without mounting anything:
# delegates to mountpoint_mount with an undefined root directory.
sub mountpoint_mount_path {
    my ($mountpoint, $storage_cfg, $snapname) = @_;

    my $no_rootdir;
    return mountpoint_mount($mountpoint, $no_rootdir, $storage_cfg, $snapname);
}
cc6b0307 2337
2cfae16e
WB
# Die unless $path is free of symlinks: the canonicalized path must be
# identical to what Cwd::realpath resolves it to.
# realpath returns undef when the path cannot be resolved; that case is
# reported as such instead of being compared as an undefined string.
my $check_mount_path = sub {
    my ($path) = @_;
    $path = File::Spec->canonpath($path);
    my $real = Cwd::realpath($path);
    die "unable to resolve mount path '$path': $!\n" if !defined($real);
    if ($real ne $path) {
        die "mount path modified by symlink: $path != $real";
    }
};
2346
21f292ff
WB
# Ask losetup which loop device is associated with $path. Returns the device
# node (/dev/loopN) from the last matching output line, or undef if none.
sub query_loopdev {
    my ($path) = @_;

    my $loopdev;

    PVE::Tools::run_command(
        ['losetup', '--associated', $path],
        outfunc => sub {
            my ($line) = @_;
            $loopdev = $1 if $line =~ m@^(/dev/loop\d+):@;
        },
    );

    return $loopdev;
}
2360
50df544c
WB
2361# Run a function with a file attached to a loop device.
2362# The loop device is always detached afterwards (or set to autoclear).
2363# Returns the loop device.
# Attach $file to a free loop device, call $func->($device) and detach the
# device again, regardless of whether $func succeeded.
#
# Error precedence: an error raised by $func is always the one re-raised;
# a detach failure that happens on top of it is only warned about. A detach
# failure after a successful $func is fatal. Returns the loop device path.
sub run_with_loopdev {
    my ($func, $file) = @_;
    my $device;
    my $parser = sub {
        my $line = shift;
        if ($line =~ m@^(/dev/loop\d+)$@) {
            $device = $1;
        }
    };
    PVE::Tools::run_command(['losetup', '--show', '-f', $file], outfunc => $parser);
    die "failed to setup loop device for $file\n" if !$device;

    eval { $func->($device); };
    my $err = $@;

    # Detach inside eval so a failure here cannot hide the callback's error.
    eval { PVE::Tools::run_command(['losetup', '-d', $device]); };
    my $detach_err = $@;

    if ($err) {
        warn $detach_err if $detach_err;
        die $err;
    }
    die $detach_err if $detach_err;

    return $device;
}
2381
c2744c97
WB
# Bind-mount $dir onto $dest, passing @extra_opts through to mount. For a
# read-only mount ($ro) the bind mount is remounted 'ro' afterwards; if that
# remount fails the mount is removed again before the error is re-raised.
sub bindmount {
    my ($dir, $dest, $ro, @extra_opts) = @_;

    my @bind_cmd = ('mount', '-o', 'bind', @extra_opts, $dir, $dest);
    PVE::Tools::run_command(\@bind_cmd);

    if ($ro) {
        my @remount_cmd = ('mount', '-o', 'bind,remount,ro', $dest);
        eval { PVE::Tools::run_command(\@remount_cmd); };
        my $err = $@;
        if ($err) {
            warn "bindmount error\n";
            # don't leave writable bind-mounts behind...
            PVE::Tools::run_command(['umount', $dest]);
            die $err;
        }
    }
}
2395
b15c75fc 2396# use $rootdir = undef to just return the corresponding mount path
# Mount one parsed mount point below $rootdir, or - with $rootdir undefined -
# only determine the source path without mounting anything.
#
# Parameters:
#   $mountpoint  - parsed mount point hash (volume, mp, type, ro, acl, quota)
#   $rootdir     - container root directory, or undef
#   $storage_cfg - storage configuration
#   $snapname    - optional snapshot name (mounted read-only)
#
# Returns nothing if the entry has no volume or no mount path. Otherwise
# returns the source path in scalar context and
# ($path, $use_loopdev, $mounted_dev) in list context.
# Dies on unsupported storage types / image formats and on mount errors.
sub mountpoint_mount {
    my ($mountpoint, $rootdir, $storage_cfg, $snapname) = @_;

    my $volid = $mountpoint->{volume};
    my $mount = $mountpoint->{mp};
    my $type = $mountpoint->{type};
    # Quota is only considered for writable mounts that are not snapshots.
    my $quota = !$snapname && !$mountpoint->{ro} && $mountpoint->{quota};
    my $mounted_dev;

    return if !$volid || !$mount;

    my $mount_path;

    if (defined($rootdir)) {
        $rootdir =~ s!/+$!!;
        $mount_path = "$rootdir/$mount";
        $mount_path =~ s!/+!/!g;
        # Refuse targets that are redirected by symlinks before creating them.
        $check_mount_path->($mount_path);
        File::Path::mkpath($mount_path);
    }

    my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);

    die "unknown snapshot path for '$volid'" if !$storage && defined($snapname);

    my $optstring = '';
    if (defined($mountpoint->{acl})) {
        $optstring .= ($mountpoint->{acl} ? 'acl' : 'noacl');
    }
    my $readonly = $mountpoint->{ro};

    # Only hand '-o' to mount when there is something to pass; an empty
    # option string must not end up on the command line.
    my @extra_opts = $optstring ne '' ? ('-o', $optstring) : ();

    if ($storage) {

        my $scfg = PVE::Storage::storage_config($storage_cfg, $storage);
        my $path = PVE::Storage::path($storage_cfg, $volid, $snapname);

        my ($vtype, undef, undef, undef, undef, $isBase, $format) =
            PVE::Storage::parse_volname($storage_cfg, $volid);

        $format = 'iso' if $vtype eq 'iso'; # allow to handle iso files

        if ($format eq 'subvol') {
            if ($mount_path) {
                if ($snapname) {
                    if ($scfg->{type} eq 'zfspool') {
                        # mount -t zfs takes the dataset name, i.e. no leading slash
                        my $path_arg = $path;
                        $path_arg =~ s!^/+!!;
                        PVE::Tools::run_command(['mount', '-o', 'ro', @extra_opts, '-t', 'zfs', $path_arg, $mount_path]);
                    } else {
                        die "cannot mount subvol snapshots for storage type '$scfg->{type}'\n";
                    }
                } else {
                    bindmount($path, $mount_path, $readonly, @extra_opts);
                    warn "cannot enable quota control for bind mounted subvolumes\n" if $quota;
                }
            }
            return wantarray ? ($path, 0, $mounted_dev) : $path;
        } elsif ($format eq 'raw' || $format eq 'iso') {
            # Mounts the given device/image path; a no-op without $mount_path.
            my $domount = sub {
                my ($path) = @_;
                if ($mount_path) {
                    if ($format eq 'iso') {
                        PVE::Tools::run_command(['mount', '-o', 'ro', @extra_opts, $path, $mount_path]);
                    } elsif ($isBase || defined($snapname)) {
                        PVE::Tools::run_command(['mount', '-o', 'ro,noload', @extra_opts, $path, $mount_path]);
                    } else {
                        if ($quota) {
                            push @extra_opts, '-o', 'usrjquota=aquota.user,grpjquota=aquota.group,jqfmt=vfsv0';
                        }
                        push @extra_opts, '-o', 'ro' if $readonly;
                        PVE::Tools::run_command(['mount', @extra_opts, $path, $mount_path]);
                    }
                }
            };
            my $use_loopdev = 0;
            if ($scfg->{path}) {
                # File based storage: go through a loop device.
                $mounted_dev = run_with_loopdev($domount, $path);
                $use_loopdev = 1;
            } elsif ($scfg->{type} eq 'drbd' || $scfg->{type} eq 'lvm' ||
                     $scfg->{type} eq 'rbd' || $scfg->{type} eq 'lvmthin') {
                $mounted_dev = $path;
                $domount->($path);
            } else {
                die "unsupported storage type '$scfg->{type}'\n";
            }
            return wantarray ? ($path, $use_loopdev, $mounted_dev) : $path;
        } else {
            die "unsupported image format '$format'\n";
        }
    } elsif ($type eq 'device') {
        push @extra_opts, '-o', 'ro' if $readonly;
        PVE::Tools::run_command(['mount', @extra_opts, $volid, $mount_path]) if $mount_path;
        return wantarray ? ($volid, 0, $volid) : $volid;
    } elsif ($type eq 'bind') {
        die "directory '$volid' does not exist\n" if ! -d $volid;
        $check_mount_path->($volid);
        bindmount($volid, $mount_path, $readonly, @extra_opts) if $mount_path;
        warn "cannot enable quota control for bind mounts\n" if $quota;
        return wantarray ? ($volid, 0, undef) : $volid;
    }

    die "unsupported storage";
}
2502
9205e9d0
AD
# Collect the volume ids of all storage-backed mount points in $conf.
# The mount point whose key equals $excludes (if given) is left out, as are
# entries that are not of type 'volume' or whose id names no storage.
# Returns an array reference.
sub get_vm_volumes {
    my ($conf, $excludes) = @_;

    my @volumes;

    my $collect = sub {
        my ($ms, $mountpoint) = @_;

        return if $excludes && $ms eq $excludes;

        my $volid = $mountpoint->{volume};
        return if !$volid;
        return if $mountpoint->{type} ne 'volume';

        my ($sid) = PVE::Storage::parse_volume_id($volid, 1);
        return if !$sid;

        push @volumes, $volid;
    };

    foreach_mountpoint($conf, $collect);

    return \@volumes;
}
2525
# Create an ext4 file system (with the 'mmp' feature) on $dev whose root
# directory is owned by $rootuid:$rootgid.
sub mkfs {
    my ($dev, $rootuid, $rootgid) = @_;

    my $owner_opt = "root_owner=$rootuid:$rootgid";
    my @cmd = ('mkfs.ext4', '-O', 'mmp', '-E', $owner_opt, $dev);

    return PVE::Tools::run_command(\@cmd);
}
2533
# Format volume $volid with a file system whose root directory belongs to
# $rootuid:$rootgid.
#
# A plain device path (/dev/...) is formatted directly. Anything else must be
# a storage volume id in 'raw' format; the volume is activated and its path
# formatted. Dies for ids without a storage and for non-raw volumes.
sub format_disk {
    my ($storage_cfg, $volid, $rootuid, $rootgid) = @_;

    if ($volid =~ m!^/dev/.+!) {
        # Pass the owner along here as well, mkfs builds its root_owner
        # option from it.
        mkfs($volid, $rootuid, $rootgid);
        return;
    }

    my ($storage, $volname) = PVE::Storage::parse_volume_id($volid, 1);

    die "cannot format volume '$volid' with no storage\n" if !$storage;

    PVE::Storage::activate_volumes($storage_cfg, [$volid]);

    my $path = PVE::Storage::path($storage_cfg, $volid);

    my ($vtype, undef, undef, undef, undef, $isBase, $format) =
        PVE::Storage::parse_volname($storage_cfg, $volid);

    die "cannot format volume '$volid' (format == $format)\n"
        if $format ne 'raw';

    mkfs($path, $rootuid, $rootgid);
}
2558
# Free every volume in $vollist. A failure to free one volume is reported as
# a warning and does not stop the remaining volumes from being freed.
sub destroy_disks {
    my ($storecfg, $vollist) = @_;

    for my $vol (@$vollist) {
        eval { PVE::Storage::vdisk_free($storecfg, $vol); };
        if ($@) {
            warn $@;
        }
    }
}
2567
# Allocate the volumes requested in $settings for container $vmid and store
# the resulting mount point strings in $conf.
#
# A mount point whose volume has the form '<storage>:<size in GB>' gets a
# freshly allocated volume: a formatted raw image, or a subvolume on
# dir/nfs (size 0) and zfspool storages. Every other value is taken over as
# given. Subvolumes are chowned to the container's root uid/gid afterwards.
#
# Returns an array reference with the ids of all newly allocated volumes.
# On any error, the volumes allocated so far are destroyed and the error is
# re-raised.
sub create_disks {
    my ($storecfg, $vmid, $settings, $conf) = @_;

    my $vollist = [];

    eval {
        my (undef, $rootuid, $rootgid) = PVE::LXC::parse_id_maps($conf);
        my $chown_vollist = [];

        # Allocate a volume and register it for cleanup immediately, so that
        # a failure in a later step (e.g. formatting) still frees it.
        my $alloc = sub {
            my ($storage, $format, $size_kb) = @_;

            my $new_volid = PVE::Storage::vdisk_alloc($storecfg, $storage, $vmid, $format,
                                                      undef, $size_kb);
            push @$vollist, $new_volid;
            return $new_volid;
        };

        foreach_mountpoint($settings, sub {
            my ($ms, $mountpoint) = @_;

            my $volid = $mountpoint->{volume};

            my ($storage) = PVE::Storage::parse_volume_id($volid, 1);

            if ($storage && ($volid =~ m/^([^:\s]+):(\d+(\.\d+)?)$/)) {
                my $size_gb = $2;

                my $size_kb = int($size_gb * 1024) * 1024;

                my $scfg = PVE::Storage::storage_config($storecfg, $storage);
                # fixme: use better naming ct-$vmid-disk-X.raw?

                if ($scfg->{type} eq 'dir' || $scfg->{type} eq 'nfs') {
                    if ($size_kb > 0) {
                        $volid = $alloc->($storage, 'raw', $size_kb);
                        format_disk($storecfg, $volid, $rootuid, $rootgid);
                    } else {
                        $volid = $alloc->($storage, 'subvol', 0);
                        push @$chown_vollist, $volid;
                    }
                } elsif ($scfg->{type} eq 'zfspool') {

                    $volid = $alloc->($storage, 'subvol', $size_kb);
                    push @$chown_vollist, $volid;
                } elsif ($scfg->{type} eq 'drbd' || $scfg->{type} eq 'lvm' || $scfg->{type} eq 'lvmthin') {

                    $volid = $alloc->($storage, 'raw', $size_kb);
                    format_disk($storecfg, $volid, $rootuid, $rootgid);

                } elsif ($scfg->{type} eq 'rbd') {

                    die "krbd option must be enabled on storage type '$scfg->{type}'\n" if !$scfg->{krbd};
                    $volid = $alloc->($storage, 'raw', $size_kb);
                    format_disk($storecfg, $volid, $rootuid, $rootgid);
                } else {
                    die "unable to create containers on storage type '$scfg->{type}'\n";
                }
                $mountpoint->{volume} = $volid;
                $mountpoint->{size} = $size_kb * 1024;
                $conf->{$ms} = print_ct_mountpoint($mountpoint, $ms eq 'rootfs');
            } else {
                # use specified/existing volid/dir/device
                $conf->{$ms} = print_ct_mountpoint($mountpoint, $ms eq 'rootfs');
            }
        });

        # Subvolumes are not formatted, so ownership is set on their path.
        PVE::Storage::activate_volumes($storecfg, $chown_vollist, undef);
        foreach my $volid (@$chown_vollist) {
            my $path = PVE::Storage::path($storecfg, $volid, undef);
            chown($rootuid, $rootgid, $path);
        }
        PVE::Storage::deactivate_volumes($storecfg, $chown_vollist, undef);
    };
    # free allocated images on error
    if (my $err = $@) {
        destroy_disks($storecfg, $vollist);
        die $err;
    }
    return $vollist;
}
2645
68e8f3c5
DM
2646# bash completion helper
2647
# Completion helper: list the volume ids of available templates (or of
# backups when the command is 'restore'). If the value typed so far starts
# with '<storage>:', only that storage is queried.
sub complete_os_templates {
    my ($cmdname, $pname, $cvalue) = @_;

    my $cfg = PVE::Storage::config();

    # Stays undef unless the typed value already names a storage.
    my ($storeid) = $cvalue =~ m/^([^:]+):/;

    my $vtype = 'vztmpl';
    $vtype = 'backup' if $cmdname eq 'restore';

    my $data = PVE::Storage::template_list($cfg, $storeid, $vtype);

    my @volids;
    for my $id (keys %$data) {
        for my $item (@{$data->{$id}}) {
            next if !defined($item->{volid});
            push @volids, $item->{volid};
        }
    }

    return \@volids;
}
2671
68e8f3c5
DM
# Completion helper: list container ids.
#   $running undefined - all containers
#   $running true      - only active, non-template containers
#   $running false     - only inactive, non-template containers
my $complete_ctid_full = sub {
    my ($running) = @_;

    my $idlist = vmstatus();

    my $active_hash = list_active_containers();

    my @ids = grep {
        my $id = $_;
        my $keep = 1;
        if (defined($running)) {
            # Templates never match a state filter; otherwise the requested
            # state has to agree with the actual one.
            $keep = 0 if $idlist->{$id}->{template};
            $keep = 0 if $keep && ($running xor $active_hash->{$id});
        }
        $keep;
    } keys %$idlist;

    return \@ids;
};
2693
# Completion helper: ids of all containers, regardless of state.
sub complete_ctid {
    return $complete_ctid_full->();
}
2697
# Completion helper: ids of containers that are not running (no templates).
sub complete_ctid_stopped {
    my $running = 0;
    return $complete_ctid_full->($running);
}
2701
# Completion helper: ids of containers that are currently running.
sub complete_ctid_running {
    my $running = 1;
    return $complete_ctid_full->($running);
}
2705
c6a605f9
WB
# Extract the uid/gid mappings from the raw 'lxc.id_map' entries in $conf.
#
# Returns ($id_map, $rootuid, $rootgid): $id_map is a list of
# [type, container id, host id, length] entries, $rootuid/$rootgid are the
# host ids that container id 0 is mapped to (0 if unmapped). An unprivileged
# container without explicit mappings gets the default 100000/65536 range.
# Dies on a malformed id_map value.
sub parse_id_maps {
    my ($conf) = @_;

    my @mappings;
    my %root_id = (u => 0, g => 0);

    my $lxc = $conf->{lxc};
    for my $entry (@$lxc) {
        my ($key, $value) = @$entry;
        next if $key ne 'lxc.id_map';

        my ($type, $ct, $host, $length) = $value =~ /^([ug])\s+(\d+)\s+(\d+)\s+(\d+)\s*$/
            or die "failed to parse id_map: $value\n";

        push @mappings, [$type, $ct, $host, $length];

        # The mapping of container id 0 decides who owns the container's root.
        $root_id{$type} = $host if $ct == 0;
    }

    if (!@mappings && $conf->{unprivileged}) {
        # Should we read them from /etc/subuid?
        @mappings = (
            ['u', '0', '100000', '65536'],
            ['g', '0', '100000', '65536'],
        );
        $root_id{u} = $root_id{g} = 100000;
    }

    return (\@mappings, $root_id{u}, $root_id{g});
}
2738
01dce99b
WB
# Build the lxc-usernsexec command prefix for the given id mappings: one
# '-m type:ct:host:length' per mapping, terminated by '--'. Without any
# mappings an empty command prefix is returned.
sub userns_command {
    my ($id_map) = @_;

    return [] if !@$id_map;

    my @cmd = ('lxc-usernsexec');
    for my $mapping (@$id_map) {
        push @cmd, '-m', join(':', @$mapping);
    }
    push @cmd, '--';

    return \@cmd;
}
2746
f76a2828 27471;