+# Simulate how a packet travels through the kernel, starting at $start_state
+# and stopping once the routing state equals $target->{iface}. Every hop that
+# selects a PVEFW chain is checked with ruleset_simulate_chain(), so the
+# iptables rules may be consulted several times for a single packet.
+#
+# Parameters:
+#   $ruleset       - handed unchanged to ruleset_simulate_chain()
+#   $ipset_ruleset - currently not read by this function
+#   $pkg           - packet description (hash ref); its iface_in, iface_out,
+#                    physdev_in and physdev_out entries are reset and refilled
+#                    on every hop
+#   $from_info     - description of the packet source; depending on the state
+#                    the keys bridge, iface, fwbr, fwpr, fwln and tapdev are read
+#   $target        - description of the destination; {type} ('host', 'bport',
+#                    'ct' or 'vm') selects the route, {iface} names the state
+#                    at which the walk stops
+#   $start_state   - initial routing state: 'from-bport', 'host', 'venet-out'
+#                    or 'fwbr-out'. A vmbr<N> state needs the ingress port
+#                    recorded by a previous hop, so starting there dies.
+#
+# Returns the list ($verdict, $ipt_invocations, $rules_checked). $verdict is
+# the first result of ruleset_simulate_chain() that is not 'ACCEPT', or
+# 'ACCEPT' when every consulted chain accepted the packet.
+#
+# Dies with 'internal error' when a required info field is missing and with
+# 'implement me' for state/target combinations that are not modelled.
+sub route_packet {
+    my ($ruleset, $ipset_ruleset, $pkg, $from_info, $target, $start_state) = @_;
+
+    my $route_state = $start_state;
+
+    # Bridge port through which the packet entered the current bridge. It is
+    # set by the previous hop and required by the vmbr<N> state.
+    my $physdev_in;
+
+    my $ipt_invocation_counter = 0;
+    my $rule_check_counter = 0;
+
+    while ($route_state ne $target->{iface}) {
+
+        my $chain;
+        my $next_route_state;
+        my $next_physdev_in;
+
+        # Interface data of the previous hop must not leak into this one.
+        $pkg->{iface_in} = $pkg->{iface_out} = undef;
+        $pkg->{physdev_in} = $pkg->{physdev_out} = undef;
+
+        if ($route_state eq 'from-bport') {
+
+            # No chain is consulted here; the packet just moves on to the
+            # bridge and remembers the port it came in through.
+            $next_route_state = $from_info->{bridge} || die 'internal error';
+            $next_physdev_in = $from_info->{iface} || die 'internal error';
+
+        } elsif ($route_state eq 'host') {
+
+            if ($target->{type} eq 'bport') {
+                $pkg->{iface_in} = 'lo';
+                $pkg->{iface_out} = $target->{bridge} || die 'internal error';
+                $chain = 'PVEFW-OUTPUT';
+                $next_route_state = $target->{iface} || die 'internal error';
+            } elsif ($target->{type} eq 'ct') {
+                $pkg->{iface_in} = 'lo';
+                $pkg->{iface_out} = 'venet0';
+                $chain = 'PVEFW-OUTPUT';
+                $next_route_state = 'venet-in';
+            } elsif ($target->{type} eq 'vm') {
+                $pkg->{iface_in} = 'lo';
+                $pkg->{iface_out} = $target->{bridge} || die 'internal error';
+                $chain = 'PVEFW-OUTPUT';
+                $next_route_state = 'fwbr-in';
+            } else {
+                die "implement me";
+            }
+
+        } elsif ($route_state eq 'venet-out') {
+
+            if ($target->{type} eq 'host') {
+
+                $chain = 'PVEFW-INPUT';
+                $pkg->{iface_in} = 'venet0';
+                $pkg->{iface_out} = 'lo';
+                $next_route_state = 'host';
+
+            } elsif ($target->{type} eq 'bport') {
+
+                $chain = 'PVEFW-FORWARD';
+                $pkg->{iface_in} = 'venet0';
+                $pkg->{iface_out} = $target->{bridge} || die 'internal error';
+                $next_route_state = $target->{iface} || die 'internal error';
+
+            } elsif ($target->{type} eq 'vm') {
+
+                $chain = 'PVEFW-FORWARD';
+                $pkg->{iface_in} = 'venet0';
+                $pkg->{iface_out} = $target->{bridge} || die 'internal error';
+                $next_route_state = 'fwbr-in';
+
+            } elsif ($target->{type} eq 'ct') {
+
+                $chain = 'PVEFW-FORWARD';
+                $pkg->{iface_in} = 'venet0';
+                $pkg->{iface_out} = 'venet0';
+                $next_route_state = 'venet-in';
+
+            } else {
+                die "implement me";
+            }
+
+        } elsif ($route_state eq 'fwbr-out') {
+
+            # Packet leaves the source through its firewall bridge and then
+            # enters the source's bridge via the fwpr port.
+            $chain = 'PVEFW-FORWARD';
+            $next_route_state = $from_info->{bridge} || die 'internal error';
+            $next_physdev_in = $from_info->{fwpr} || die 'internal error';
+            $pkg->{iface_in} = $from_info->{fwbr} || die 'internal error';
+            $pkg->{iface_out} = $from_info->{fwbr} || die 'internal error';
+            $pkg->{physdev_in} = $from_info->{tapdev} || die 'internal error';
+            $pkg->{physdev_out} = $from_info->{fwln} || die 'internal error';
+
+        } elsif ($route_state eq 'fwbr-in') {
+
+            # Packet crosses the target's firewall bridge towards its tap device.
+            $chain = 'PVEFW-FORWARD';
+            $next_route_state = $target->{tapdev} || die 'internal error';
+            $pkg->{iface_in} = $target->{fwbr} || die 'internal error';
+            $pkg->{iface_out} = $target->{fwbr} || die 'internal error';
+            $pkg->{physdev_in} = $target->{fwln} || die 'internal error';
+            $pkg->{physdev_out} = $target->{tapdev} || die 'internal error';
+
+        } elsif ($route_state =~ m/^vmbr\d+$/) {
+
+            die "missing physdev_in - internal error?" if !$physdev_in;
+            $pkg->{physdev_in} = $physdev_in;
+
+            if ($target->{type} eq 'host') {
+
+                $chain = 'PVEFW-INPUT';
+                $pkg->{iface_in} = $route_state;
+                $pkg->{iface_out} = 'lo';
+                $next_route_state = 'host';
+
+            } elsif ($target->{type} eq 'bport') {
+
+                $chain = 'PVEFW-FORWARD';
+                $pkg->{iface_in} = $route_state;
+                $pkg->{iface_out} = $target->{bridge} || die 'internal error';
+                # conditionally set physdev_out (same behavior as kernel)
+                if ($route_state eq $target->{bridge}) {
+                    $pkg->{physdev_out} = $target->{iface} || die 'internal error';
+                }
+                $next_route_state = $target->{iface} || die 'internal error';
+
+            } elsif ($target->{type} eq 'ct') {
+
+                $chain = 'PVEFW-FORWARD';
+                $pkg->{iface_in} = $route_state;
+                $pkg->{iface_out} = 'venet0';
+                $next_route_state = 'venet-in';
+
+            } elsif ($target->{type} eq 'vm') {
+
+                $chain = 'PVEFW-FORWARD';
+                $pkg->{iface_in} = $route_state;
+                # A VM target without a bridge is a broken info hash; fail
+                # here instead of comparing against undef below.
+                $pkg->{iface_out} = $target->{bridge} || die 'internal error';
+                # conditionally set physdev_out (same behavior as kernel)
+                if ($route_state eq $target->{bridge}) {
+                    $pkg->{physdev_out} = $target->{fwpr} || die 'internal error';
+                }
+                $next_route_state = 'fwbr-in';
+
+            } else {
+                die "implement me";
+            }
+
+        } else {
+            die "implement me $route_state";
+        }
+
+        die "internal error" if !defined($next_route_state);
+
+        # Hops without a chain (e.g. 'from-bport') only advance the state.
+        if ($chain) {
+            add_trace("IPT check at $route_state (chain $chain)\n");
+            add_trace(Dumper($pkg));
+            $ipt_invocation_counter++;
+            my ($res, $ctr) = ruleset_simulate_chain($ruleset, $chain, $pkg);
+            $rule_check_counter += $ctr;
+            # The first verdict other than ACCEPT ends the traversal.
+            return ($res, $ipt_invocation_counter, $rule_check_counter) if $res ne 'ACCEPT';
+        }
+
+        $route_state = $next_route_state;
+
+        $physdev_in = $next_physdev_in;
+    }
+
+    return ('ACCEPT', $ipt_invocation_counter, $rule_check_counter);
+}
+
+# Build the info hash describing container $vmid for the packet simulation.
+#
+# The container configuration is looked up in $vmdata->{openvz}. Only
+# containers that carry an ip_address entry are supported; anything else
+# dies with "implement me".
+#
+# Returns a hash ref with the keys type ('ct'), vmid and ip_address.
+sub extract_ct_info {
+    my ($vmdata, $vmid) = @_;
+
+    my $ct_conf = $vmdata->{openvz}->{$vmid};
+    die "no such CT '$vmid'" if !$ct_conf;
+
+    # Containers without an ip_address entry are not modelled.
+    die "implement me" if !$ct_conf->{ip_address};
+
+    return {
+        type => 'ct',
+        vmid => $vmid,
+        ip_address => $ct_conf->{ip_address}->{value},
+    };
+}
+
+# Build the info hash describing virtual machine $vmid for the packet
+# simulation.
+#
+# The VM configuration is looked up in $vmdata->{qemu}. Only its net0 entry
+# is parsed (via PVE::QemuServer::parse_net), and the firewall device names
+# are derived from $vmid with fixed i0/p0 suffixes.
+#
+# Returns a hash ref with the keys type ('vm'), vmid, macaddr, bridge, fwbr,
+# tapdev, fwln and fwpr. Dies if the VM is unknown or if the parsed net0
+# entry has no MAC address or bridge.
+sub extract_vm_info {
+    my ($vmdata, $vmid) = @_;
+
+    my $vm_conf = $vmdata->{qemu}->{$vmid};
+    die "no such VM '$vmid'" if !$vm_conf;
+
+    my $nic = PVE::QemuServer::parse_net($vm_conf->{net0});
+    my $macaddr = $nic->{macaddr} || die "unable to get mac address";
+    my $bridge = $nic->{bridge} || die "unable to get bridge";
+
+    return {
+        type => 'vm',
+        vmid => $vmid,
+        macaddr => $macaddr,
+        bridge => $bridge,
+        fwbr => "fwbr${vmid}i0",
+        tapdev => "tap${vmid}i0",
+        fwln => "fwln${vmid}i0",
+        fwpr => "fwpr${vmid}p0",
+    };
+}