2023-02-02 20:22:18 +07:00
|
|
|
/*
|
|
|
|
* SPDX-License-Identifier: AGPL-3.0-only
|
2023-03-14 14:01:55 +07:00
|
|
|
* Copyright (c) 2022-2023, daeuniverse Organization <dae@v2raya.org>
|
2023-02-02 20:22:18 +07:00
|
|
|
*/
|
|
|
|
|
|
|
|
package control
|
|
|
|
|
|
|
|
import (
|
2023-03-23 14:34:56 +07:00
|
|
|
"context"
|
2023-07-07 16:35:01 +07:00
|
|
|
"errors"
|
2023-02-02 20:22:18 +07:00
|
|
|
"fmt"
|
2023-04-23 12:27:29 +07:00
|
|
|
"net"
|
|
|
|
"net/netip"
|
|
|
|
"os"
|
|
|
|
"regexp"
|
2023-07-07 16:35:01 +07:00
|
|
|
"sync"
|
2023-04-23 12:27:29 +07:00
|
|
|
|
2023-02-02 20:22:18 +07:00
|
|
|
"github.com/cilium/ebpf"
|
|
|
|
ciliumLink "github.com/cilium/ebpf/link"
|
2023-03-14 14:01:55 +07:00
|
|
|
"github.com/daeuniverse/dae/common"
|
|
|
|
"github.com/daeuniverse/dae/common/consts"
|
|
|
|
internal "github.com/daeuniverse/dae/pkg/ebpf_internal"
|
2023-07-09 15:02:17 +07:00
|
|
|
dnsmessage "github.com/miekg/dns"
|
2023-03-23 14:34:56 +07:00
|
|
|
"github.com/mohae/deepcopy"
|
|
|
|
"github.com/safchain/ethtool"
|
|
|
|
"github.com/sirupsen/logrus"
|
2023-02-02 20:22:18 +07:00
|
|
|
"github.com/vishvananda/netlink"
|
|
|
|
"golang.org/x/sys/unix"
|
|
|
|
)
|
|
|
|
|
2023-02-27 13:36:36 +07:00
|
|
|
// coreFlip is the package-level flip bit. newControlPlaneCore toggles it on
// reload and copies it into each core's flip field; Flip toggles it as well.
// Every update has the form `coreFlip&1 ^ 1`, so the value should be 0 or 1.
var coreFlip int
|
|
|
|
|
|
|
|
type controlPlaneCore struct {
|
2023-07-07 16:35:01 +07:00
|
|
|
mu sync.Mutex
|
|
|
|
|
2023-02-17 01:11:08 +07:00
|
|
|
log *logrus.Logger
|
|
|
|
deferFuncs []func() error
|
|
|
|
bpf *bpfObjects
|
|
|
|
outboundId2Name map[uint8]string
|
2023-02-02 20:22:18 +07:00
|
|
|
|
|
|
|
kernelVersion *internal.Version
|
2023-02-27 12:29:42 +07:00
|
|
|
|
2023-03-02 21:25:51 +07:00
|
|
|
flip int
|
|
|
|
isReload bool
|
|
|
|
bpfEjected bool
|
2023-03-23 14:34:56 +07:00
|
|
|
|
|
|
|
closed context.Context
|
|
|
|
close context.CancelFunc
|
2023-02-02 20:22:18 +07:00
|
|
|
}
|
|
|
|
|
2023-02-27 12:29:42 +07:00
|
|
|
func newControlPlaneCore(log *logrus.Logger,
|
|
|
|
bpf *bpfObjects,
|
|
|
|
outboundId2Name map[uint8]string,
|
|
|
|
kernelVersion *internal.Version,
|
|
|
|
isReload bool,
|
|
|
|
) *controlPlaneCore {
|
|
|
|
if isReload {
|
2023-02-27 13:36:36 +07:00
|
|
|
coreFlip = coreFlip&1 ^ 1
|
2023-02-27 12:29:42 +07:00
|
|
|
}
|
2023-03-02 21:25:51 +07:00
|
|
|
var deferFuncs []func() error
|
|
|
|
if !isReload {
|
|
|
|
deferFuncs = append(deferFuncs, bpf.Close)
|
|
|
|
}
|
2023-03-23 14:34:56 +07:00
|
|
|
closed, toClose := context.WithCancel(context.Background())
|
2023-02-27 12:29:42 +07:00
|
|
|
return &controlPlaneCore{
|
|
|
|
log: log,
|
2023-03-02 21:25:51 +07:00
|
|
|
deferFuncs: deferFuncs,
|
2023-02-27 12:29:42 +07:00
|
|
|
bpf: bpf,
|
|
|
|
outboundId2Name: outboundId2Name,
|
|
|
|
kernelVersion: kernelVersion,
|
|
|
|
flip: coreFlip,
|
2023-02-27 13:36:36 +07:00
|
|
|
isReload: isReload,
|
2023-03-23 14:34:56 +07:00
|
|
|
bpfEjected: false,
|
|
|
|
closed: closed,
|
|
|
|
close: toClose,
|
2023-02-27 12:29:42 +07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-03-02 21:25:51 +07:00
|
|
|
func (c *controlPlaneCore) Flip() {
|
|
|
|
coreFlip = coreFlip&1 ^ 1
|
|
|
|
}
|
2023-02-27 12:29:42 +07:00
|
|
|
func (c *controlPlaneCore) Close() (err error) {
|
2023-07-07 16:35:01 +07:00
|
|
|
c.mu.Lock()
|
|
|
|
defer c.mu.Unlock()
|
2023-03-23 14:34:56 +07:00
|
|
|
select {
|
|
|
|
case <-c.closed.Done():
|
|
|
|
return nil
|
|
|
|
default:
|
|
|
|
}
|
2023-02-02 20:22:18 +07:00
|
|
|
// Invoke defer funcs in reverse order.
|
|
|
|
for i := len(c.deferFuncs) - 1; i >= 0; i-- {
|
|
|
|
if e := c.deferFuncs[i](); e != nil {
|
|
|
|
// Combine errors.
|
|
|
|
if err != nil {
|
|
|
|
err = fmt.Errorf("%w; %v", err, e)
|
|
|
|
} else {
|
|
|
|
err = e
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2023-03-23 14:34:56 +07:00
|
|
|
c.close()
|
2023-02-02 20:22:18 +07:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-02-07 22:52:37 +07:00
|
|
|
func getIfParamsFromLink(link netlink.Link) (ifParams bpfIfParams, err error) {
|
2023-02-04 10:38:01 +07:00
|
|
|
// Get link offload features.
|
|
|
|
et, err := ethtool.NewEthtool()
|
|
|
|
if err != nil {
|
|
|
|
return bpfIfParams{}, err
|
|
|
|
}
|
|
|
|
defer et.Close()
|
|
|
|
features, err := et.Features(link.Attrs().Name)
|
|
|
|
if err != nil {
|
|
|
|
return bpfIfParams{}, err
|
|
|
|
}
|
|
|
|
if features["tx-checksum-ip-generic"] {
|
|
|
|
ifParams.TxL4CksmIp4Offload = true
|
|
|
|
ifParams.TxL4CksmIp6Offload = true
|
|
|
|
}
|
|
|
|
if features["tx-checksum-ipv4"] {
|
|
|
|
ifParams.TxL4CksmIp4Offload = true
|
|
|
|
}
|
|
|
|
if features["tx-checksum-ipv6"] {
|
|
|
|
ifParams.TxL4CksmIp6Offload = true
|
|
|
|
}
|
|
|
|
if features["rx-checksum"] {
|
|
|
|
ifParams.RxCksmOffload = true
|
|
|
|
}
|
|
|
|
switch {
|
|
|
|
case regexp.MustCompile(`^docker\d+$`).MatchString(link.Attrs().Name):
|
|
|
|
ifParams.UseNonstandardOffloadAlgorithm = true
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
return ifParams, nil
|
|
|
|
}
|
|
|
|
|
2023-02-27 12:29:42 +07:00
|
|
|
func (c *controlPlaneCore) addQdisc(ifname string) error {
|
2023-02-04 10:38:01 +07:00
|
|
|
link, err := netlink.LinkByName(ifname)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
qdisc := &netlink.GenericQdisc{
|
|
|
|
QdiscAttrs: netlink.QdiscAttrs{
|
|
|
|
LinkIndex: link.Attrs().Index,
|
|
|
|
Handle: netlink.MakeHandle(0xffff, 0),
|
|
|
|
Parent: netlink.HANDLE_CLSACT,
|
|
|
|
},
|
|
|
|
QdiscType: "clsact",
|
2023-02-06 12:56:43 +07:00
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
if err := netlink.QdiscAdd(qdisc); err != nil {
|
|
|
|
return fmt.Errorf("cannot add clsact qdisc: %w", err)
|
2023-02-04 10:38:01 +07:00
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-02-27 12:29:42 +07:00
|
|
|
func (c *controlPlaneCore) delQdisc(ifname string) error {
|
2023-02-08 13:36:16 +07:00
|
|
|
link, err := netlink.LinkByName(ifname)
|
|
|
|
if err != nil {
|
2023-02-04 10:38:01 +07:00
|
|
|
return err
|
|
|
|
}
|
2023-02-02 20:22:18 +07:00
|
|
|
qdisc := &netlink.GenericQdisc{
|
|
|
|
QdiscAttrs: netlink.QdiscAttrs{
|
|
|
|
LinkIndex: link.Attrs().Index,
|
|
|
|
Handle: netlink.MakeHandle(0xffff, 0),
|
|
|
|
Parent: netlink.HANDLE_CLSACT,
|
|
|
|
},
|
|
|
|
QdiscType: "clsact",
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
if err := netlink.QdiscDel(qdisc); err != nil {
|
|
|
|
if !os.IsExist(err) {
|
2023-02-02 20:22:18 +07:00
|
|
|
return fmt.Errorf("cannot add clsact qdisc: %w", err)
|
|
|
|
}
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
return nil
|
|
|
|
}
|
2023-02-02 20:22:18 +07:00
|
|
|
|
2023-02-27 12:29:42 +07:00
|
|
|
func (c *controlPlaneCore) setupRoutingPolicy() (err error) {
|
2023-02-18 13:55:42 +07:00
|
|
|
/// Insert ip rule / ip route.
|
2023-02-27 12:29:42 +07:00
|
|
|
var table = 2023 + c.flip
|
2023-02-18 13:55:42 +07:00
|
|
|
|
|
|
|
/** ip table
|
|
|
|
ip route add local default dev lo table 2023
|
|
|
|
ip -6 route add local default dev lo table 2023
|
|
|
|
*/
|
|
|
|
routes := []netlink.Route{{
|
|
|
|
Scope: unix.RT_SCOPE_HOST,
|
|
|
|
LinkIndex: consts.LoopbackIfIndex,
|
|
|
|
Dst: &net.IPNet{
|
|
|
|
IP: []byte{0, 0, 0, 0},
|
|
|
|
Mask: net.CIDRMask(0, 32),
|
|
|
|
},
|
|
|
|
Table: table,
|
|
|
|
Type: unix.RTN_LOCAL,
|
|
|
|
}, {
|
|
|
|
Scope: unix.RT_SCOPE_HOST,
|
|
|
|
LinkIndex: consts.LoopbackIfIndex,
|
|
|
|
Dst: &net.IPNet{
|
|
|
|
IP: []byte{0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
|
|
|
|
Mask: net.CIDRMask(0, 128),
|
|
|
|
},
|
|
|
|
Table: table,
|
|
|
|
Type: unix.RTN_LOCAL,
|
|
|
|
}}
|
2023-04-12 21:34:45 +07:00
|
|
|
var routeBadIpv6 bool
|
2023-02-18 13:55:42 +07:00
|
|
|
cleanRoutes := func() error {
|
|
|
|
var errs error
|
|
|
|
for _, route := range routes {
|
|
|
|
if e := netlink.RouteDel(&route); e != nil {
|
2023-04-12 21:34:45 +07:00
|
|
|
if len(route.Dst.IP) == net.IPv6len && routeBadIpv6 {
|
|
|
|
// Not clean for bad ipv6.
|
2023-03-04 20:16:09 +07:00
|
|
|
continue
|
|
|
|
}
|
2023-02-18 13:55:42 +07:00
|
|
|
if errs != nil {
|
|
|
|
errs = fmt.Errorf("%w; %v", errs, e)
|
|
|
|
} else {
|
|
|
|
errs = e
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if errs != nil {
|
|
|
|
return fmt.Errorf("IpRouteDel(lo): %w", errs)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
tryRouteAddAgain:
|
|
|
|
for _, route := range routes {
|
|
|
|
if err = netlink.RouteAdd(&route); err != nil {
|
|
|
|
if os.IsExist(err) {
|
|
|
|
_ = cleanRoutes()
|
|
|
|
goto tryRouteAddAgain
|
|
|
|
}
|
2023-03-04 20:16:09 +07:00
|
|
|
if len(route.Dst.IP) == net.IPv6len {
|
|
|
|
// ipv6
|
2023-04-12 21:34:45 +07:00
|
|
|
c.log.Warnln("IpRouteAdd: Bad IPv6 support. Perhaps your machine disabled IPv6.")
|
|
|
|
routeBadIpv6 = true
|
2023-03-04 20:16:09 +07:00
|
|
|
continue
|
|
|
|
}
|
2023-02-18 13:55:42 +07:00
|
|
|
return fmt.Errorf("IpRouteAdd: %w", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
c.deferFuncs = append(c.deferFuncs, cleanRoutes)
|
|
|
|
|
|
|
|
/** ip rule
|
|
|
|
ip rule add fwmark 0x8000000/0x8000000 table 2023
|
|
|
|
ip -6 rule add fwmark 0x8000000/0x8000000 table 2023
|
|
|
|
*/
|
|
|
|
rules := []netlink.Rule{{
|
|
|
|
SuppressIfgroup: -1,
|
|
|
|
SuppressPrefixlen: -1,
|
|
|
|
Priority: -1,
|
|
|
|
Goto: -1,
|
|
|
|
Flow: -1,
|
|
|
|
Family: unix.AF_INET,
|
|
|
|
Table: table,
|
|
|
|
Mark: int(consts.TproxyMark),
|
|
|
|
Mask: int(consts.TproxyMark),
|
|
|
|
}, {
|
|
|
|
SuppressIfgroup: -1,
|
|
|
|
SuppressPrefixlen: -1,
|
|
|
|
Priority: -1,
|
|
|
|
Goto: -1,
|
|
|
|
Flow: -1,
|
|
|
|
Family: unix.AF_INET6,
|
|
|
|
Table: table,
|
|
|
|
Mark: int(consts.TproxyMark),
|
|
|
|
Mask: int(consts.TproxyMark),
|
|
|
|
}}
|
2023-04-12 21:34:45 +07:00
|
|
|
var ruleBadIpv6 bool
|
2023-02-18 13:55:42 +07:00
|
|
|
cleanRules := func() error {
|
|
|
|
var errs error
|
|
|
|
for _, rule := range rules {
|
2023-04-12 21:34:45 +07:00
|
|
|
if rule.Family == unix.AF_INET6 && ruleBadIpv6 {
|
|
|
|
// Not clean for bad ipv6.
|
|
|
|
continue
|
|
|
|
}
|
2023-02-18 13:55:42 +07:00
|
|
|
if e := netlink.RuleDel(&rule); e != nil {
|
|
|
|
if errs != nil {
|
|
|
|
errs = fmt.Errorf("%w; %v", errs, e)
|
|
|
|
} else {
|
|
|
|
errs = e
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if errs != nil {
|
|
|
|
return fmt.Errorf("IpRuleDel: %w", errs)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
tryRuleAddAgain:
|
|
|
|
for _, rule := range rules {
|
|
|
|
if err = netlink.RuleAdd(&rule); err != nil {
|
|
|
|
if os.IsExist(err) {
|
|
|
|
_ = cleanRules()
|
|
|
|
goto tryRuleAddAgain
|
|
|
|
}
|
2023-04-12 21:34:45 +07:00
|
|
|
if rule.Family == unix.AF_INET6 {
|
|
|
|
// ipv6
|
|
|
|
c.log.Warnln("IpRuleAdd: Bad IPv6 support. Perhaps your machine disabled IPv6 (need CONFIG_IPV6_MULTIPLE_TABLES).")
|
|
|
|
ruleBadIpv6 = true
|
|
|
|
continue
|
|
|
|
}
|
2023-02-18 13:55:42 +07:00
|
|
|
return fmt.Errorf("IpRuleAdd: %w", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
c.deferFuncs = append(c.deferFuncs, cleanRules)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-07-07 16:35:01 +07:00
|
|
|
func (c *controlPlaneCore) addLinkCb(_ifname string, rtmType uint16, cb func()) error {
|
|
|
|
ch := make(chan netlink.LinkUpdate)
|
|
|
|
done := make(chan struct{})
|
|
|
|
if e := netlink.LinkSubscribeWithOptions(ch, done, netlink.LinkSubscribeOptions{
|
|
|
|
ErrorCallback: func(err error) {
|
2023-07-07 20:07:39 +07:00
|
|
|
c.log.Debug("LinkSubscribe:", err)
|
2023-07-07 16:35:01 +07:00
|
|
|
},
|
|
|
|
ListExisting: true,
|
|
|
|
}); e != nil {
|
|
|
|
return e
|
|
|
|
}
|
|
|
|
go func(ctx context.Context, ch <-chan netlink.LinkUpdate, done chan struct{}) {
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
close(done)
|
|
|
|
return
|
|
|
|
case <-done:
|
|
|
|
return
|
|
|
|
case update := <-ch:
|
|
|
|
if update.Header.Type == rtmType {
|
|
|
|
ifname := update.Link.Attrs().Name
|
|
|
|
if ifname == _ifname {
|
|
|
|
cb()
|
|
|
|
close(done)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}(c.closed, ch, done)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// addNewLinkBindLanCb waits for NEWLINK msg of given `ifname` and invokes `bindLan`.
|
|
|
|
func (c *controlPlaneCore) addNewLinkBindLanCb(ifname string, autoConfigKernelParameter bool) error {
|
|
|
|
return c.addLinkCb(ifname, unix.RTM_NEWLINK, func() {
|
|
|
|
c.log.Warnf("New link creation of '%v' is detected. Bind LAN program to it.", ifname)
|
|
|
|
if err := c.addQdisc(ifname); err != nil {
|
|
|
|
c.log.Errorf("addQdisc: %v", err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if err := c.bindLan(ifname, autoConfigKernelParameter); err != nil {
|
|
|
|
c.log.Errorf("bindLan: %v", err)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
// bindLan automatically configures kernel parameters and bind to lan interface `ifname`.
|
|
|
|
// bindLan supports lazy-bind if interface `ifname` is not found.
|
|
|
|
// bindLan supports rebinding when the interface `ifname` is deleted in the future.
|
|
|
|
func (c *controlPlaneCore) bindLan(ifname string, autoConfigKernelParameter bool) error {
|
|
|
|
if autoConfigKernelParameter {
|
|
|
|
SetSendRedirects(ifname, "0")
|
|
|
|
SetForwarding(ifname, "1")
|
|
|
|
}
|
|
|
|
if err := c._bindLan(ifname); err != nil {
|
|
|
|
var notFoundErr netlink.LinkNotFoundError
|
|
|
|
if !errors.As(err, ¬FoundErr) {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
// Not found error.
|
|
|
|
|
|
|
|
// Listen for `NEWLINK` to bind.
|
|
|
|
c.log.Warnf("Link '%v' is not found. Bind LAN program to it once it is created.", ifname)
|
|
|
|
if e := c.addNewLinkBindLanCb(ifname, autoConfigKernelParameter); e != nil {
|
|
|
|
return fmt.Errorf("%w: %v", err, e)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
// Listen for `DELLINK` and add `NEWLINK` callback to re-bind.
|
|
|
|
if err := c.addLinkCb(ifname, unix.RTM_DELLINK, func() {
|
|
|
|
c.log.Warnf("Link deletion of '%v' is detected. Bind LAN program to it once it is re-created.", ifname)
|
|
|
|
if e := c.addNewLinkBindLanCb(ifname, autoConfigKernelParameter); e != nil {
|
|
|
|
c.log.Errorf("Failed to add callback for re-bind LAN program to '%v': %v", ifname, e)
|
|
|
|
}
|
|
|
|
}); err != nil {
|
|
|
|
return fmt.Errorf("failed to add re-bind callback: %w", err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *controlPlaneCore) _bindLan(ifname string) error {
|
|
|
|
c.mu.Lock()
|
|
|
|
defer c.mu.Unlock()
|
|
|
|
select {
|
|
|
|
case <-c.closed.Done():
|
|
|
|
return nil
|
|
|
|
default:
|
|
|
|
}
|
2023-02-10 10:59:40 +07:00
|
|
|
c.log.Infof("Bind to LAN: %v", ifname)
|
|
|
|
|
2023-02-13 09:52:40 +07:00
|
|
|
link, err := netlink.LinkByName(ifname)
|
2023-02-10 10:55:00 +07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-02-26 04:07:42 +07:00
|
|
|
if err = CheckIpforward(ifname); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err = CheckSendRedirects(ifname); err != nil {
|
2023-02-02 20:22:18 +07:00
|
|
|
return err
|
|
|
|
}
|
2023-02-04 10:38:01 +07:00
|
|
|
/// Insert an elem into IfindexParamsMap.
|
2023-02-07 22:52:37 +07:00
|
|
|
ifParams, err := getIfParamsFromLink(link)
|
2023-02-04 10:38:01 +07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err = ifParams.CheckVersionRequirement(c.kernelVersion); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err := c.bpf.IfindexParamsMap.Update(uint32(link.Attrs().Index), ifParams, ebpf.UpdateAny); err != nil {
|
|
|
|
return fmt.Errorf("update IfindexIpsMap: %w", err)
|
|
|
|
}
|
2023-02-02 20:22:18 +07:00
|
|
|
|
2023-02-08 13:36:16 +07:00
|
|
|
// Insert filters.
|
|
|
|
filterIngress := &netlink.BpfFilter{
|
|
|
|
FilterAttrs: netlink.FilterAttrs{
|
|
|
|
LinkIndex: link.Attrs().Index,
|
|
|
|
Parent: netlink.HANDLE_MIN_INGRESS,
|
2023-02-27 12:29:42 +07:00
|
|
|
Handle: netlink.MakeHandle(0x2023, 0b100+uint16(c.flip)),
|
2023-02-08 13:36:16 +07:00
|
|
|
Protocol: unix.ETH_P_ALL,
|
|
|
|
// Priority should be behind of WAN's
|
|
|
|
Priority: 2,
|
|
|
|
},
|
|
|
|
Fd: c.bpf.bpfPrograms.TproxyLanIngress.FD(),
|
|
|
|
Name: consts.AppName + "_lan_ingress",
|
|
|
|
DirectAction: true,
|
|
|
|
}
|
|
|
|
// Remove and add.
|
|
|
|
_ = netlink.FilterDel(filterIngress)
|
2023-02-27 13:36:36 +07:00
|
|
|
if !c.isReload {
|
|
|
|
// Clean up thoroughly.
|
|
|
|
filterIngressFlipped := deepcopy.Copy(filterIngress).(*netlink.BpfFilter)
|
|
|
|
filterIngressFlipped.FilterAttrs.Handle ^= 1
|
|
|
|
_ = netlink.FilterDel(filterIngressFlipped)
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
if err := netlink.FilterAdd(filterIngress); err != nil {
|
|
|
|
return fmt.Errorf("cannot attach ebpf object to filter ingress: %w", err)
|
|
|
|
}
|
|
|
|
c.deferFuncs = append(c.deferFuncs, func() error {
|
|
|
|
if err := netlink.FilterDel(filterIngress); err != nil {
|
|
|
|
return fmt.Errorf("FilterDel(%v:%v): %w", ifname, filterIngress.Name, err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
2023-02-12 20:50:15 +07:00
|
|
|
|
|
|
|
// Insert filters.
|
|
|
|
filterEgress := &netlink.BpfFilter{
|
|
|
|
FilterAttrs: netlink.FilterAttrs{
|
|
|
|
LinkIndex: link.Attrs().Index,
|
|
|
|
Parent: netlink.HANDLE_MIN_EGRESS,
|
2023-02-27 12:29:42 +07:00
|
|
|
Handle: netlink.MakeHandle(0x2023, 0b010+uint16(c.flip)),
|
2023-02-12 20:50:15 +07:00
|
|
|
Protocol: unix.ETH_P_ALL,
|
|
|
|
// Priority should be front of WAN's
|
|
|
|
Priority: 1,
|
|
|
|
},
|
|
|
|
Fd: c.bpf.bpfPrograms.TproxyLanEgress.FD(),
|
|
|
|
Name: consts.AppName + "_lan_egress",
|
|
|
|
DirectAction: true,
|
|
|
|
}
|
|
|
|
// Remove and add.
|
|
|
|
_ = netlink.FilterDel(filterEgress)
|
2023-02-27 13:36:36 +07:00
|
|
|
if !c.isReload {
|
|
|
|
// Clean up thoroughly.
|
|
|
|
filterEgressFlipped := deepcopy.Copy(filterEgress).(*netlink.BpfFilter)
|
|
|
|
filterEgressFlipped.FilterAttrs.Handle ^= 1
|
|
|
|
_ = netlink.FilterDel(filterEgressFlipped)
|
|
|
|
}
|
2023-02-12 20:50:15 +07:00
|
|
|
if err := netlink.FilterAdd(filterEgress); err != nil {
|
|
|
|
return fmt.Errorf("cannot attach ebpf object to filter egress: %w", err)
|
|
|
|
}
|
|
|
|
c.deferFuncs = append(c.deferFuncs, func() error {
|
|
|
|
if err := netlink.FilterDel(filterEgress); err != nil {
|
|
|
|
return fmt.Errorf("FilterDel(%v:%v): %w", ifname, filterEgress.Name, err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
2023-02-08 13:36:16 +07:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-02-27 12:29:42 +07:00
|
|
|
func (c *controlPlaneCore) setupSkPidMonitor() error {
|
2023-02-02 20:22:18 +07:00
|
|
|
/// Set-up SrcPidMapper.
|
|
|
|
/// Attach programs to support pname routing.
|
|
|
|
// Get the first-mounted cgroupv2 path.
|
|
|
|
cgroupPath, err := detectCgroupPath()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
// Bind cg programs
|
|
|
|
type cgProg struct {
|
|
|
|
Name string
|
|
|
|
Prog *ebpf.Program
|
|
|
|
Attach ebpf.AttachType
|
|
|
|
}
|
|
|
|
cgProgs := []cgProg{
|
|
|
|
{Prog: c.bpf.TproxyWanCgSockCreate, Attach: ebpf.AttachCGroupInetSockCreate},
|
|
|
|
{Prog: c.bpf.TproxyWanCgSockRelease, Attach: ebpf.AttachCgroupInetSockRelease},
|
2023-02-12 22:15:53 +07:00
|
|
|
{Prog: c.bpf.TproxyWanCgConnect4, Attach: ebpf.AttachCGroupInet4Connect},
|
|
|
|
{Prog: c.bpf.TproxyWanCgConnect6, Attach: ebpf.AttachCGroupInet6Connect},
|
|
|
|
{Prog: c.bpf.TproxyWanCgSendmsg4, Attach: ebpf.AttachCGroupUDP4Sendmsg},
|
|
|
|
{Prog: c.bpf.TproxyWanCgSendmsg6, Attach: ebpf.AttachCGroupUDP6Sendmsg},
|
2023-02-02 20:22:18 +07:00
|
|
|
}
|
|
|
|
for _, prog := range cgProgs {
|
|
|
|
attached, err := ciliumLink.AttachCgroup(ciliumLink.CgroupOptions{
|
|
|
|
Path: cgroupPath,
|
|
|
|
Attach: prog.Attach,
|
|
|
|
Program: prog.Prog,
|
|
|
|
})
|
|
|
|
if err != nil {
|
2023-04-02 16:43:50 +07:00
|
|
|
return fmt.Errorf("AttachCgroup: %v: %w", prog.Prog.String(), err)
|
2023-02-02 20:22:18 +07:00
|
|
|
}
|
|
|
|
c.deferFuncs = append(c.deferFuncs, func() error {
|
|
|
|
if err := attached.Close(); err != nil {
|
|
|
|
return fmt.Errorf("inet6Bind.Close(): %w", err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
return nil
|
|
|
|
}
|
2023-07-07 16:35:01 +07:00
|
|
|
|
2023-02-27 12:29:42 +07:00
|
|
|
func (c *controlPlaneCore) bindWan(ifname string) error {
|
2023-07-07 16:35:01 +07:00
|
|
|
return c._bindWan(ifname)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *controlPlaneCore) _bindWan(ifname string) error {
|
|
|
|
c.mu.Lock()
|
|
|
|
defer c.mu.Unlock()
|
|
|
|
select {
|
|
|
|
case <-c.closed.Done():
|
|
|
|
return nil
|
|
|
|
default:
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
c.log.Infof("Bind to WAN: %v", ifname)
|
|
|
|
link, err := netlink.LinkByName(ifname)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2023-02-02 20:22:18 +07:00
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
if link.Attrs().Index == consts.LoopbackIfIndex {
|
|
|
|
return fmt.Errorf("cannot bind to loopback interface")
|
|
|
|
}
|
|
|
|
/// Insert an elem into IfindexParamsMap.
|
|
|
|
ifParams, err := getIfParamsFromLink(link)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err = ifParams.CheckVersionRequirement(c.kernelVersion); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err := c.bpf.IfindexParamsMap.Update(uint32(link.Attrs().Index), ifParams, ebpf.UpdateAny); err != nil {
|
|
|
|
return fmt.Errorf("update IfindexIpsMap: %w", err)
|
2023-02-02 20:22:18 +07:00
|
|
|
}
|
|
|
|
|
2023-02-08 13:36:16 +07:00
|
|
|
/// Set-up WAN ingress/egress TC programs.
|
2023-02-02 20:22:18 +07:00
|
|
|
// Insert TC filters
|
|
|
|
filterEgress := &netlink.BpfFilter{
|
|
|
|
FilterAttrs: netlink.FilterAttrs{
|
|
|
|
LinkIndex: link.Attrs().Index,
|
|
|
|
Parent: netlink.HANDLE_MIN_EGRESS,
|
2023-02-27 12:29:42 +07:00
|
|
|
Handle: netlink.MakeHandle(0x2023, 0b100+uint16(c.flip)),
|
2023-02-02 20:22:18 +07:00
|
|
|
Protocol: unix.ETH_P_ALL,
|
2023-02-12 20:50:15 +07:00
|
|
|
Priority: 2,
|
2023-02-02 20:22:18 +07:00
|
|
|
},
|
|
|
|
Fd: c.bpf.bpfPrograms.TproxyWanEgress.FD(),
|
2023-02-08 13:36:16 +07:00
|
|
|
Name: consts.AppName + "_wan_egress",
|
2023-02-02 20:22:18 +07:00
|
|
|
DirectAction: true,
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
_ = netlink.FilterDel(filterEgress)
|
2023-02-27 13:36:36 +07:00
|
|
|
// Remove and add.
|
|
|
|
if !c.isReload {
|
|
|
|
// Clean up thoroughly.
|
|
|
|
filterEgressFlipped := deepcopy.Copy(filterEgress).(*netlink.BpfFilter)
|
|
|
|
filterEgressFlipped.FilterAttrs.Handle ^= 1
|
|
|
|
_ = netlink.FilterDel(filterEgressFlipped)
|
|
|
|
}
|
2023-02-02 20:22:18 +07:00
|
|
|
if err := netlink.FilterAdd(filterEgress); err != nil {
|
|
|
|
return fmt.Errorf("cannot attach ebpf object to filter egress: %w", err)
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
c.deferFuncs = append(c.deferFuncs, func() error {
|
|
|
|
if err := netlink.FilterDel(filterEgress); err != nil && !os.IsNotExist(err) {
|
|
|
|
return fmt.Errorf("FilterDel(%v:%v): %w", ifname, filterEgress.Name, err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
2023-02-02 20:22:18 +07:00
|
|
|
|
|
|
|
filterIngress := &netlink.BpfFilter{
|
|
|
|
FilterAttrs: netlink.FilterAttrs{
|
|
|
|
LinkIndex: link.Attrs().Index,
|
|
|
|
Parent: netlink.HANDLE_MIN_INGRESS,
|
2023-02-27 12:29:42 +07:00
|
|
|
Handle: netlink.MakeHandle(0x2023, 0b010+uint16(c.flip)),
|
2023-02-02 20:22:18 +07:00
|
|
|
Protocol: unix.ETH_P_ALL,
|
2023-02-08 13:36:16 +07:00
|
|
|
Priority: 1,
|
2023-02-02 20:22:18 +07:00
|
|
|
},
|
|
|
|
Fd: c.bpf.bpfPrograms.TproxyWanIngress.FD(),
|
2023-02-08 13:36:16 +07:00
|
|
|
Name: consts.AppName + "_wan_ingress",
|
2023-02-02 20:22:18 +07:00
|
|
|
DirectAction: true,
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
_ = netlink.FilterDel(filterIngress)
|
2023-02-27 13:36:36 +07:00
|
|
|
// Remove and add.
|
|
|
|
if !c.isReload {
|
|
|
|
// Clean up thoroughly.
|
|
|
|
filterIngressFlipped := deepcopy.Copy(filterIngress).(*netlink.BpfFilter)
|
|
|
|
filterIngressFlipped.FilterAttrs.Handle ^= 1
|
|
|
|
_ = netlink.FilterDel(filterIngressFlipped)
|
|
|
|
}
|
2023-02-02 20:22:18 +07:00
|
|
|
if err := netlink.FilterAdd(filterIngress); err != nil {
|
|
|
|
return fmt.Errorf("cannot attach ebpf object to filter ingress: %w", err)
|
|
|
|
}
|
2023-02-08 13:36:16 +07:00
|
|
|
c.deferFuncs = append(c.deferFuncs, func() error {
|
|
|
|
if err := netlink.FilterDel(filterIngress); err != nil {
|
|
|
|
return fmt.Errorf("FilterDel(%v:%v): %w", ifname, filterIngress.Name, err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
2023-02-02 20:22:18 +07:00
|
|
|
return nil
|
|
|
|
}
|
2023-02-25 01:38:21 +07:00
|
|
|
|
|
|
|
// BatchUpdateDomainRouting update bpf map domain_routing. Since one IP may have multiple domains, this function should
|
|
|
|
// be invoked every A/AAAA-record lookup.
|
2023-02-27 12:29:42 +07:00
|
|
|
func (c *controlPlaneCore) BatchUpdateDomainRouting(cache *DnsCache) error {
|
2023-02-25 01:38:21 +07:00
|
|
|
// Parse ips from DNS resp answers.
|
|
|
|
var ips []netip.Addr
|
2023-07-09 15:02:17 +07:00
|
|
|
for _, ans := range cache.Answer {
|
|
|
|
var (
|
|
|
|
ip netip.Addr
|
|
|
|
ok bool
|
|
|
|
)
|
|
|
|
switch body := ans.(type) {
|
|
|
|
case *dnsmessage.A:
|
|
|
|
ip, ok = netip.AddrFromSlice(body.A)
|
|
|
|
case *dnsmessage.AAAA:
|
|
|
|
ip, ok = netip.AddrFromSlice(body.AAAA)
|
2023-02-25 01:38:21 +07:00
|
|
|
}
|
2023-07-09 15:02:17 +07:00
|
|
|
if !ok || ip.IsUnspecified() {
|
2023-04-29 12:59:20 +07:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
ips = append(ips, ip)
|
2023-02-25 01:38:21 +07:00
|
|
|
}
|
|
|
|
if len(ips) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Update bpf map.
|
|
|
|
// Construct keys and vals, and BpfMapBatchUpdate.
|
|
|
|
var keys [][4]uint32
|
|
|
|
var vals []bpfDomainRouting
|
|
|
|
for _, ip := range ips {
|
|
|
|
ip6 := ip.As16()
|
|
|
|
keys = append(keys, common.Ipv6ByteSliceToUint32Array(ip6[:]))
|
|
|
|
r := bpfDomainRouting{}
|
|
|
|
if len(cache.DomainBitmap) != len(r.Bitmap) {
|
|
|
|
return fmt.Errorf("domain bitmap length not sync with kern program")
|
|
|
|
}
|
|
|
|
copy(r.Bitmap[:], cache.DomainBitmap)
|
|
|
|
vals = append(vals, r)
|
|
|
|
}
|
|
|
|
if _, err := BpfMapBatchUpdate(c.bpf.DomainRoutingMap, keys, vals, &ebpf.BatchOptions{
|
|
|
|
ElemFlags: uint64(ebpf.UpdateAny),
|
|
|
|
}); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
2023-02-27 12:29:42 +07:00
|
|
|
|
2023-05-30 21:10:32 +07:00
|
|
|
// BatchRemoveDomainRouting remove bpf map domain_routing.
|
|
|
|
func (c *controlPlaneCore) BatchRemoveDomainRouting(cache *DnsCache) error {
|
|
|
|
// Parse ips from DNS resp answers.
|
|
|
|
var ips []netip.Addr
|
2023-07-09 15:02:17 +07:00
|
|
|
for _, ans := range cache.Answer {
|
|
|
|
var (
|
|
|
|
ip netip.Addr
|
|
|
|
ok bool
|
|
|
|
)
|
|
|
|
switch body := ans.(type) {
|
|
|
|
case *dnsmessage.A:
|
|
|
|
ip, ok = netip.AddrFromSlice(body.A)
|
|
|
|
case *dnsmessage.AAAA:
|
|
|
|
ip, ok = netip.AddrFromSlice(body.AAAA)
|
2023-05-30 21:10:32 +07:00
|
|
|
}
|
2023-07-09 15:02:17 +07:00
|
|
|
if !ok || ip.IsUnspecified() {
|
2023-05-30 21:10:32 +07:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
ips = append(ips, ip)
|
|
|
|
}
|
|
|
|
if len(ips) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Update bpf map.
|
|
|
|
// Construct keys and vals, and BpfMapBatchUpdate.
|
|
|
|
var keys [][4]uint32
|
|
|
|
for _, ip := range ips {
|
|
|
|
ip6 := ip.As16()
|
|
|
|
keys = append(keys, common.Ipv6ByteSliceToUint32Array(ip6[:]))
|
|
|
|
}
|
|
|
|
if _, err := BpfMapBatchDelete(c.bpf.DomainRoutingMap, keys); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-02-27 12:29:42 +07:00
|
|
|
// EjectBpf will resect bpf from destroying life-cycle of control plane core.
|
|
|
|
func (c *controlPlaneCore) EjectBpf() *bpfObjects {
|
2023-03-02 21:25:51 +07:00
|
|
|
if !c.bpfEjected && !c.isReload {
|
|
|
|
c.deferFuncs = c.deferFuncs[1:]
|
|
|
|
}
|
|
|
|
c.bpfEjected = true
|
2023-02-27 12:29:42 +07:00
|
|
|
return c.bpf
|
|
|
|
}
|
2023-03-02 21:25:51 +07:00
|
|
|
|
|
|
|
// InjectBpf will inject bpf back.
|
|
|
|
func (c *controlPlaneCore) InjectBpf(bpf *bpfObjects) {
|
|
|
|
if c.bpfEjected {
|
|
|
|
c.bpfEjected = false
|
|
|
|
c.deferFuncs = append([]func() error{bpf.Close}, c.deferFuncs...)
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|