| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
27712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761
77717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055 |
- // Copyright (c) Tailscale Inc & AUTHORS
- // SPDX-License-Identifier: BSD-3-Clause
- //go:build linux
- package linuxfw
- import (
- "encoding/binary"
- "encoding/hex"
- "errors"
- "fmt"
- "net"
- "net/netip"
- "reflect"
- "strings"
- "github.com/google/nftables"
- "github.com/google/nftables/expr"
- "golang.org/x/sys/unix"
- "tailscale.com/net/tsaddr"
- "tailscale.com/types/logger"
- "tailscale.com/types/ptr"
- )
// Names of the Tailscale-managed chains. Each starts with the "ts-" prefix
// that isTSChain checks for.
const (
	chainNameForward     = "ts-forward"
	chainNameInput       = "ts-input"
	chainNamePostrouting = "ts-postrouting"
)

// chainTypeRegular is the chain type of an nftables chain that is not
// attached to a hook.
const chainTypeRegular = ""
// chainInfo bundles the arguments describing a chain for getOrCreateChain and
// createChainIfNotExist: the owning table plus the chain's name, type, hook,
// priority and policy.
type chainInfo struct {
	table         *nftables.Table         // table the chain lives in
	name          string                  // chain name within the table
	chainType     nftables.ChainType      // chain type, or chainTypeRegular
	chainHook     *nftables.ChainHook     // hook the chain attaches to
	chainPriority *nftables.ChainPriority // priority of the chain on its hook
	chainPolicy   *nftables.ChainPolicy   // policy passed through when the chain is created
}
// nftable contains the nat and filter tables for the given IP family (Proto).
type nftable struct {
	Proto  nftables.TableFamily // IPv4 or IPv6
	Filter *nftables.Table      // filter table for Proto
	Nat    *nftables.Table      // nat table for Proto
}
// nftablesRunner implements a netfilterRunner using the netlink based nftables
// library. As nftables allows for arbitrary tables and chains, there is a need
// to follow conventions in order to integrate well with a surrounding
// ecosystem. The rules installed by nftablesRunner have the following
// properties:
//   - Install rules that intend to take precedence over rules installed by
//     other software. Tailscale provides packet filtering for tailnet traffic
//     inside the daemon based on the tailnet ACL rules.
//   - As nftables "accept" is not final, rules from high priority tables (low
//     numbers) will fall through to lower priority tables (high numbers). In
//     order to effectively be 'final', we install "jump" rules into conventional
//     tables and chains that will reach an accept verdict inside those tables.
//   - The table and chain conventions followed here are those used by
//     `iptables-nft` and `ufw`, so that those tools co-exist and do not
//     negatively affect Tailscale function.
//   - Be mindful that:
//     1) all chains attached to a given hook (e.g. the forward hook) are
//     processed in priority order until either a rule in one of the chains
//     issues a drop verdict or there are no more chains for that hook;
//     2) processing of individual rules within a chain stops once one of
//     them issues a final verdict (accept, drop).
//     https://wiki.nftables.org/wiki-nftables/index.php/Configuring_chains
type nftablesRunner struct {
	conn *nftables.Conn // netlink connection used for all nftables operations
	nft4 *nftable       // IPv4 tables, never nil
	nft6 *nftable       // IPv6 tables or nil if the system does not support IPv6

	v6Available bool // whether the host supports IPv6
}
- func (n *nftablesRunner) ensurePreroutingChain(dst netip.Addr) (*nftables.Table, *nftables.Chain, error) {
- polAccept := nftables.ChainPolicyAccept
- table, err := n.getNFTByAddr(dst)
- if err != nil {
- return nil, nil, fmt.Errorf("error setting up nftables for IP family of %v: %w", dst, err)
- }
- nat, err := createTableIfNotExist(n.conn, table.Proto, "nat")
- if err != nil {
- return nil, nil, fmt.Errorf("error ensuring nat table: %w", err)
- }
- // ensure prerouting chain exists
- preroutingCh, err := getOrCreateChain(n.conn, chainInfo{
- table: nat,
- name: "PREROUTING",
- chainType: nftables.ChainTypeNAT,
- chainHook: nftables.ChainHookPrerouting,
- chainPriority: nftables.ChainPriorityNATDest,
- chainPolicy: &polAccept,
- })
- if err != nil {
- return nil, nil, fmt.Errorf("error ensuring prerouting chain: %w", err)
- }
- return nat, preroutingCh, nil
- }
- func (n *nftablesRunner) AddDNATRule(origDst netip.Addr, dst netip.Addr) error {
- nat, preroutingCh, err := n.ensurePreroutingChain(dst)
- if err != nil {
- return err
- }
- var daddrOffset, fam, dadderLen uint32
- if origDst.Is4() {
- daddrOffset = 16
- dadderLen = 4
- fam = unix.NFPROTO_IPV4
- } else {
- daddrOffset = 24
- dadderLen = 16
- fam = unix.NFPROTO_IPV6
- }
- dnatRule := &nftables.Rule{
- Table: nat,
- Chain: preroutingCh,
- Exprs: []expr.Any{
- &expr.Payload{
- DestRegister: 1,
- Base: expr.PayloadBaseNetworkHeader,
- Offset: daddrOffset,
- Len: dadderLen,
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: origDst.AsSlice(),
- },
- &expr.Immediate{
- Register: 1,
- Data: dst.AsSlice(),
- },
- &expr.NAT{
- Type: expr.NATTypeDestNAT,
- Family: fam,
- RegAddrMin: 1,
- },
- },
- }
- n.conn.InsertRule(dnatRule)
- return n.conn.Flush()
- }
- // DNATWithLoadBalancer currently just forwards all traffic destined for origDst
- // to the first IP address from the backend targets.
- // TODO (irbekrm): instead of doing this load balance traffic evenly to all
- // backend destinations.
- // https://github.com/tailscale/tailscale/commit/d37f2f508509c6c35ad724fd75a27685b90b575b#diff-a3bcbcd1ca198799f4f768dc56fea913e1945a6b3ec9dbec89325a84a19a85e7R148-R232
- func (n *nftablesRunner) DNATWithLoadBalancer(origDst netip.Addr, dsts []netip.Addr) error {
- return n.AddDNATRule(origDst, dsts[0])
- }
- func (n *nftablesRunner) DNATNonTailscaleTraffic(tunname string, dst netip.Addr) error {
- nat, preroutingCh, err := n.ensurePreroutingChain(dst)
- if err != nil {
- return err
- }
- var famConst uint32
- if dst.Is4() {
- famConst = unix.NFPROTO_IPV4
- } else {
- famConst = unix.NFPROTO_IPV6
- }
- dnatRule := &nftables.Rule{
- Table: nat,
- Chain: preroutingCh,
- Exprs: []expr.Any{
- &expr.Meta{Key: expr.MetaKeyOIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpNeq,
- Register: 1,
- Data: []byte(tunname),
- },
- &expr.Immediate{
- Register: 1,
- Data: dst.AsSlice(),
- },
- &expr.NAT{
- Type: expr.NATTypeDestNAT,
- Family: famConst,
- RegAddrMin: 1,
- },
- },
- }
- n.conn.InsertRule(dnatRule)
- return n.conn.Flush()
- }
- func (n *nftablesRunner) EnsureSNATForDst(src, dst netip.Addr) error {
- polAccept := nftables.ChainPolicyAccept
- table, err := n.getNFTByAddr(dst)
- if err != nil {
- return fmt.Errorf("error setting up nftables for IP family of %v: %w", dst, err)
- }
- nat, err := createTableIfNotExist(n.conn, table.Proto, "nat")
- if err != nil {
- return fmt.Errorf("error ensuring nat table exists: %w", err)
- }
- // ensure postrouting chain exists
- postRoutingCh, err := getOrCreateChain(n.conn, chainInfo{
- table: nat,
- name: "POSTROUTING",
- chainType: nftables.ChainTypeNAT,
- chainHook: nftables.ChainHookPostrouting,
- chainPriority: nftables.ChainPriorityNATSource,
- chainPolicy: &polAccept,
- })
- if err != nil {
- return fmt.Errorf("error ensuring postrouting chain: %w", err)
- }
- rules, err := n.conn.GetRules(nat, postRoutingCh)
- if err != nil {
- return fmt.Errorf("error listing rules: %w", err)
- }
- snatRulePrefixMatch := fmt.Sprintf("dst:%s,src:", dst.String())
- snatRuleFullMatch := fmt.Sprintf("%s%s", snatRulePrefixMatch, src.String())
- for _, rule := range rules {
- current := string(rule.UserData)
- if strings.HasPrefix(string(rule.UserData), snatRulePrefixMatch) {
- if strings.EqualFold(current, snatRuleFullMatch) {
- return nil // already exists, do nothing
- }
- if err := n.conn.DelRule(rule); err != nil {
- return fmt.Errorf("error deleting SNAT rule: %w", err)
- }
- }
- }
- rule := snatRule(nat, postRoutingCh, src, dst, []byte(snatRuleFullMatch))
- n.conn.AddRule(rule)
- return n.conn.Flush()
- }
- // ClampMSSToPMTU ensures that all packets with TCP flags (SYN, ACK, RST) set
- // being forwarded via the given interface (tun) have MSS set to <MTU of the
- // interface> - 40 (IP and TCP headers). This can be useful if this tailscale
- // instance is expected to run as a forwarding proxy, forwarding packets from an
- // endpoint with higher MTU in an environment where path MTU discovery is
- // expected to not work (such as the proxies created by the Tailscale Kubernetes
- // operator). ClamMSSToPMTU creates a new base-chain ts-clamp in the filter
- // table with accept policy and priority -150. In practice, this means that for
- // SYN packets the clamp rule in this chain will likely run first and accept the
- // packet. This is fine because 1) nftables run ALL chains with the same hook
- // type unless a rule in one of them drops the packet and 2) this chain does not
- // have functionality to drop the packet- so in practice a matching clamp rule
- // will always be followed by the custom tailscale filtering rules in the other
- // chains attached to the filter hook (FORWARD, ts-forward).
- // We do not want to place the clamping rule into FORWARD/ts-forward chains
- // because wgengine populates those chains with rules that contain accept
- // verdicts that would cause no further procesing within that chain. This
- // functionality is currently invoked from outside wgengine (containerboot), so
- // we don't want to race with wgengine for rule ordering within chains.
- func (n *nftablesRunner) ClampMSSToPMTU(tun string, addr netip.Addr) error {
- polAccept := nftables.ChainPolicyAccept
- table, err := n.getNFTByAddr(addr)
- if err != nil {
- return fmt.Errorf("error setting up nftables for IP family of %v: %w", addr, err)
- }
- filterTable, err := createTableIfNotExist(n.conn, table.Proto, "filter")
- if err != nil {
- return fmt.Errorf("error ensuring filter table: %w", err)
- }
- // ensure ts-clamp chain exists
- fwChain, err := getOrCreateChain(n.conn, chainInfo{
- table: filterTable,
- name: "ts-clamp",
- chainType: nftables.ChainTypeFilter,
- chainHook: nftables.ChainHookForward,
- chainPriority: nftables.ChainPriorityMangle,
- chainPolicy: &polAccept,
- })
- if err != nil {
- return fmt.Errorf("error ensuring forward chain: %w", err)
- }
- clampRule := &nftables.Rule{
- Table: filterTable,
- Chain: fwChain,
- Exprs: []expr.Any{
- &expr.Meta{Key: expr.MetaKeyOIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte(tun),
- },
- &expr.Meta{Key: expr.MetaKeyL4PROTO, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte{unix.IPPROTO_TCP},
- },
- &expr.Payload{
- DestRegister: 1,
- Base: expr.PayloadBaseTransportHeader,
- Offset: 13,
- Len: 1,
- },
- &expr.Bitwise{
- DestRegister: 1,
- SourceRegister: 1,
- Len: 1,
- Mask: []byte{0x02},
- Xor: []byte{0x00},
- },
- &expr.Cmp{
- Op: expr.CmpOpNeq, // match any packet with a TCP flag set (SYN, ACK, RST)
- Register: 1,
- Data: []byte{0x00},
- },
- &expr.Rt{
- Register: 1,
- Key: expr.RtTCPMSS,
- },
- &expr.Byteorder{
- DestRegister: 1,
- SourceRegister: 1,
- Op: expr.ByteorderHton,
- Len: 2,
- Size: 2,
- },
- &expr.Exthdr{
- SourceRegister: 1,
- Type: 2,
- Offset: 2,
- Len: 2,
- Op: expr.ExthdrOpTcpopt,
- },
- },
- }
- n.conn.AddRule(clampRule)
- return n.conn.Flush()
- }
- // deleteTableIfExists deletes a nftables table via connection c if it exists
- // within the given family.
- func deleteTableIfExists(c *nftables.Conn, family nftables.TableFamily, name string) error {
- t, err := getTableIfExists(c, family, name)
- if err != nil {
- return fmt.Errorf("get table: %w", err)
- }
- if t == nil {
- // Table does not exist, so nothing to delete.
- return nil
- }
- c.DelTable(t)
- if err := c.Flush(); err != nil {
- if t, err = getTableIfExists(c, family, name); t == nil && err == nil {
- // Check if the table still exists. If it does not, then the error
- // is due to the table not existing, so we can ignore it. Maybe a
- // concurrent process deleted the table.
- return nil
- }
- return fmt.Errorf("del table: %w", err)
- }
- return nil
- }
- // getTableIfExists returns the table with the given name from the given family
- // if it exists. If none match, it returns (nil, nil).
- func getTableIfExists(c *nftables.Conn, family nftables.TableFamily, name string) (*nftables.Table, error) {
- tables, err := c.ListTables()
- if err != nil {
- return nil, fmt.Errorf("get tables: %w", err)
- }
- for _, table := range tables {
- if table.Name == name && table.Family == family {
- return table, nil
- }
- }
- return nil, nil
- }
- // createTableIfNotExist creates a nftables table via connection c if it does
- // not exist within the given family.
- func createTableIfNotExist(c *nftables.Conn, family nftables.TableFamily, name string) (*nftables.Table, error) {
- if t, err := getTableIfExists(c, family, name); err != nil {
- return nil, fmt.Errorf("get table: %w", err)
- } else if t != nil {
- return t, nil
- }
- t := c.AddTable(&nftables.Table{
- Family: family,
- Name: name,
- })
- if err := c.Flush(); err != nil {
- return nil, fmt.Errorf("add table: %w", err)
- }
- return t, nil
- }
// errorChainNotFound is returned when a chain cannot be found in a table.
//
// The fields are declared in (tableName, chainName) order on purpose: the
// values in this file are built with positional literals of the form
// errorChainNotFound{table.Name, name}, so this order is what makes the
// table name land in tableName and the chain name in chainName, and hence
// what makes Error report them the right way round.
type errorChainNotFound struct {
	tableName string
	chainName string
}

// Error implements the error interface.
func (e errorChainNotFound) Error() string {
	return fmt.Sprintf("chain %s not found in table %s", e.chainName, e.tableName)
}
- // getChainFromTable returns the chain with the given name from the given table.
- // Note that a chain name is unique within a table.
- func getChainFromTable(c *nftables.Conn, table *nftables.Table, name string) (*nftables.Chain, error) {
- chains, err := c.ListChainsOfTableFamily(table.Family)
- if err != nil {
- return nil, fmt.Errorf("list chains: %w", err)
- }
- for _, chain := range chains {
- // Table family is already checked so table name is unique
- if chain.Table.Name == table.Name && chain.Name == name {
- return chain, nil
- }
- }
- return nil, errorChainNotFound{table.Name, name}
- }
// isTSChain reports whether name carries the "ts-" prefix that marks a
// Tailscale-managed chain.
func isTSChain(name string) bool {
	const tsPrefix = "ts-"
	_, hasPrefix := strings.CutPrefix(name, tsPrefix)
	return hasPrefix
}
- // createChainIfNotExist creates a chain with the given name in the given table
- // if it does not exist.
- func createChainIfNotExist(c *nftables.Conn, cinfo chainInfo) error {
- _, err := getOrCreateChain(c, cinfo)
- return err
- }
- func getOrCreateChain(c *nftables.Conn, cinfo chainInfo) (*nftables.Chain, error) {
- chain, err := getChainFromTable(c, cinfo.table, cinfo.name)
- if err != nil && !errors.Is(err, errorChainNotFound{cinfo.table.Name, cinfo.name}) {
- return nil, fmt.Errorf("get chain: %w", err)
- } else if err == nil {
- // The chain already exists. If it is a TS chain, check the
- // type/hook/priority, but for "conventional chains" assume they're what
- // we expect (in case iptables-nft/ufw make minor behavior changes in
- // the future).
- if isTSChain(chain.Name) && (chain.Type != cinfo.chainType || *chain.Hooknum != *cinfo.chainHook || *chain.Priority != *cinfo.chainPriority) {
- return nil, fmt.Errorf("chain %s already exists with different type/hook/priority", cinfo.name)
- }
- return chain, nil
- }
- chain = c.AddChain(&nftables.Chain{
- Name: cinfo.name,
- Table: cinfo.table,
- Type: cinfo.chainType,
- Hooknum: cinfo.chainHook,
- Priority: cinfo.chainPriority,
- Policy: cinfo.chainPolicy,
- })
- if err := c.Flush(); err != nil {
- return nil, fmt.Errorf("add chain: %w", err)
- }
- return chain, nil
- }
// NetfilterRunner abstracts helpers to run netfilter commands. It is
// implemented by linuxfw.IPTablesRunner and linuxfw.NfTablesRunner.
type NetfilterRunner interface {
	// AddLoopbackRule adds a rule to permit loopback traffic to addr. This rule
	// is added only if it does not already exist.
	AddLoopbackRule(addr netip.Addr) error

	// DelLoopbackRule removes the rule added by AddLoopbackRule.
	DelLoopbackRule(addr netip.Addr) error

	// AddHooks adds rules to conventional chains like "FORWARD", "INPUT" and
	// "POSTROUTING" to jump from those chains to tailscale chains.
	AddHooks() error

	// DelHooks deletes rules added by AddHooks.
	DelHooks(logf logger.Logf) error

	// AddChains creates custom Tailscale chains.
	AddChains() error

	// DelChains removes chains added by AddChains.
	DelChains() error

	// AddBase adds rules reused by different other rules.
	AddBase(tunname string) error

	// DelBase removes rules added by AddBase.
	DelBase() error

	// AddSNATRule adds the netfilter rule to SNAT incoming traffic over
	// the Tailscale interface destined for local subnets. An error is
	// returned if the rule already exists.
	AddSNATRule() error

	// DelSNATRule removes the rule added by AddSNATRule.
	DelSNATRule() error

	// AddStatefulRule adds a netfilter rule for stateful packet filtering
	// using conntrack.
	AddStatefulRule(tunname string) error

	// DelStatefulRule removes a netfilter rule for stateful packet filtering
	// using conntrack.
	DelStatefulRule(tunname string) error

	// HasIPV6 reports true if the system supports IPv6.
	HasIPV6() bool

	// HasIPV6NAT reports true if the system supports IPv6 NAT.
	HasIPV6NAT() bool

	// HasIPV6Filter reports true if the system supports IPv6 filter tables.
	// This is only meaningful for the iptables implementation, where hosts
	// may have partial iptables support (i.e. a missing filter table). For the
	// nftables implementation, this will default to the value of HasIPV6().
	HasIPV6Filter() bool

	// AddDNATRule adds a rule to the nat/PREROUTING chain to DNAT traffic
	// destined for the given original destination to the given new destination.
	// This is used to forward all traffic destined for the Tailscale interface
	// to the provided destination, as used in the Kubernetes ingress proxies.
	AddDNATRule(origDst, dst netip.Addr) error

	// DNATWithLoadBalancer adds a rule to the nat/PREROUTING chain to DNAT
	// traffic destined for the given original destination to the given new
	// destination(s) using round robin to load balance if more than one
	// destination is provided. This is used to forward all traffic destined
	// for the Tailscale interface to the provided destination(s), as used
	// in the Kubernetes ingress proxies.
	// Note: the nftablesRunner implementation currently forwards all traffic
	// to the first destination only.
	DNATWithLoadBalancer(origDst netip.Addr, dsts []netip.Addr) error

	// EnsureSNATForDst sets up firewall to mask the source for traffic destined for dst to src:
	// - creates a SNAT rule if it doesn't already exist
	// - deletes any pre-existing rules matching the destination
	// This is used to forward traffic destined for the local machine over
	// the Tailscale interface, as used in the Kubernetes egress proxies.
	EnsureSNATForDst(src, dst netip.Addr) error

	// DNATNonTailscaleTraffic adds a rule to the nat/PREROUTING chain to DNAT
	// all traffic inbound from any interface except exemptInterface to dst.
	// This is used to forward traffic destined for the local machine over
	// the Tailscale interface, as used in the Kubernetes egress proxies.
	DNATNonTailscaleTraffic(exemptInterface string, dst netip.Addr) error

	// EnsurePortMapRuleForSvc is not documented in this part of the file.
	// NOTE(review): presumably ensures that a rule exists forwarding the
	// ports described by pm for service svc to targetIP; confirm against
	// the implementations.
	EnsurePortMapRuleForSvc(svc, tun string, targetIP netip.Addr, pm PortMap) error

	// DeletePortMapRuleForSvc is not documented in this part of the file.
	// NOTE(review): presumably removes the rule created by
	// EnsurePortMapRuleForSvc for the same arguments; confirm against the
	// implementations.
	DeletePortMapRuleForSvc(svc, tun string, targetIP netip.Addr, pm PortMap) error

	// DeleteSvc is not documented in this part of the file.
	// NOTE(review): presumably removes all rules for service svc across the
	// given target IPs and port maps; confirm against the implementations.
	DeleteSvc(svc, tun string, targetIPs []netip.Addr, pm []PortMap) error

	// ClampMSSToPMTU adds a rule to the mangle/FORWARD chain to clamp MSS for
	// traffic destined for the provided tun interface.
	// Note: the nftablesRunner implementation places the rule in its own
	// "ts-clamp" chain in the filter table, attached to the forward hook.
	ClampMSSToPMTU(tun string, addr netip.Addr) error

	// AddMagicsockPortRule adds a rule to the ts-input chain to accept
	// incoming traffic on the specified port, to allow magicsock to
	// communicate.
	AddMagicsockPortRule(port uint16, network string) error

	// DelMagicsockPortRule removes the rule created by AddMagicsockPortRule,
	// if it exists.
	DelMagicsockPortRule(port uint16, network string) error
}
- // New creates a NetfilterRunner, auto-detecting whether to use
- // nftables or iptables.
- // As nftables is still experimental, iptables will be used unless
- // either the TS_DEBUG_FIREWALL_MODE environment variable, or the prefHint
- // parameter, is set to one of "nftables" or "auto".
- func New(logf logger.Logf, prefHint string) (NetfilterRunner, error) {
- mode := detectFirewallMode(logf, prefHint)
- switch mode {
- case FirewallModeIPTables:
- // Note that we don't simply return an newIPTablesRunner here because it
- // would return a `nil` iptablesRunner which is different from returning
- // a nil NetfilterRunner.
- ipr, err := newIPTablesRunner(logf)
- if err != nil {
- return nil, err
- }
- return ipr, nil
- case FirewallModeNfTables:
- // Note that we don't simply return an newNfTablesRunner here because it
- // would return a `nil` nftablesRunner which is different from returning
- // a nil NetfilterRunner.
- nfr, err := newNfTablesRunner(logf)
- if err != nil {
- return nil, err
- }
- return nfr, nil
- default:
- return nil, fmt.Errorf("unknown firewall mode %v", mode)
- }
- }
- // newNfTablesRunner creates a new nftablesRunner without guaranteeing
- // the existence of the tables and chains.
- func newNfTablesRunner(logf logger.Logf) (*nftablesRunner, error) {
- conn, err := nftables.New()
- if err != nil {
- return nil, fmt.Errorf("nftables connection: %w", err)
- }
- return newNfTablesRunnerWithConn(logf, conn), nil
- }
- func newNfTablesRunnerWithConn(logf logger.Logf, conn *nftables.Conn) *nftablesRunner {
- nft4 := &nftable{Proto: nftables.TableFamilyIPv4}
- v6err := CheckIPv6(logf)
- if v6err != nil {
- logf("disabling tunneled IPv6 due to system IPv6 config: %v", v6err)
- }
- supportsV6 := v6err == nil
- var nft6 *nftable
- if supportsV6 {
- nft6 = &nftable{Proto: nftables.TableFamilyIPv6}
- }
- logf("netfilter running in nftables mode, v6 = %v", supportsV6)
- // TODO(KevinLiang10): convert iptables rule to nftable rules if they exist in the iptables
- return &nftablesRunner{
- conn: conn,
- nft4: nft4,
- nft6: nft6,
- v6Available: supportsV6,
- }
- }
- // newLoadSaddrExpr creates a new nftables expression that loads the source
- // address of the packet into the given register.
- func newLoadSaddrExpr(proto nftables.TableFamily, destReg uint32) (expr.Any, error) {
- switch proto {
- case nftables.TableFamilyIPv4:
- return &expr.Payload{
- DestRegister: destReg,
- Base: expr.PayloadBaseNetworkHeader,
- Offset: 12,
- Len: 4,
- }, nil
- case nftables.TableFamilyIPv6:
- return &expr.Payload{
- DestRegister: destReg,
- Base: expr.PayloadBaseNetworkHeader,
- Offset: 8,
- Len: 16,
- }, nil
- default:
- return nil, fmt.Errorf("table family %v is neither IPv4 nor IPv6", proto)
- }
- }
- // newLoadDportExpr creates a new nftables express that loads the desination port
- // of a TCP/UDP packet into the given register.
- func newLoadDportExpr(destReg uint32) expr.Any {
- return &expr.Payload{
- DestRegister: destReg,
- Base: expr.PayloadBaseTransportHeader,
- Offset: 2,
- Len: 2,
- }
- }
- // HasIPV6 reports true if the system supports IPv6.
- func (n *nftablesRunner) HasIPV6() bool {
- return n.v6Available
- }
- // HasIPV6NAT returns true if the system supports IPv6.
- // Kernel support for nftables was added after support for IPv6
- // NAT, so no need for a separate IPv6 NAT support check like we do for iptables.
- // https://tldp.org/HOWTO/Linux+IPv6-HOWTO/ch18s04.html
- // https://wiki.nftables.org/wiki-nftables/index.php/Building_and_installing_nftables_from_sources
- func (n *nftablesRunner) HasIPV6NAT() bool {
- return n.v6Available
- }
- // HasIPV6Filter returns true if system supports IPv6. There are no known edge
- // cases where nftables running on a host that supports IPv6 would not support
- // filter table.
- func (n *nftablesRunner) HasIPV6Filter() bool {
- return n.v6Available
- }
- // findRule iterates through the rules to find the rule with matching expressions.
- func findRule(conn *nftables.Conn, rule *nftables.Rule) (*nftables.Rule, error) {
- rules, err := conn.GetRules(rule.Table, rule.Chain)
- if err != nil {
- return nil, fmt.Errorf("get nftables rules: %w", err)
- }
- if len(rules) == 0 {
- return nil, nil
- }
- ruleLoop:
- for _, r := range rules {
- if len(r.Exprs) != len(rule.Exprs) {
- continue
- }
- for i, e := range r.Exprs {
- // Skip counter expressions, as they will not match.
- if _, ok := e.(*expr.Counter); ok {
- continue
- }
- if !reflect.DeepEqual(e, rule.Exprs[i]) {
- continue ruleLoop
- }
- }
- return r, nil
- }
- return nil, nil
- }
- func createLoopbackRule(
- proto nftables.TableFamily,
- table *nftables.Table,
- chain *nftables.Chain,
- addr netip.Addr,
- ) (*nftables.Rule, error) {
- saddrExpr, err := newLoadSaddrExpr(proto, 1)
- if err != nil {
- return nil, fmt.Errorf("newLoadSaddrExpr: %w", err)
- }
- loopBackRule := &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: []expr.Any{
- &expr.Meta{
- Key: expr.MetaKeyIIFNAME,
- Register: 1,
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte("lo"),
- },
- saddrExpr,
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: addr.AsSlice(),
- },
- &expr.Counter{},
- &expr.Verdict{
- Kind: expr.VerdictAccept,
- },
- },
- }
- return loopBackRule, nil
- }
- // insertLoopbackRule inserts the TS loop back rule into
- // the given chain as the first rule if it does not exist.
- func insertLoopbackRule(
- conn *nftables.Conn, proto nftables.TableFamily,
- table *nftables.Table, chain *nftables.Chain, addr netip.Addr) error {
- loopBackRule, err := createLoopbackRule(proto, table, chain, addr)
- if err != nil {
- return fmt.Errorf("create loopback rule: %w", err)
- }
- // If TestDial is set, we are running in test mode and we should not
- // find rule because header will mismatch.
- if conn.TestDial == nil {
- // Check if the rule already exists.
- rule, err := findRule(conn, loopBackRule)
- if err != nil {
- return fmt.Errorf("find rule: %w", err)
- }
- if rule != nil {
- // Rule already exists, no need to insert.
- return nil
- }
- }
- // This inserts the rule to the top of the chain
- _ = conn.InsertRule(loopBackRule)
- if err = conn.Flush(); err != nil {
- return fmt.Errorf("insert rule: %w", err)
- }
- return nil
- }
- // getNFTByAddr returns the nftables with correct IP family
- // that we will be using for the given address.
- func (n *nftablesRunner) getNFTByAddr(addr netip.Addr) (*nftable, error) {
- if addr.Is6() && !n.v6Available {
- return nil, fmt.Errorf("nftables for IPv6 are not available on this host")
- }
- if addr.Is6() {
- return n.nft6, nil
- }
- return n.nft4, nil
- }
- // AddLoopbackRule adds an nftables rule to permit loopback traffic to
- // a local Tailscale IP. This rule is added only if it does not already exist.
- func (n *nftablesRunner) AddLoopbackRule(addr netip.Addr) error {
- nf, err := n.getNFTByAddr(addr)
- if err != nil {
- return fmt.Errorf("error setting up nftables for IP family of %v: %w", addr, err)
- }
- inputChain, err := getChainFromTable(n.conn, nf.Filter, chainNameInput)
- if err != nil {
- return fmt.Errorf("get input chain: %w", err)
- }
- if err := insertLoopbackRule(n.conn, nf.Proto, nf.Filter, inputChain, addr); err != nil {
- return fmt.Errorf("add loopback rule: %w", err)
- }
- return nil
- }
- // DelLoopbackRule removes the nftables rule permitting loopback
- // traffic to a Tailscale IP.
- func (n *nftablesRunner) DelLoopbackRule(addr netip.Addr) error {
- nf, err := n.getNFTByAddr(addr)
- if err != nil {
- return fmt.Errorf("error setting up nftables for IP family of %v: %w", addr, err)
- }
- inputChain, err := getChainFromTable(n.conn, nf.Filter, chainNameInput)
- if err != nil {
- return fmt.Errorf("get input chain: %w", err)
- }
- loopBackRule, err := createLoopbackRule(nf.Proto, nf.Filter, inputChain, addr)
- if err != nil {
- return fmt.Errorf("create loopback rule: %w", err)
- }
- existingLoopBackRule, err := findRule(n.conn, loopBackRule)
- if err != nil {
- return fmt.Errorf("find loop back rule: %w", err)
- }
- if existingLoopBackRule == nil {
- // Rule does not exist, no need to delete.
- return nil
- }
- if err := n.conn.DelRule(existingLoopBackRule); err != nil {
- return fmt.Errorf("delete rule: %w", err)
- }
- return n.conn.Flush()
- }
- // getTables returns tables for IP families that this host was determined to
- // support (either IPv4 and IPv6 or just IPv4).
- func (n *nftablesRunner) getTables() []*nftable {
- if n.HasIPV6() {
- return []*nftable{n.nft4, n.nft6}
- }
- return []*nftable{n.nft4}
- }
- // AddChains creates custom Tailscale chains in netfilter via nftables
- // if the ts-chain doesn't already exist.
- func (n *nftablesRunner) AddChains() error {
- polAccept := nftables.ChainPolicyAccept
- for _, table := range n.getTables() {
- // Create the filter table if it doesn't exist, this table name is the same
- // as the name used by iptables-nft and ufw. We install rules into the
- // same conventional table so that `accept` verdicts from our jump
- // chains are conclusive.
- filter, err := createTableIfNotExist(n.conn, table.Proto, "filter")
- if err != nil {
- return fmt.Errorf("create table: %w", err)
- }
- table.Filter = filter
- // Adding the "conventional chains" that are used by iptables-nft and ufw.
- if err = createChainIfNotExist(n.conn, chainInfo{filter, "FORWARD", nftables.ChainTypeFilter, nftables.ChainHookForward, nftables.ChainPriorityFilter, &polAccept}); err != nil {
- return fmt.Errorf("create forward chain: %w", err)
- }
- if err = createChainIfNotExist(n.conn, chainInfo{filter, "INPUT", nftables.ChainTypeFilter, nftables.ChainHookInput, nftables.ChainPriorityFilter, &polAccept}); err != nil {
- return fmt.Errorf("create input chain: %w", err)
- }
- // Adding the tailscale chains that contain our rules.
- if err = createChainIfNotExist(n.conn, chainInfo{filter, chainNameForward, chainTypeRegular, nil, nil, nil}); err != nil {
- return fmt.Errorf("create forward chain: %w", err)
- }
- if err = createChainIfNotExist(n.conn, chainInfo{filter, chainNameInput, chainTypeRegular, nil, nil, nil}); err != nil {
- return fmt.Errorf("create input chain: %w", err)
- }
- // Create the nat table if it doesn't exist, this table name is the same
- // as the name used by iptables-nft and ufw. We install rules into the
- // same conventional table so that `accept` verdicts from our jump
- // chains are conclusive.
- nat, err := createTableIfNotExist(n.conn, table.Proto, "nat")
- if err != nil {
- return fmt.Errorf("create table: %w", err)
- }
- table.Nat = nat
- // Adding the "conventional chains" that are used by iptables-nft and ufw.
- if err = createChainIfNotExist(n.conn, chainInfo{nat, "POSTROUTING", nftables.ChainTypeNAT, nftables.ChainHookPostrouting, nftables.ChainPriorityNATSource, &polAccept}); err != nil {
- return fmt.Errorf("create postrouting chain: %w", err)
- }
- // Adding the tailscale chain that contains our rules.
- if err = createChainIfNotExist(n.conn, chainInfo{nat, chainNamePostrouting, chainTypeRegular, nil, nil, nil}); err != nil {
- return fmt.Errorf("create postrouting chain: %w", err)
- }
- }
- return n.conn.Flush()
- }
// Names of the throwaway table and chain used to detect whether nftables is
// available. createDummyPostroutingChains creates them and then deletes them
// again: if both steps succeed nftables can be used, otherwise the system is
// assumed not to support nftables.
const (
	tsDummyTableName = "ts-test-nat"
	tsDummyChainName = "ts-test-postrouting"
)
- // createDummyPostroutingChains creates dummy postrouting chains in netfilter
- // via netfilter via nftables, as a last resort measure to detect that nftables
- // can be used. It cleans up the dummy chains after creation.
- func (n *nftablesRunner) createDummyPostroutingChains() (retErr error) {
- polAccept := ptr.To(nftables.ChainPolicyAccept)
- for _, table := range n.getTables() {
- nat, err := createTableIfNotExist(n.conn, table.Proto, tsDummyTableName)
- if err != nil {
- return fmt.Errorf("create nat table: %w", err)
- }
- defer func(fm nftables.TableFamily) {
- if err := deleteTableIfExists(n.conn, fm, tsDummyTableName); err != nil && retErr == nil {
- retErr = fmt.Errorf("delete %q table: %w", tsDummyTableName, err)
- }
- }(table.Proto)
- table.Nat = nat
- if err = createChainIfNotExist(n.conn, chainInfo{nat, tsDummyChainName, nftables.ChainTypeNAT, nftables.ChainHookPostrouting, nftables.ChainPriorityNATSource, polAccept}); err != nil {
- return fmt.Errorf("create %q chain: %w", tsDummyChainName, err)
- }
- if err := deleteChainIfExists(n.conn, nat, tsDummyChainName); err != nil {
- return fmt.Errorf("delete %q chain: %w", tsDummyChainName, err)
- }
- }
- return nil
- }
- // deleteChainIfExists deletes a chain if it exists.
- func deleteChainIfExists(c *nftables.Conn, table *nftables.Table, name string) error {
- chain, err := getChainFromTable(c, table, name)
- if err != nil && !errors.Is(err, errorChainNotFound{table.Name, name}) {
- return fmt.Errorf("get chain: %w", err)
- } else if err != nil {
- // If the chain doesn't exist, we don't need to delete it.
- return nil
- }
- c.FlushChain(chain)
- c.DelChain(chain)
- if err := c.Flush(); err != nil {
- return fmt.Errorf("flush and delete chain: %w", err)
- }
- return nil
- }
- // DelChains removes the custom Tailscale chains from netfilter via nftables.
- func (n *nftablesRunner) DelChains() error {
- for _, table := range n.getTables() {
- if err := deleteChainIfExists(n.conn, table.Filter, chainNameForward); err != nil {
- return fmt.Errorf("delete chain: %w", err)
- }
- if err := deleteChainIfExists(n.conn, table.Filter, chainNameInput); err != nil {
- return fmt.Errorf("delete chain: %w", err)
- }
- }
- if err := deleteChainIfExists(n.conn, n.nft4.Nat, chainNamePostrouting); err != nil {
- return fmt.Errorf("delete chain: %w", err)
- }
- if n.HasIPV6NAT() {
- if err := deleteChainIfExists(n.conn, n.nft6.Nat, chainNamePostrouting); err != nil {
- return fmt.Errorf("delete chain: %w", err)
- }
- }
- if err := n.conn.Flush(); err != nil {
- return fmt.Errorf("flush: %w", err)
- }
- return nil
- }
- // createHookRule creates a rule to jump from a hooked chain to a regular chain.
- func createHookRule(table *nftables.Table, fromChain *nftables.Chain, toChainName string) *nftables.Rule {
- exprs := []expr.Any{
- &expr.Counter{},
- &expr.Verdict{
- Kind: expr.VerdictJump,
- Chain: toChainName,
- },
- }
- rule := &nftables.Rule{
- Table: table,
- Chain: fromChain,
- Exprs: exprs,
- }
- return rule
- }
- // addHookRule adds a rule to jump from a hooked chain to a regular chain at top of the hooked chain.
- func addHookRule(conn *nftables.Conn, table *nftables.Table, fromChain *nftables.Chain, toChainName string) error {
- rule := createHookRule(table, fromChain, toChainName)
- _ = conn.InsertRule(rule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush add rule: %w", err)
- }
- return nil
- }
- // AddHooks is adding rules to conventional chains like "FORWARD", "INPUT" and "POSTROUTING"
- // in tables and jump from those chains to tailscale chains.
- func (n *nftablesRunner) AddHooks() error {
- conn := n.conn
- for _, table := range n.getTables() {
- inputChain, err := getChainFromTable(conn, table.Filter, "INPUT")
- if err != nil {
- return fmt.Errorf("get INPUT chain: %w", err)
- }
- err = addHookRule(conn, table.Filter, inputChain, chainNameInput)
- if err != nil {
- return fmt.Errorf("Addhook: %w", err)
- }
- forwardChain, err := getChainFromTable(conn, table.Filter, "FORWARD")
- if err != nil {
- return fmt.Errorf("get FORWARD chain: %w", err)
- }
- err = addHookRule(conn, table.Filter, forwardChain, chainNameForward)
- if err != nil {
- return fmt.Errorf("Addhook: %w", err)
- }
- postroutingChain, err := getChainFromTable(conn, table.Nat, "POSTROUTING")
- if err != nil {
- return fmt.Errorf("get INPUT chain: %w", err)
- }
- err = addHookRule(conn, table.Nat, postroutingChain, chainNamePostrouting)
- if err != nil {
- return fmt.Errorf("Addhook: %w", err)
- }
- }
- return nil
- }
- // delHookRule deletes a rule that jumps from a hooked chain to a regular chain.
- func delHookRule(conn *nftables.Conn, table *nftables.Table, fromChain *nftables.Chain, toChainName string) error {
- rule := createHookRule(table, fromChain, toChainName)
- existingRule, err := findRule(conn, rule)
- if err != nil {
- return fmt.Errorf("Failed to find hook rule: %w", err)
- }
- if existingRule == nil {
- return nil
- }
- _ = conn.DelRule(existingRule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush del hook rule: %w", err)
- }
- return nil
- }
- // DelHooks is deleting the rules added to conventional chains to jump to tailscale chains.
- func (n *nftablesRunner) DelHooks(logf logger.Logf) error {
- conn := n.conn
- for _, table := range n.getTables() {
- inputChain, err := getChainFromTable(conn, table.Filter, "INPUT")
- if err != nil {
- return fmt.Errorf("get INPUT chain: %w", err)
- }
- err = delHookRule(conn, table.Filter, inputChain, chainNameInput)
- if err != nil {
- return fmt.Errorf("delhook: %w", err)
- }
- forwardChain, err := getChainFromTable(conn, table.Filter, "FORWARD")
- if err != nil {
- return fmt.Errorf("get FORWARD chain: %w", err)
- }
- err = delHookRule(conn, table.Filter, forwardChain, chainNameForward)
- if err != nil {
- return fmt.Errorf("delhook: %w", err)
- }
- postroutingChain, err := getChainFromTable(conn, table.Nat, "POSTROUTING")
- if err != nil {
- return fmt.Errorf("get INPUT chain: %w", err)
- }
- err = delHookRule(conn, table.Nat, postroutingChain, chainNamePostrouting)
- if err != nil {
- return fmt.Errorf("delhook: %w", err)
- }
- }
- return nil
- }
// maskof returns the 4-byte netmask for pfx's prefix length, in big-endian
// byte order.
func maskof(pfx netip.Prefix) []byte {
	// Bits that fall outside the prefix; the mask is their complement.
	hostBits := uint32(0xffff_ffff) >> pfx.Bits()

	var out [4]byte
	binary.BigEndian.PutUint32(out[:], ^hostBits)
	return out[:]
}
- // createRangeRule creates a rule that matches packets with source IP from the give
- // range (like CGNAT range or ChromeOSVM range) and the interface is not the tunname,
- // and makes the given decision. Only IPv4 is supported.
- func createRangeRule(
- table *nftables.Table, chain *nftables.Chain,
- tunname string, rng netip.Prefix, decision expr.VerdictKind,
- ) (*nftables.Rule, error) {
- if rng.Addr().Is6() {
- return nil, errors.New("IPv6 is not supported")
- }
- saddrExpr, err := newLoadSaddrExpr(nftables.TableFamilyIPv4, 1)
- if err != nil {
- return nil, fmt.Errorf("newLoadSaddrExpr: %w", err)
- }
- netip := rng.Addr().AsSlice()
- mask := maskof(rng)
- rule := &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: []expr.Any{
- &expr.Meta{Key: expr.MetaKeyIIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpNeq,
- Register: 1,
- Data: []byte(tunname),
- },
- saddrExpr,
- &expr.Bitwise{
- SourceRegister: 1,
- DestRegister: 1,
- Len: 4,
- Mask: mask,
- Xor: []byte{0x00, 0x00, 0x00, 0x00},
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: netip,
- },
- &expr.Counter{},
- &expr.Verdict{
- Kind: decision,
- },
- },
- }
- return rule, nil
- }
- // addReturnChromeOSVMRangeRule adds a rule to return if the source IP
- // is in the ChromeOS VM range.
- func addReturnChromeOSVMRangeRule(c *nftables.Conn, table *nftables.Table, chain *nftables.Chain, tunname string) error {
- rule, err := createRangeRule(table, chain, tunname, tsaddr.ChromeOSVMRange(), expr.VerdictReturn)
- if err != nil {
- return fmt.Errorf("create rule: %w", err)
- }
- _ = c.AddRule(rule)
- if err = c.Flush(); err != nil {
- return fmt.Errorf("add rule: %w", err)
- }
- return nil
- }
- // addDropCGNATRangeRule adds a rule to drop if the source IP is in the
- // CGNAT range.
- func addDropCGNATRangeRule(c *nftables.Conn, table *nftables.Table, chain *nftables.Chain, tunname string) error {
- rule, err := createRangeRule(table, chain, tunname, tsaddr.CGNATRange(), expr.VerdictDrop)
- if err != nil {
- return fmt.Errorf("create rule: %w", err)
- }
- _ = c.AddRule(rule)
- if err = c.Flush(); err != nil {
- return fmt.Errorf("add rule: %w", err)
- }
- return nil
- }
- // createSetSubnetRouteMarkRule creates a rule to set the subnet route
- // mark if the packet is from the given interface.
- func createSetSubnetRouteMarkRule(table *nftables.Table, chain *nftables.Chain, tunname string) (*nftables.Rule, error) {
- hexTsFwmarkMaskNeg := getTailscaleFwmarkMaskNeg()
- hexTSSubnetRouteMark := getTailscaleSubnetRouteMark()
- rule := &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: []expr.Any{
- &expr.Meta{Key: expr.MetaKeyIIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte(tunname),
- },
- &expr.Counter{},
- &expr.Meta{Key: expr.MetaKeyMARK, Register: 1},
- &expr.Bitwise{
- SourceRegister: 1,
- DestRegister: 1,
- Len: 4,
- Mask: hexTsFwmarkMaskNeg,
- Xor: hexTSSubnetRouteMark,
- },
- &expr.Meta{
- Key: expr.MetaKeyMARK,
- SourceRegister: true,
- Register: 1,
- },
- },
- }
- return rule, nil
- }
- // addSetSubnetRouteMarkRule adds a rule to set the subnet route mark
- // if the packet is from the given interface.
- func addSetSubnetRouteMarkRule(c *nftables.Conn, table *nftables.Table, chain *nftables.Chain, tunname string) error {
- rule, err := createSetSubnetRouteMarkRule(table, chain, tunname)
- if err != nil {
- return fmt.Errorf("create rule: %w", err)
- }
- _ = c.AddRule(rule)
- if err := c.Flush(); err != nil {
- return fmt.Errorf("add rule: %w", err)
- }
- return nil
- }
- // createDropOutgoingPacketFromCGNATRangeRuleWithTunname creates a rule to drop
- // outgoing packets from the CGNAT range.
- func createDropOutgoingPacketFromCGNATRangeRuleWithTunname(table *nftables.Table, chain *nftables.Chain, tunname string) (*nftables.Rule, error) {
- _, ipNet, err := net.ParseCIDR(tsaddr.CGNATRange().String())
- if err != nil {
- return nil, fmt.Errorf("parse cidr: %v", err)
- }
- mask, err := hex.DecodeString(ipNet.Mask.String())
- if err != nil {
- return nil, fmt.Errorf("decode mask: %v", err)
- }
- netip := ipNet.IP.Mask(ipNet.Mask).To4()
- saddrExpr, err := newLoadSaddrExpr(nftables.TableFamilyIPv4, 1)
- if err != nil {
- return nil, fmt.Errorf("newLoadSaddrExpr: %v", err)
- }
- rule := &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: []expr.Any{
- &expr.Meta{Key: expr.MetaKeyOIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte(tunname),
- },
- saddrExpr,
- &expr.Bitwise{
- SourceRegister: 1,
- DestRegister: 1,
- Len: 4,
- Mask: mask,
- Xor: []byte{0x00, 0x00, 0x00, 0x00},
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: netip,
- },
- &expr.Counter{},
- &expr.Verdict{
- Kind: expr.VerdictDrop,
- },
- },
- }
- return rule, nil
- }
- // addDropOutgoingPacketFromCGNATRangeRuleWithTunname adds a rule to drop
- // outgoing packets from the CGNAT range.
- func addDropOutgoingPacketFromCGNATRangeRuleWithTunname(conn *nftables.Conn, table *nftables.Table, chain *nftables.Chain, tunname string) error {
- rule, err := createDropOutgoingPacketFromCGNATRangeRuleWithTunname(table, chain, tunname)
- if err != nil {
- return fmt.Errorf("create rule: %w", err)
- }
- _ = conn.AddRule(rule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("add rule: %w", err)
- }
- return nil
- }
- // createAcceptOutgoingPacketRule creates a rule to accept outgoing packets
- // from the given interface.
- func createAcceptOutgoingPacketRule(table *nftables.Table, chain *nftables.Chain, tunname string) *nftables.Rule {
- return &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: []expr.Any{
- &expr.Meta{Key: expr.MetaKeyOIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte(tunname),
- },
- &expr.Counter{},
- &expr.Verdict{
- Kind: expr.VerdictAccept,
- },
- },
- }
- }
- // addAcceptOutgoingPacketRule adds a rule to accept outgoing packets
- // from the given interface.
- func addAcceptOutgoingPacketRule(conn *nftables.Conn, table *nftables.Table, chain *nftables.Chain, tunname string) error {
- rule := createAcceptOutgoingPacketRule(table, chain, tunname)
- _ = conn.AddRule(rule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush add rule: %w", err)
- }
- return nil
- }
- // createAcceptOnPortRule creates a rule to accept incoming packets to
- // a given destination UDP port.
- func createAcceptOnPortRule(table *nftables.Table, chain *nftables.Chain, port uint16) *nftables.Rule {
- portBytes := make([]byte, 2)
- binary.BigEndian.PutUint16(portBytes, port)
- return &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: []expr.Any{
- &expr.Meta{
- Key: expr.MetaKeyL4PROTO,
- Register: 1,
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte{unix.IPPROTO_UDP},
- },
- newLoadDportExpr(1),
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: portBytes,
- },
- &expr.Counter{},
- &expr.Verdict{
- Kind: expr.VerdictAccept,
- },
- },
- }
- }
- // addAcceptOnPortRule adds a rule to accept incoming packets to
- // a given destination UDP port.
- func addAcceptOnPortRule(conn *nftables.Conn, table *nftables.Table, chain *nftables.Chain, port uint16) error {
- rule := createAcceptOnPortRule(table, chain, port)
- _ = conn.AddRule(rule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush add rule: %w", err)
- }
- return nil
- }
- // addAcceptOnPortRule removes a rule to accept incoming packets to
- // a given destination UDP port.
- func removeAcceptOnPortRule(conn *nftables.Conn, table *nftables.Table, chain *nftables.Chain, port uint16) error {
- rule := createAcceptOnPortRule(table, chain, port)
- rule, err := findRule(conn, rule)
- if err != nil {
- return fmt.Errorf("find rule: %v", err)
- }
- _ = conn.DelRule(rule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush del rule: %w", err)
- }
- return nil
- }
- // AddMagicsockPortRule adds a rule to nftables to allow incoming traffic on
- // the specified UDP port, so magicsock can accept incoming connections.
- // network must be either "udp4" or "udp6" - this determines whether the rule
- // is added for IPv4 or IPv6.
- func (n *nftablesRunner) AddMagicsockPortRule(port uint16, network string) error {
- var filterTable *nftables.Table
- switch network {
- case "udp4":
- filterTable = n.nft4.Filter
- case "udp6":
- filterTable = n.nft6.Filter
- default:
- return fmt.Errorf("unsupported network %s", network)
- }
- inputChain, err := getChainFromTable(n.conn, filterTable, chainNameInput)
- if err != nil {
- return fmt.Errorf("get input chain: %v", err)
- }
- err = addAcceptOnPortRule(n.conn, filterTable, inputChain, port)
- if err != nil {
- return fmt.Errorf("add accept on port rule: %v", err)
- }
- return nil
- }
- // DelMagicsockPortRule removes a rule added by AddMagicsockPortRule to accept
- // incoming traffic on a particular UDP port.
- // network must be either "udp4" or "udp6" - this determines whether the rule
- // is removed for IPv4 or IPv6.
- func (n *nftablesRunner) DelMagicsockPortRule(port uint16, network string) error {
- var filterTable *nftables.Table
- switch network {
- case "udp4":
- filterTable = n.nft4.Filter
- case "udp6":
- filterTable = n.nft6.Filter
- default:
- return fmt.Errorf("unsupported network %s", network)
- }
- inputChain, err := getChainFromTable(n.conn, filterTable, chainNameInput)
- if err != nil {
- return fmt.Errorf("get input chain: %v", err)
- }
- err = removeAcceptOnPortRule(n.conn, filterTable, inputChain, port)
- if err != nil {
- return fmt.Errorf("add accept on port rule: %v", err)
- }
- return nil
- }
- // createAcceptIncomingPacketRule creates a rule to accept incoming packets to
- // the given interface.
- func createAcceptIncomingPacketRule(table *nftables.Table, chain *nftables.Chain, tunname string) *nftables.Rule {
- return &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: []expr.Any{
- &expr.Meta{Key: expr.MetaKeyIIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte(tunname),
- },
- &expr.Counter{},
- &expr.Verdict{
- Kind: expr.VerdictAccept,
- },
- },
- }
- }
- func addAcceptIncomingPacketRule(conn *nftables.Conn, table *nftables.Table, chain *nftables.Chain, tunname string) error {
- rule := createAcceptIncomingPacketRule(table, chain, tunname)
- _ = conn.AddRule(rule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush add rule: %w", err)
- }
- return nil
- }
- // AddBase adds some basic processing rules.
- func (n *nftablesRunner) AddBase(tunname string) error {
- if err := n.addBase4(tunname); err != nil {
- return fmt.Errorf("add base v4: %w", err)
- }
- if n.HasIPV6() {
- if err := n.addBase6(tunname); err != nil {
- return fmt.Errorf("add base v6: %w", err)
- }
- }
- return nil
- }
- // addBase4 adds some basic IPv4 processing rules.
- func (n *nftablesRunner) addBase4(tunname string) error {
- conn := n.conn
- inputChain, err := getChainFromTable(conn, n.nft4.Filter, chainNameInput)
- if err != nil {
- return fmt.Errorf("get input chain v4: %v", err)
- }
- if err = addReturnChromeOSVMRangeRule(conn, n.nft4.Filter, inputChain, tunname); err != nil {
- return fmt.Errorf("add return chromeos vm range rule v4: %w", err)
- }
- if err = addDropCGNATRangeRule(conn, n.nft4.Filter, inputChain, tunname); err != nil {
- return fmt.Errorf("add drop cgnat range rule v4: %w", err)
- }
- if err = addAcceptIncomingPacketRule(conn, n.nft4.Filter, inputChain, tunname); err != nil {
- return fmt.Errorf("add accept incoming packet rule v4: %w", err)
- }
- forwardChain, err := getChainFromTable(conn, n.nft4.Filter, chainNameForward)
- if err != nil {
- return fmt.Errorf("get forward chain v4: %v", err)
- }
- if err = addSetSubnetRouteMarkRule(conn, n.nft4.Filter, forwardChain, tunname); err != nil {
- return fmt.Errorf("add set subnet route mark rule v4: %w", err)
- }
- if err = addMatchSubnetRouteMarkRule(conn, n.nft4.Filter, forwardChain, Accept); err != nil {
- return fmt.Errorf("add match subnet route mark rule v4: %w", err)
- }
- if err = addDropOutgoingPacketFromCGNATRangeRuleWithTunname(conn, n.nft4.Filter, forwardChain, tunname); err != nil {
- return fmt.Errorf("add drop outgoing packet from cgnat range rule v4: %w", err)
- }
- if err = addAcceptOutgoingPacketRule(conn, n.nft4.Filter, forwardChain, tunname); err != nil {
- return fmt.Errorf("add accept outgoing packet rule v4: %w", err)
- }
- if err = conn.Flush(); err != nil {
- return fmt.Errorf("flush base v4: %w", err)
- }
- return nil
- }
- // addBase6 adds some basic IPv6 processing rules.
- func (n *nftablesRunner) addBase6(tunname string) error {
- conn := n.conn
- inputChain, err := getChainFromTable(conn, n.nft6.Filter, chainNameInput)
- if err != nil {
- return fmt.Errorf("get input chain v4: %v", err)
- }
- if err = addAcceptIncomingPacketRule(conn, n.nft6.Filter, inputChain, tunname); err != nil {
- return fmt.Errorf("add accept incoming packet rule v6: %w", err)
- }
- forwardChain, err := getChainFromTable(conn, n.nft6.Filter, chainNameForward)
- if err != nil {
- return fmt.Errorf("get forward chain v6: %w", err)
- }
- if err = addSetSubnetRouteMarkRule(conn, n.nft6.Filter, forwardChain, tunname); err != nil {
- return fmt.Errorf("add set subnet route mark rule v6: %w", err)
- }
- if err = addMatchSubnetRouteMarkRule(conn, n.nft6.Filter, forwardChain, Accept); err != nil {
- return fmt.Errorf("add match subnet route mark rule v6: %w", err)
- }
- if err = addAcceptOutgoingPacketRule(conn, n.nft6.Filter, forwardChain, tunname); err != nil {
- return fmt.Errorf("add accept outgoing packet rule v6: %w", err)
- }
- if err = conn.Flush(); err != nil {
- return fmt.Errorf("flush base v6: %w", err)
- }
- return nil
- }
- // DelBase empties, but does not remove, custom Tailscale chains from
- // netfilter via iptables.
- func (n *nftablesRunner) DelBase() error {
- conn := n.conn
- for _, table := range n.getTables() {
- inputChain, err := getChainFromTable(conn, table.Filter, chainNameInput)
- if err != nil {
- return fmt.Errorf("get input chain: %v", err)
- }
- conn.FlushChain(inputChain)
- forwardChain, err := getChainFromTable(conn, table.Filter, chainNameForward)
- if err != nil {
- return fmt.Errorf("get forward chain: %v", err)
- }
- conn.FlushChain(forwardChain)
- postrouteChain, err := getChainFromTable(conn, table.Nat, chainNamePostrouting)
- if err != nil {
- return fmt.Errorf("get postrouting chain v4: %v", err)
- }
- conn.FlushChain(postrouteChain)
- }
- return conn.Flush()
- }
- // createMatchSubnetRouteMarkRule creates a rule that matches packets
- // with the subnet route mark and takes the specified action.
- func createMatchSubnetRouteMarkRule(table *nftables.Table, chain *nftables.Chain, action MatchDecision) (*nftables.Rule, error) {
- hexTSFwmarkMask := getTailscaleFwmarkMask()
- hexTSSubnetRouteMark := getTailscaleSubnetRouteMark()
- var endAction expr.Any
- endAction = &expr.Verdict{Kind: expr.VerdictAccept}
- if action == Masq {
- endAction = &expr.Masq{}
- }
- exprs := []expr.Any{
- &expr.Meta{Key: expr.MetaKeyMARK, Register: 1},
- &expr.Bitwise{
- SourceRegister: 1,
- DestRegister: 1,
- Len: 4,
- Mask: hexTSFwmarkMask,
- Xor: []byte{0x00, 0x00, 0x00, 0x00},
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: hexTSSubnetRouteMark,
- },
- &expr.Counter{},
- endAction,
- }
- rule := &nftables.Rule{
- Table: table,
- Chain: chain,
- Exprs: exprs,
- }
- return rule, nil
- }
- // addMatchSubnetRouteMarkRule adds a rule that matches packets with
- // the subnet route mark and takes the specified action.
- func addMatchSubnetRouteMarkRule(conn *nftables.Conn, table *nftables.Table, chain *nftables.Chain, action MatchDecision) error {
- rule, err := createMatchSubnetRouteMarkRule(table, chain, action)
- if err != nil {
- return fmt.Errorf("create match subnet route mark rule: %w", err)
- }
- _ = conn.AddRule(rule)
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush add rule: %w", err)
- }
- return nil
- }
- // AddSNATRule adds a netfilter rule to SNAT traffic destined for
- // local subnets.
- func (n *nftablesRunner) AddSNATRule() error {
- conn := n.conn
- for _, table := range n.getTables() {
- chain, err := getChainFromTable(conn, table.Nat, chainNamePostrouting)
- if err != nil {
- return fmt.Errorf("get postrouting chain v4: %w", err)
- }
- if err = addMatchSubnetRouteMarkRule(conn, table.Nat, chain, Masq); err != nil {
- return fmt.Errorf("add match subnet route mark rule v4: %w", err)
- }
- }
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush add SNAT rule: %w", err)
- }
- return nil
- }
- // DelSNATRule removes the netfilter rule to SNAT traffic destined for
- // local subnets. An error is returned if the rule does not exist.
- func (n *nftablesRunner) DelSNATRule() error {
- conn := n.conn
- hexTSFwmarkMask := getTailscaleFwmarkMask()
- hexTSSubnetRouteMark := getTailscaleSubnetRouteMark()
- exprs := []expr.Any{
- &expr.Meta{Key: expr.MetaKeyMARK, Register: 1},
- &expr.Bitwise{
- SourceRegister: 1,
- DestRegister: 1,
- Len: 4,
- Mask: hexTSFwmarkMask,
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: hexTSSubnetRouteMark,
- },
- &expr.Counter{},
- &expr.Masq{},
- }
- for _, table := range n.getTables() {
- chain, err := getChainFromTable(conn, table.Nat, chainNamePostrouting)
- if err != nil {
- return fmt.Errorf("get postrouting chain v4: %w", err)
- }
- rule := &nftables.Rule{
- Table: table.Nat,
- Chain: chain,
- Exprs: exprs,
- }
- SNATRule, err := findRule(conn, rule)
- if err != nil {
- return fmt.Errorf("find SNAT rule v4: %w", err)
- }
- if SNATRule != nil {
- _ = conn.DelRule(SNATRule)
- }
- }
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush del SNAT rule: %w", err)
- }
- return nil
- }
// nativeUint32 encodes v as 4 bytes in the host's native byte order.
func nativeUint32(v uint32) []byte {
	return binary.NativeEndian.AppendUint32(make([]byte, 0, 4), v)
}
- func makeStatefulRuleExprs(tunname string) []expr.Any {
- return []expr.Any{
- // Check if the output interface is the Tailscale interface by
- // first loading the OIFNAME into register 1 and comparing it
- // against our tunname.
- //
- // 'cmp' implicitly breaks from a rule if a comparison fails,
- // so if we continue past this rule we know that the packet is
- // going to our TUN.
- &expr.Meta{Key: expr.MetaKeyOIFNAME, Register: 1},
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: []byte(tunname),
- },
- // Store the conntrack state in register 1
- &expr.Ct{
- Register: 1,
- Key: expr.CtKeySTATE,
- },
- // Mask the state in register 1 to "hide" the ESTABLISHED and
- // RELATED bits (which are expected and fine); if there are any
- // other bits, we want them to remain.
- //
- // This operation is, in the kernel:
- // dst[i] = (src[i] & mask[i]) ^ xor[i]
- //
- // So, we can mask by setting the inverse of the bits we want
- // to remove; i.e. ESTABLISHED = 0b00000010, RELATED =
- // 0b00000100, so, if we assume an 8-bit state (in reality,
- // it's 32-bit), we can mask with 0b11111001 to clear those
- // bits and keep everything else (e.g. the INVALID bit which is
- // 0b00000001).
- //
- // TODO(andrew-d): for now, let's also allow
- // CtStateBitUNTRACKED, which is a state for packets that are not
- // tracked (marked so explicitly with an iptables rule using
- // --notrack); we should figure out if we want to allow this or not.
- &expr.Bitwise{
- SourceRegister: 1,
- DestRegister: 1,
- Len: 4,
- Mask: nativeUint32(^(0 |
- expr.CtStateBitESTABLISHED |
- expr.CtStateBitRELATED |
- expr.CtStateBitUNTRACKED)),
- // Xor is unused but must be specified
- Xor: nativeUint32(0),
- },
- // Compare against the expected state (0, i.e. no bits set
- // other than maybe ESTABLISHED and RELATED). We want this
- // comparison to fail if there are no bits set, so that this
- // rule's evaluation stops and we don't fall through to the
- // "Drop" verdict.
- //
- // For example, if the state is ESTABLISHED (and we want to
- // break from this rule/accept this packet):
- // state = ESTABLISHED
- // register1 = 0b0 (since the bitwise operation cleared the ESTABLISHED bit)
- //
- // compare register1 (0b0) != 0: false
- // -> comparison implicitly breaks
- // -> continue to the next rule
- //
- // For example, if the state is NEW (and we want to continue to
- // the next expression and thus drop this packet):
- // state = NEW
- // register1 = 0b1000
- //
- // compare register1 (0b1000) != 0: true
- // -> comparison continues to next expr
- &expr.Cmp{
- Op: expr.CmpOpNeq,
- Register: 1,
- Data: []byte{0, 0, 0, 0},
- },
- // If we get here, we know that this packet is going to our TUN
- // device, and has a conntrack state set other than ESTABLISHED
- // or RELATED. We thus count and drop the packet.
- &expr.Counter{},
- &expr.Verdict{Kind: expr.VerdictDrop},
- }
- // TODO(andrew-d): iptables-nft writes a rule that dumps as:
- //
- // match name conntrack rev 3
- //
- // I think this is using expr.Match against the following struct
- // (xt_conntrack_mtinfo3):
- //
- // https://github.com/torvalds/linux/blob/master/include/uapi/linux/netfilter/xt_conntrack.h#L64-L77
- //
- // We could probably do something similar here, but I'm not sure if
- // there's any advantage. Below is an example Match statement if we
- // decide to do that, based on dumping the rule that iptables-nft
- // generates:
- //
- // _ = expr.Match{
- // Name: "conntrack",
- // Rev: 3,
- // Info: &xt.ConntrackMtinfo3{
- // ConntrackMtinfo2: xt.ConntrackMtinfo2{
- // ConntrackMtinfoBase: xt.ConntrackMtinfoBase{
- // MatchFlags: xt.ConntrackState,
- // InvertFlags: xt.ConntrackState,
- // },
- // // Mask the state to remove ESTABLISHED and
- // // RELATED before comparing.
- // StateMask: expr.CtStateBitESTABLISHED | expr.CtStateBitRELATED,
- // },
- // },
- // }
- }
- // AddStatefulRule adds a netfilter rule for stateful packet filtering using
- // conntrack.
- func (n *nftablesRunner) AddStatefulRule(tunname string) error {
- conn := n.conn
- exprs := makeStatefulRuleExprs(tunname)
- for _, table := range n.getTables() {
- chain, err := getChainFromTable(conn, table.Filter, chainNameForward)
- if err != nil {
- return fmt.Errorf("get forward chain: %w", err)
- }
- // First, find the 'accept' rule that we want to insert our rule before.
- acceptRule := createAcceptOutgoingPacketRule(table.Filter, chain, tunname)
- rule, err := findRule(conn, acceptRule)
- if err != nil {
- return fmt.Errorf("find accept rule: %w", err)
- }
- conn.InsertRule(&nftables.Rule{
- Table: table.Filter,
- Chain: chain,
- Exprs: exprs,
- // Specifying Position in an Insert operation means to
- // insert this rule before the specified rule.
- Position: rule.Handle,
- })
- }
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush add stateful rule: %w", err)
- }
- return nil
- }
- // DelStatefulRule removes the netfilter rule for stateful packet filtering
- // using conntrack.
- func (n *nftablesRunner) DelStatefulRule(tunname string) error {
- conn := n.conn
- exprs := makeStatefulRuleExprs(tunname)
- for _, table := range n.getTables() {
- chain, err := getChainFromTable(conn, table.Filter, chainNameForward)
- if err != nil {
- return fmt.Errorf("get forward chain: %w", err)
- }
- rule, err := findRule(conn, &nftables.Rule{
- Table: table.Filter,
- Chain: chain,
- Exprs: exprs,
- })
- if err != nil {
- return fmt.Errorf("find stateful rule: %w", err)
- }
- if rule != nil {
- conn.DelRule(rule)
- }
- }
- if err := conn.Flush(); err != nil {
- return fmt.Errorf("flush del stateful rule: %w", err)
- }
- return nil
- }
- // cleanupChain removes a jump rule from hookChainName to tsChainName, and then
- // the entire chain tsChainName. Errors are logged, but attempts to remove both
- // the jump rule and chain continue even if one errors.
- func cleanupChain(logf logger.Logf, conn *nftables.Conn, table *nftables.Table, hookChainName, tsChainName string) {
- // remove the jump first, before removing the jump destination.
- defaultChain, err := getChainFromTable(conn, table, hookChainName)
- if err != nil && !errors.Is(err, errorChainNotFound{table.Name, hookChainName}) {
- logf("cleanup: did not find default chain: %s", err)
- }
- if !errors.Is(err, errorChainNotFound{table.Name, hookChainName}) {
- // delete hook in convention chain
- _ = delHookRule(conn, table, defaultChain, tsChainName)
- }
- tsChain, err := getChainFromTable(conn, table, tsChainName)
- if err != nil && !errors.Is(err, errorChainNotFound{table.Name, tsChainName}) {
- logf("cleanup: did not find ts-chain: %s", err)
- }
- if tsChain != nil {
- // flush and delete ts-chain
- conn.FlushChain(tsChain)
- conn.DelChain(tsChain)
- err = conn.Flush()
- logf("cleanup: delete and flush chain %s: %s", tsChainName, err)
- }
- }
- // NfTablesCleanUp removes all Tailscale added nftables rules.
- // Any errors that occur are logged to the provided logf.
- func NfTablesCleanUp(logf logger.Logf) {
- conn, err := nftables.New()
- if err != nil {
- logf("cleanup: nftables connection: %s", err)
- }
- tables, err := conn.ListTables() // both v4 and v6
- if err != nil {
- logf("cleanup: list tables: %s", err)
- }
- for _, table := range tables {
- // These table names were used briefly in 1.48.0.
- if table.Name == "ts-filter" || table.Name == "ts-nat" {
- conn.DelTable(table)
- if err := conn.Flush(); err != nil {
- logf("cleanup: flush delete table %s: %s", table.Name, err)
- }
- }
- if table.Name == "filter" {
- cleanupChain(logf, conn, table, "INPUT", chainNameInput)
- cleanupChain(logf, conn, table, "FORWARD", chainNameForward)
- }
- if table.Name == "nat" {
- cleanupChain(logf, conn, table, "POSTROUTING", chainNamePostrouting)
- }
- }
- }
- func snatRule(t *nftables.Table, ch *nftables.Chain, src, dst netip.Addr, meta []byte) *nftables.Rule {
- var daddrOffset, fam, daddrLen uint32
- if dst.Is4() {
- daddrOffset = 16
- daddrLen = 4
- fam = unix.NFPROTO_IPV4
- } else {
- daddrOffset = 24
- daddrLen = 16
- fam = unix.NFPROTO_IPV6
- }
- return &nftables.Rule{
- Table: t,
- Chain: ch,
- Exprs: []expr.Any{
- &expr.Payload{
- DestRegister: 1,
- Base: expr.PayloadBaseNetworkHeader,
- Offset: daddrOffset,
- Len: daddrLen,
- },
- &expr.Cmp{
- Op: expr.CmpOpEq,
- Register: 1,
- Data: dst.AsSlice(),
- },
- &expr.Immediate{
- Register: 1,
- Data: src.AsSlice(),
- },
- &expr.NAT{
- Type: expr.NATTypeSourceNAT,
- Family: fam,
- RegAddrMin: 1,
- RegAddrMax: 1,
- },
- },
- UserData: meta,
- }
- }
|