cregit-Linux how code gets into the kernel

Release 4.14 net/sched/cls_api.c

Directory: net/sched
/*
 * net/sched/cls_api.c  Packet classifier API.
 *
 *              This program is free software; you can redistribute it and/or
 *              modify it under the terms of the GNU General Public License
 *              as published by the Free Software Foundation; either version
 *              2 of the License, or (at your option) any later version.
 *
 * Authors:     Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 * Changes:
 *
 * Eduardo J. Blanco <ejbs@netlabs.com.uy> :990222: kmod support
 *
 */

#include <linux/module.h>
#include <linux/types.h>
#include <linux/kernel.h>
#include <linux/string.h>
#include <linux/errno.h>
#include <linux/err.h>
#include <linux/skbuff.h>
#include <linux/init.h>
#include <linux/kmod.h>
#include <linux/err.h>
#include <linux/slab.h>
#include <net/net_namespace.h>
#include <net/sock.h>
#include <net/netlink.h>
#include <net/pkt_sched.h>
#include <net/pkt_cls.h>

/* The list of all installed classifier types.
 * Entries are appended by register_tcf_proto_ops() and removed by
 * unregister_tcf_proto_ops().
 */
static LIST_HEAD(tcf_proto_base);

/* Protects list of registered TC modules. It is pure SMP lock.
 * Taken for reading while looking a type up by name and for writing
 * while registering or unregistering a type.
 */
static DEFINE_RWLOCK(cls_mod_lock);

/* Find classifier type by string name */


/*
 * Look up a registered classifier type by name.
 *
 * Returns the matching ops with a reference taken on its owning module,
 * or NULL when @kind is NULL, no type with that name is registered, or
 * the module reference could not be obtained.
 */
static const struct tcf_proto_ops *tcf_proto_lookup_ops(const char *kind)
{
	const struct tcf_proto_ops *found = NULL;
	const struct tcf_proto_ops *ops;

	if (!kind)
		return NULL;

	read_lock(&cls_mod_lock);
	list_for_each_entry(ops, &tcf_proto_base, head) {
		if (strcmp(kind, ops->kind) != 0)
			continue;

		/* The first name match ends the search, even if the
		 * module reference cannot be taken.
		 */
		if (try_module_get(ops->owner))
			found = ops;
		break;
	}
	read_unlock(&cls_mod_lock);

	return found;
}

Contributors

PersonTokensPropCommitsCommitProp
Linus Torvalds (pre-git)5261.18%225.00%
Patrick McHardy1315.29%112.50%
Eric Dumazet89.41%225.00%
Américo Wang89.41%112.50%
Jiri Pirko33.53%112.50%
Chris Wright11.18%112.50%
Total85100.00%8100.00%

/* Register/unregister a classifier type */
int register_tcf_proto_ops(struct tcf_proto_ops *ops) { struct tcf_proto_ops *t; int rc = -EEXIST; write_lock(&cls_mod_lock); list_for_each_entry(t, &tcf_proto_base, head) if (!strcmp(ops->kind, t->kind)) goto out; list_add_tail(&ops->head, &tcf_proto_base); rc = 0; out: write_unlock(&cls_mod_lock); return rc; }

Contributors

PersonTokensPropCommitsCommitProp
Linus Torvalds (pre-git)4557.69%250.00%
Arnaldo Carvalho de Melo1721.79%125.00%
Américo Wang1620.51%125.00%
Total78100.00%4100.00%

EXPORT_SYMBOL(register_tcf_proto_ops);

/* Workqueue that tcf_queue_work() queues onto; flushed on unregister. */
static struct workqueue_struct *tc_filter_wq;

/*
 * Remove @ops from the list of installed classifier types.
 *
 * Returns 0 when @ops was found and unlinked, -ENOENT otherwise.
 */
int unregister_tcf_proto_ops(struct tcf_proto_ops *ops)
{
	struct tcf_proto_ops *cur;
	int rc = -ENOENT;

	/* Wait for outstanding call_rcu()s, if any, from a
	 * tcf_proto_ops's destroy() handler.
	 */
	rcu_barrier();
	flush_workqueue(tc_filter_wq);

	write_lock(&cls_mod_lock);
	list_for_each_entry(cur, &tcf_proto_base, head) {
		if (cur != ops)
			continue;

		list_del(&cur->head);
		rc = 0;
		break;
	}
	write_unlock(&cls_mod_lock);

	return rc;
}

Contributors

PersonTokensPropCommitsCommitProp
Linus Torvalds (pre-git)3850.00%228.57%
Américo Wang1823.68%228.57%
Arnaldo Carvalho de Melo1114.47%114.29%
Eric Dumazet56.58%114.29%
Daniel Borkmann45.26%114.29%
Total76100.00%7100.00%

EXPORT_SYMBOL(unregister_tcf_proto_ops);

/*
 * Queue @work on the tc filter workqueue.
 *
 * Returns whatever queue_work() reports for the submission.
 */
bool tcf_queue_work(struct work_struct *work)
{
	bool queued = queue_work(tc_filter_wq, work);

	return queued;
}

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang18100.00%1100.00%
Total18100.00%1100.00%

EXPORT_SYMBOL(tcf_queue_work);

/* Select new prio value from the range, managed by kernel.
 *
 * With a filter @tp the candidate is one below @tp's prio; without one
 * it starts from 0xC0000000.  Only the major part of the candidate is
 * returned.
 */
static inline u32 tcf_auto_prio(struct tcf_proto *tp)
{
	u32 first;

	if (tp)
		first = tp->prio - 1;
	else
		first = TC_H_MAKE(0xC0000000U, 0U);

	return TC_H_MAJ(first);
}

Contributors

PersonTokensPropCommitsCommitProp
Linus Torvalds (pre-git)3690.00%133.33%
Jiri Pirko37.50%133.33%
Stephen Hemminger12.50%133.33%
Total40100.00%3100.00%


/*
 * Allocate a classifier instance of type @kind and initialise it.
 *
 * @kind:     name of the classifier type to instantiate
 * @protocol: protocol stored in the new instance
 * @prio:     priority stored in the new instance
 * @parent:   stored as the instance's classid
 * @q:        qdisc the instance is attached to
 * @chain:    chain the instance belongs to
 *
 * Returns the new instance, or an ERR_PTR():
 *   -ENOBUFS  allocation failed
 *   -ENOENT   no classifier type named @kind is available
 *   -EAGAIN   the type was only found after a module load during which
 *             RTNL was dropped; the caller has to replay the request
 *   other     error returned by the type's init() handler
 */
static struct tcf_proto *tcf_proto_create(const char *kind, u32 protocol,
					  u32 prio, u32 parent, struct Qdisc *q,
					  struct tcf_chain *chain)
{
	struct tcf_proto *tp;
	int err;

	tp = kzalloc(sizeof(*tp), GFP_KERNEL);
	if (!tp)
		return ERR_PTR(-ENOBUFS);

	err = -ENOENT;
	tp->ops = tcf_proto_lookup_ops(kind);
	if (!tp->ops) {
#ifdef CONFIG_MODULES
		rtnl_unlock();
		request_module("cls_%s", kind);
		rtnl_lock();
		tp->ops = tcf_proto_lookup_ops(kind);
		/* We dropped the RTNL semaphore in order to perform
		 * the module load. So, even if we succeeded in loading
		 * the module we have to replay the request. We indicate
		 * this using -EAGAIN.
		 */
		if (tp->ops) {
			module_put(tp->ops->owner);
			err = -EAGAIN;
		} else {
			err = -ENOENT;
		}
#endif
		/* Must bail out even without module support: tp->ops is
		 * NULL here and would be dereferenced below.
		 */
		goto errout;
	}

	tp->classify = tp->ops->classify;
	tp->protocol = protocol;
	tp->prio = prio;
	tp->classid = parent;
	tp->q = q;
	tp->chain = chain;

	err = tp->ops->init(tp);
	if (err) {
		/* Drop the module reference taken by the lookup. */
		module_put(tp->ops->owner);
		goto errout;
	}
	return tp;

errout:
	kfree(tp);
	return ERR_PTR(err);
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko234100.00%3100.00%
Total234100.00%3100.00%


static void tcf_proto_destroy(struct tcf_proto *tp) { tp->ops->destroy(tp); module_put(tp->ops->owner); kfree_rcu(tp, rcu); }

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko3494.44%150.00%
Américo Wang25.56%150.00%
Total36100.00%2100.00%


/*
 * Allocate a chain with index @chain_index, link it at the tail of
 * @block's chain list and give it an initial reference count of 1.
 *
 * Returns the new chain, or NULL when the allocation fails.
 */
static struct tcf_chain *tcf_chain_create(struct tcf_block *block,
					  u32 chain_index)
{
	struct tcf_chain *chain = kzalloc(sizeof(*chain), GFP_KERNEL);

	if (chain) {
		list_add_tail(&chain->list, &block->chain_list);
		chain->block = block;
		chain->index = chain_index;
		chain->refcnt = 1;
	}

	return chain;
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko7598.68%266.67%
Américo Wang11.32%133.33%
Total76100.00%3100.00%


/*
 * Remove and destroy every filter on @chain.
 *
 * The externally visible head pointer (if one is set) is cleared first.
 * Each filter is then unlinked and destroyed, and one chain reference is
 * dropped per filter.
 *
 * Dropping a reference may free @chain (tcf_chain_put() destroys it when
 * the count reaches zero), so the next filter is fetched and the current
 * one destroyed *before* the reference is dropped; @chain is never
 * touched after the put that may have released it.
 */
static void tcf_chain_flush(struct tcf_chain *chain)
{
	struct tcf_proto *tp;

	if (chain->p_filter_chain)
		RCU_INIT_POINTER(*chain->p_filter_chain, NULL);

	tp = rtnl_dereference(chain->filter_chain);
	while (tp) {
		RCU_INIT_POINTER(chain->filter_chain, tp->next);
		tcf_proto_destroy(tp);
		/* Read the successor while the chain is still held. */
		tp = rtnl_dereference(chain->filter_chain);
		tcf_chain_put(chain);
	}
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko6592.86%583.33%
Américo Wang57.14%116.67%
Total70100.00%6100.00%


/* Unlink @chain from the list it is on and free it. */
static void tcf_chain_destroy(struct tcf_chain *chain)
{
	struct list_head *node = &chain->list;

	list_del(node);
	kfree(chain);
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko2083.33%150.00%
Américo Wang416.67%150.00%
Total24100.00%2100.00%


/* Take one additional reference on @chain. */
static void tcf_chain_hold(struct tcf_chain *chain)
{
	chain->refcnt += 1;
}

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang1168.75%133.33%
Jiri Pirko531.25%266.67%
Total16100.00%3100.00%


/*
 * Find the chain with index @chain_index on @block and take a reference
 * on it.  When no such chain exists, a new one is created if @create is
 * true; otherwise NULL is returned.  NULL is also returned when creation
 * fails.
 */
struct tcf_chain *tcf_chain_get(struct tcf_block *block, u32 chain_index,
				bool create)
{
	struct tcf_chain *chain;

	list_for_each_entry(chain, &block->chain_list, list) {
		if (chain->index != chain_index)
			continue;

		tcf_chain_hold(chain);
		return chain;
	}

	if (!create)
		return NULL;

	return tcf_chain_create(block, chain_index);
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko4673.02%250.00%
Américo Wang1726.98%250.00%
Total63100.00%4100.00%

EXPORT_SYMBOL(tcf_chain_get);

/*
 * Drop one reference on @chain; the chain is destroyed when the count
 * reaches zero.
 */
void tcf_chain_put(struct tcf_chain *chain)
{
	chain->refcnt--;
	if (chain->refcnt)
		return;

	tcf_chain_destroy(chain);
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko24100.00%1100.00%
Total24100.00%1100.00%

EXPORT_SYMBOL(tcf_chain_put);

/*
 * Record @p_filter_chain as the external head pointer that is kept in
 * sync with @chain's first filter.
 */
static void
tcf_chain_filter_chain_ptr_set(struct tcf_chain *chain,
			       struct tcf_proto __rcu **p_filter_chain)
{
	chain->p_filter_chain = p_filter_chain;
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko24100.00%2100.00%
Total24100.00%2100.00%


/*
 * Allocate a filter block together with its default chain 0.
 *
 * @p_block:        receives the new block on success
 * @p_filter_chain: external head pointer bound to chain 0
 *
 * Returns 0 on success or -ENOMEM when the block or chain 0 cannot be
 * allocated; *@p_block is only written on success.
 */
int tcf_block_get(struct tcf_block **p_block,
		  struct tcf_proto __rcu **p_filter_chain)
{
	struct tcf_block *block;
	struct tcf_chain *chain;

	block = kzalloc(sizeof(*block), GFP_KERNEL);
	if (!block)
		return -ENOMEM;

	INIT_LIST_HEAD(&block->chain_list);

	/* Create chain 0 by default, it has to be always present. */
	chain = tcf_chain_create(block, 0);
	if (!chain) {
		kfree(block);
		return -ENOMEM;
	}

	tcf_chain_filter_chain_ptr_set(chain, p_filter_chain);
	*p_block = block;

	return 0;
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko109100.00%3100.00%
Total109100.00%3100.00%

EXPORT_SYMBOL(tcf_block_get);

/*
 * Work handler that finishes releasing a block: under RTNL, drop one
 * reference on every chain still on the block's list, then free the
 * block itself.
 */
static void tcf_block_put_final(struct work_struct *work)
{
	struct tcf_block *block = container_of(work, struct tcf_block, work);
	struct tcf_chain *cur, *next;

	rtnl_lock();
	/* Only chain 0 should be still here. */
	list_for_each_entry_safe(cur, next, &block->chain_list, list)
		tcf_chain_put(cur);
	rtnl_unlock();

	kfree(block);
}

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang4675.41%250.00%
Jiri Pirko1524.59%250.00%
Total61100.00%4100.00%

/* XXX: Standalone actions are not allowed to jump to any chain, and bound * actions should be all removed after flushing. However, filters are now * destroyed in tc filter workqueue with RTNL lock, they can not race here. */
void tcf_block_put(struct tcf_block *block) { struct tcf_chain *chain, *tmp; if (!block) return; list_for_each_entry_safe(chain, tmp, &block->chain_list, list) tcf_chain_flush(chain); INIT_WORK(&block->work, tcf_block_put_final); /* Wait for RCU callbacks to release the reference count and make * sure their works have been queued before this. */ rcu_barrier(); tcf_queue_work(&block->work); }

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang5081.97%457.14%
Jiri Pirko1118.03%342.86%
Total61100.00%7100.00%

EXPORT_SYMBOL(tcf_block_put);

/* Main classifier routine: scans classifier chain attached
 * to this qdisc, (optionally) tests for protocol and asks
 * specific classifiers.
 *
 * Returns the first non-negative verdict produced by a matching
 * classifier, or TC_ACT_UNSPEC when the chain is exhausted.  With
 * CONFIG_NET_CLS_ACT, a reclassify verdict (unless @compat_mode) restarts
 * from the original filter and a goto-chain verdict restarts from
 * res->goto_tp; after more than max_reclassify_loop restarts the packet
 * is reported as TC_ACT_SHOT.
 */
int tcf_classify(struct sk_buff *skb, const struct tcf_proto *tp,
		 struct tcf_result *res, bool compat_mode)
{
	__be16 protocol = tc_skb_protocol(skb);
#ifdef CONFIG_NET_CLS_ACT
	const int max_reclassify_loop = 4;
	const struct tcf_proto *orig_tp = tp;
	const struct tcf_proto *first_tp;
	int restarts = 0;

reclassify:
#endif
	for (; tp; tp = rcu_dereference_bh(tp->next)) {
		int verdict;

		/* Skip filters bound to some other protocol. */
		if (tp->protocol != protocol &&
		    tp->protocol != htons(ETH_P_ALL))
			continue;

		verdict = tp->classify(skb, tp, res);
#ifdef CONFIG_NET_CLS_ACT
		if (unlikely(verdict == TC_ACT_RECLASSIFY && !compat_mode)) {
			first_tp = orig_tp;
			goto reset;
		}
		if (unlikely(TC_ACT_EXT_CMP(verdict, TC_ACT_GOTO_CHAIN))) {
			first_tp = res->goto_tp;
			goto reset;
		}
#endif
		if (verdict >= 0)
			return verdict;
	}

	return TC_ACT_UNSPEC; /* signal: continue lookup */
#ifdef CONFIG_NET_CLS_ACT
reset:
	if (unlikely(restarts++ >= max_reclassify_loop)) {
		net_notice_ratelimited("%s: reclassify loop, rule prio %u, protocol %02x\n",
				       tp->q->ops->id, tp->prio & 0xffff,
				       ntohs(tp->protocol));
		return TC_ACT_SHOT;
	}

	tp = first_tp;
	protocol = tc_skb_protocol(skb);
	goto reclassify;
#endif
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko239100.00%4100.00%
Total239100.00%4100.00%

EXPORT_SYMBOL(tcf_classify); struct tcf_chain_info { struct tcf_proto __rcu **pprev; struct tcf_proto __rcu *next; };
static struct tcf_proto *tcf_chain_tp_prev(struct tcf_chain_info *chain_info) { return rtnl_dereference(*chain_info->pprev); }

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko22100.00%1100.00%
Total22100.00%1100.00%


/*
 * Link @tp into @chain at the slot described by @chain_info and take a
 * chain reference on behalf of the new filter.
 *
 * If an external head pointer is set and the slot currently holds the
 * chain's first filter, the external pointer is switched to @tp too.
 */
static void tcf_chain_tp_insert(struct tcf_chain *chain,
				struct tcf_chain_info *chain_info,
				struct tcf_proto *tp)
{
	if (chain->p_filter_chain) {
		if (*chain_info->pprev == chain->filter_chain)
			rcu_assign_pointer(*chain->p_filter_chain, tp);
	}

	/* Set up tp->next before tp is stored into the slot. */
	RCU_INIT_POINTER(tp->next, tcf_chain_tp_prev(chain_info));
	rcu_assign_pointer(*chain_info->pprev, tp);

	tcf_chain_hold(chain);
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko6893.15%266.67%
Américo Wang56.85%133.33%
Total73100.00%3100.00%


/*
 * Unlink @tp from @chain using the position in @chain_info and drop the
 * chain reference held for it.
 *
 * If an external head pointer is set and @tp is the chain's first
 * filter, the external pointer is moved to @tp's successor too.
 */
static void tcf_chain_tp_remove(struct tcf_chain *chain,
				struct tcf_chain_info *chain_info,
				struct tcf_proto *tp)
{
	struct tcf_proto *successor = rtnl_dereference(chain_info->next);

	if (chain->p_filter_chain) {
		if (tp == chain->filter_chain)
			RCU_INIT_POINTER(*chain->p_filter_chain, successor);
	}

	RCU_INIT_POINTER(*chain_info->pprev, successor);
	tcf_chain_put(chain);
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko6592.86%266.67%
Américo Wang57.14%133.33%
Total70100.00%3100.00%


/*
 * Search @chain for a filter with priority @prio.
 *
 * The walk stops at the first filter whose prio is >= @prio.  On a normal
 * return @chain_info describes that position: ->pprev is the slot that
 * was examined last and ->next is the successor of the filter found.
 *
 * Returns the filter with exactly @prio, NULL when there is none, or
 * ERR_PTR(-EINVAL) when a filter with @prio exists but @prio_allocate is
 * set or a non-zero @protocol differs from the filter's protocol.  In the
 * error case @chain_info is left untouched.
 */
static struct tcf_proto *tcf_chain_tp_find(struct tcf_chain *chain,
					   struct tcf_chain_info *chain_info,
					   u32 protocol, u32 prio,
					   bool prio_allocate)
{
	struct tcf_proto **pprev = &chain->filter_chain;
	struct tcf_proto *tp;

	/* Check the chain for existence of proto-tcf with this priority */
	while ((tp = rtnl_dereference(*pprev)) != NULL) {
		if (tp->prio < prio) {
			pprev = &tp->next;
			continue;
		}

		if (tp->prio > prio) {
			/* Walked past the requested priority: no match. */
			tp = NULL;
			break;
		}

		if (prio_allocate || (protocol && tp->protocol != protocol))
			return ERR_PTR(-EINVAL);
		break;
	}

	chain_info->pprev = pprev;
	if (tp)
		chain_info->next = tp->next;
	else
		chain_info->next = NULL;

	return tp;
}

Contributors

PersonTokensPropCommitsCommitProp
Jiri Pirko137100.00%2100.00%
Total137100.00%2100.00%


/*
 * Append a netlink message describing filter @tp (and, when @fh is set,
 * the element @fh dumped by the classifier's dump() handler) to @skb.
 *
 * Returns skb->len on success.  On failure the partially written message
 * is trimmed off @skb again and -1 is returned.
 */
static int tcf_fill_node(struct net *net, struct sk_buff *skb,
			 struct tcf_proto *tp, void *fh, u32 portid,
			 u32 seq, u16 flags, int event)
{
	unsigned char *msg_start = skb_tail_pointer(skb);
	struct nlmsghdr *nlh;
	struct tcmsg *tcm;

	nlh = nlmsg_put(skb, portid, seq, event, sizeof(*tcm), flags);
	if (!nlh)
		goto out_nlmsg_trim;

	tcm = nlmsg_data(nlh);
	tcm->tcm_family = AF_UNSPEC;
	tcm->tcm__pad1 = 0;
	tcm->tcm__pad2 = 0;
	tcm->tcm_ifindex = qdisc_dev(tp->q)->ifindex;
	tcm->tcm_parent = tp->classid;
	tcm->tcm_info = TC_H_MAKE(tp->prio, tp->protocol);

	if (nla_put_string(skb, TCA_KIND, tp->ops->kind))
		goto nla_put_failure;
	if (nla_put_u32(skb, TCA_CHAIN, tp->chain->index))
		goto nla_put_failure;

	if (fh) {
		if (tp->ops->dump &&
		    tp->ops->dump(net, tp, fh, skb, tcm) < 0)
			goto nla_put_failure;
	} else {
		tcm->tcm_handle = 0;
	}

	/* Fix up the header length now that all attributes are in place. */
	nlh->nlmsg_len = skb_tail_pointer(skb) - msg_start;
	return skb->len;

out_nlmsg_trim:
nla_put_failure:
	nlmsg_trim(skb, msg_start);
	return -1;
}

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang15860.77%15.56%
Linus Torvalds (pre-git)5621.54%211.11%
Patrick McHardy166.15%316.67%
Hong Zhi Guo114.23%15.56%
Stephen Hemminger62.31%15.56%
Eric W. Biedermann41.54%316.67%
Jiri Pirko31.15%211.11%
David Ahern20.77%15.56%
David S. Miller10.38%15.56%
Stéphane Graber10.38%15.56%
John Fastabend10.38%15.56%
Daniel Borkmann10.38%15.56%
Total260100.00%18100.00%


/*
 * Build a notification of type @event for filter @tp / element @fh and
 * send it, either unicast to the requester or to the RTNLGRP_TC group.
 *
 * Returns -ENOBUFS when no skb can be allocated, -EINVAL when the
 * message cannot be filled in, otherwise the result of the send call.
 */
static int tfilter_notify(struct net *net, struct sk_buff *oskb,
			  struct nlmsghdr *n, struct tcf_proto *tp,
			  void *fh, int event, bool unicast)
{
	struct sk_buff *skb;
	u32 portid = 0;

	if (oskb)
		portid = NETLINK_CB(oskb).portid;

	skb = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
	if (!skb)
		return -ENOBUFS;

	if (tcf_fill_node(net, skb, tp, fh, portid, n->nlmsg_seq,
			  n->nlmsg_flags, event) <= 0) {
		kfree_skb(skb);
		return -EINVAL;
	}

	if (!unicast)
		return rtnetlink_send(skb, net, portid, RTNLGRP_TC,
				      n->nlmsg_flags & NLM_F_ECHO);

	return netlink_unicast(net->rtnl, skb, portid, MSG_DONTWAIT);
}

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang11578.23%233.33%
Jiri Pirko2114.29%233.33%
Daniel Borkmann106.80%116.67%
John Fastabend10.68%116.67%
Total147100.00%6100.00%


/*
 * Delete element @fh of filter @tp and notify about it.
 *
 * The RTM_DELTFILTER message is built first, then the classifier's
 * delete() handler is invoked, and the message is only sent when the
 * deletion succeeded.
 *
 * Returns -ENOBUFS when no skb can be allocated, -EINVAL when the
 * message cannot be filled in, the error from delete() when it fails,
 * otherwise the result of the send call.
 */
static int tfilter_del_notify(struct net *net, struct sk_buff *oskb,
			      struct nlmsghdr *n, struct tcf_proto *tp,
			      void *fh, bool unicast, bool *last)
{
	struct sk_buff *skb;
	u32 portid = 0;
	int err;

	if (oskb)
		portid = NETLINK_CB(oskb).portid;

	skb = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
	if (!skb)
		return -ENOBUFS;

	if (tcf_fill_node(net, skb, tp, fh, portid, n->nlmsg_seq,
			  n->nlmsg_flags, RTM_DELTFILTER) <= 0) {
		kfree_skb(skb);
		return -EINVAL;
	}

	err = tp->ops->delete(tp, fh, last);
	if (err) {
		kfree_skb(skb);
		return err;
	}

	if (!unicast)
		return rtnetlink_send(skb, net, portid, RTNLGRP_TC,
				      n->nlmsg_flags & NLM_F_ECHO);

	return netlink_unicast(net->rtnl, skb, portid, MSG_DONTWAIT);
}

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang14480.00%111.11%
Linus Torvalds (pre-git)179.44%222.22%
Jiri Pirko168.89%444.44%
Patrick McHardy21.11%111.11%
Stephen Hemminger10.56%111.11%
Total180100.00%9100.00%


static void tfilter_notify_chain(struct net *net, struct sk_buff *oskb, struct nlmsghdr *n, struct tcf_chain *chain, int event) { struct tcf_proto *tp; for (tp = rtnl_dereference(chain->filter_chain); tp; tp = rtnl_dereference(tp->next)) tfilter_notify(net, oskb, n, tp, 0, event, false); }

Contributors

PersonTokensPropCommitsCommitProp
Américo Wang6386.30%125.00%
Linus Torvalds (pre-git)912.33%250.00%
Jiri Pirko11.37%125.00%
Total73100.00%4100.00%

/* Add/change/delete/get a filter node */
static int tc_ctl_tfilter(struct sk_buff *skb, struct nlmsghdr *n, struct netlink_ext_ack *extack) { struct net *net = sock_net(skb->sk); struct nlattr *tca[TCA_MAX + 1]; struct tcmsg *t; u32 protocol; u32 prio; bool prio_allocate; u32 parent; u32 chain_index; struct net_device *dev; struct Qdisc *q; struct tcf_chain_info chain_info; struct tcf_chain *chain = NULL; struct tcf_block *block; struct tcf_proto *tp; const struct Qdisc_class_ops *cops; unsigned long cl; void *fh; int err; int tp_created; if ((n->nlmsg_type != RTM_GETTFILTER) && !netlink_ns_capable(skb, net->user_ns, CAP_NET_ADMIN)) return -EPERM; replay: tp_created = 0; err = nlmsg_parse(n, sizeof(*t), tca, TCA_MAX, NULL, extack); if (err < 0) return err; t = nlmsg_data(n); protocol = TC_H_MIN(t->tcm_info); prio = TC_H_MAJ(t->tcm_info); prio_allocate = false; parent = t->tcm_parent; cl = 0; if (prio == 0) { switch (n->nlmsg_type) { case RTM_DELTFILTER: if (protocol || t->tcm_handle || tca[TCA_KIND]) return -ENOENT; break; case RTM_NEWTFILTER: /* If no priority is provided by the user, * we allocate one. */ if (n->nlmsg_flags & NLM_F_CREATE) { prio = TC_H_MAKE(0x80000000U, 0U); prio_allocate = true; break; } /* fall-through */ default: return -ENOENT; } } /* Find head of filter chain. */ /* Find link */ dev = __dev_get_by_index(net, t->tcm_ifindex); if (dev == NULL) return -ENODEV; /* Find qdisc */ if (!parent) { q = dev->qdisc; parent = q->handle; } else { q = qdisc_lookup(dev, TC_H_MAJ(t->tcm_parent)); if (q == NULL) return -EINVAL; } /* Is it classful? */ cops = q->ops->cl_ops; if (!cops) return -EINVAL; if (!cops->tcf_block) return -EOPNOTSUPP; /* Do we search for filter, attached to class? */ if (TC_H_MIN(parent)) { cl = cops->find(q, parent); if (cl == 0) return -ENOENT; } /* And the last stroke */ block = cops->tcf_block(q, cl); if (!block) { err = -EINVAL; goto errout; } chain_index = tca[TCA_CHAIN] ? 
nla_get_u32(tca[TCA_CHAIN]) : 0; if (chain_index > TC_ACT_EXT_VAL_MASK) { err = -EINVAL; goto errout; } chain = tcf_chain_get(block, chain_index, n->nlmsg_type == RTM_NEWTFILTER); if (!chain) { err = n->nlmsg_type == RTM_NEWTFILTER ? -ENOMEM : -EINVAL; goto errout; } if (n->nlmsg_type == RTM_DELTFILTER && prio == 0) { tfilter_notify_chain(net, skb, n, chain, RTM_DELTFILTER)