Diffstat (limited to 'net/sched/cls_bpf.c')
-rw-r--r--  net/sched/cls_bpf.c | 216
1 file changed, 116 insertions(+), 100 deletions(-)
diff --git a/net/sched/cls_bpf.c b/net/sched/cls_bpf.c
index f57bd531ba98..a9f3e317055c 100644
--- a/net/sched/cls_bpf.c
+++ b/net/sched/cls_bpf.c
@@ -17,6 +17,7 @@
 #include <linux/skbuff.h>
 #include <linux/filter.h>
 #include <linux/bpf.h>
+#include <linux/idr.h>
 
 #include <net/rtnetlink.h>
 #include <net/pkt_cls.h>
@@ -32,7 +33,7 @@ MODULE_DESCRIPTION("TC BPF based classifier");
 
 struct cls_bpf_head {
 	struct list_head plist;
-	u32 hgen;
+	struct idr handle_idr;
 	struct rcu_head rcu;
 };
 
@@ -49,7 +50,10 @@ struct cls_bpf_prog {
 	struct sock_filter *bpf_ops;
 	const char *bpf_name;
 	struct tcf_proto *tp;
-	struct rcu_head rcu;
+	union {
+		struct work_struct work;
+		struct rcu_head rcu;
+	};
 };
 
 static const struct nla_policy bpf_policy[TCA_BPF_MAX + 1] = {
@@ -99,11 +103,11 @@ static int cls_bpf_classify(struct sk_buff *skb, const struct tcf_proto *tp,
 		} else if (at_ingress) {
 			/* It is safe to push/pull even if skb_shared() */
 			__skb_push(skb, skb->mac_len);
-			bpf_compute_data_end(skb);
+			bpf_compute_data_pointers(skb);
 			filter_res = BPF_PROG_RUN(prog->filter, skb);
 			__skb_pull(skb, skb->mac_len);
 		} else {
-			bpf_compute_data_end(skb);
+			bpf_compute_data_pointers(skb);
 			filter_res = BPF_PROG_RUN(prog->filter, skb);
 		}
 
@@ -146,35 +150,39 @@ static bool cls_bpf_is_ebpf(const struct cls_bpf_prog *prog)
 static int cls_bpf_offload_cmd(struct tcf_proto *tp, struct cls_bpf_prog *prog,
 			       enum tc_clsbpf_command cmd)
 {
-	struct net_device *dev = tp->q->dev_queue->dev;
-	struct tc_cls_bpf_offload bpf_offload = {};
-	struct tc_to_netdev offload;
+	bool addorrep = cmd == TC_CLSBPF_ADD || cmd == TC_CLSBPF_REPLACE;
+	struct tcf_block *block = tp->chain->block;
+	bool skip_sw = tc_skip_sw(prog->gen_flags);
+	struct tc_cls_bpf_offload cls_bpf = {};
 	int err;
 
-	offload.type = TC_SETUP_CLSBPF;
-	offload.cls_bpf = &bpf_offload;
-
-	bpf_offload.command = cmd;
-	bpf_offload.exts = &prog->exts;
-	bpf_offload.prog = prog->filter;
-	bpf_offload.name = prog->bpf_name;
-	bpf_offload.exts_integrated = prog->exts_integrated;
-	bpf_offload.gen_flags = prog->gen_flags;
-
-	err = dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle,
-					    tp->chain->index,
-					    tp->protocol, &offload);
+	tc_cls_common_offload_init(&cls_bpf.common, tp);
+	cls_bpf.command = cmd;
+	cls_bpf.exts = &prog->exts;
+	cls_bpf.prog = prog->filter;
+	cls_bpf.name = prog->bpf_name;
+	cls_bpf.exts_integrated = prog->exts_integrated;
+	cls_bpf.gen_flags = prog->gen_flags;
+
+	err = tc_setup_cb_call(block, NULL, TC_SETUP_CLSBPF, &cls_bpf, skip_sw);
+	if (addorrep) {
+		if (err < 0) {
+			cls_bpf_offload_cmd(tp, prog, TC_CLSBPF_DESTROY);
+			return err;
+		} else if (err > 0) {
+			prog->gen_flags |= TCA_CLS_FLAGS_IN_HW;
+		}
+	}
 
-	if (!err && (cmd == TC_CLSBPF_ADD || cmd == TC_CLSBPF_REPLACE))
-		prog->gen_flags |= TCA_CLS_FLAGS_IN_HW;
+	if (addorrep && skip_sw && !(prog->gen_flags & TCA_CLS_FLAGS_IN_HW))
+		return -EINVAL;
 
-	return err;
+	return 0;
 }
 
 static int cls_bpf_offload(struct tcf_proto *tp, struct cls_bpf_prog *prog,
 			   struct cls_bpf_prog *oldprog)
 {
-	struct net_device *dev = tp->q->dev_queue->dev;
 	struct cls_bpf_prog *obj = prog;
 	enum tc_clsbpf_command cmd;
 	bool skip_sw;
@@ -184,7 +192,7 @@ static int cls_bpf_offload(struct tcf_proto *tp, struct cls_bpf_prog *prog,
 		(oldprog && tc_skip_sw(oldprog->gen_flags));
 
 	if (oldprog && oldprog->offloaded) {
-		if (tc_should_offload(dev, tp, prog->gen_flags)) {
+		if (!tc_skip_hw(prog->gen_flags)) {
 			cmd = TC_CLSBPF_REPLACE;
 		} else if (!tc_skip_sw(prog->gen_flags)) {
 			obj = oldprog;
@@ -193,14 +201,14 @@ static int cls_bpf_offload(struct tcf_proto *tp, struct cls_bpf_prog *prog,
 			return -EINVAL;
 		}
 	} else {
-		if (!tc_should_offload(dev, tp, prog->gen_flags))
+		if (tc_skip_hw(prog->gen_flags))
 			return skip_sw ? -EINVAL : 0;
 		cmd = TC_CLSBPF_ADD;
 	}
 
 	ret = cls_bpf_offload_cmd(tp, obj, cmd);
 	if (ret)
-		return skip_sw ? ret : 0;
+		return ret;
 
 	obj->offloaded = true;
 	if (oldprog)
@@ -244,6 +252,7 @@ static int cls_bpf_init(struct tcf_proto *tp)
 		return -ENOBUFS;
 
 	INIT_LIST_HEAD_RCU(&head->plist);
+	idr_init(&head->handle_idr);
 	rcu_assign_pointer(tp->root, head);
 
 	return 0;
@@ -252,6 +261,7 @@ static int cls_bpf_init(struct tcf_proto *tp)
 static void __cls_bpf_delete_prog(struct cls_bpf_prog *prog)
 {
 	tcf_exts_destroy(&prog->exts);
+	tcf_exts_put_net(&prog->exts);
 
 	if (cls_bpf_is_ebpf(prog))
 		bpf_prog_put(prog->filter);
@@ -263,24 +273,42 @@ static void __cls_bpf_delete_prog(struct cls_bpf_prog *prog)
 	kfree(prog);
 }
 
+static void cls_bpf_delete_prog_work(struct work_struct *work)
+{
+	struct cls_bpf_prog *prog = container_of(work, struct cls_bpf_prog, work);
+
+	rtnl_lock();
+	__cls_bpf_delete_prog(prog);
+	rtnl_unlock();
+}
+
 static void cls_bpf_delete_prog_rcu(struct rcu_head *rcu)
 {
-	__cls_bpf_delete_prog(container_of(rcu, struct cls_bpf_prog, rcu));
+	struct cls_bpf_prog *prog = container_of(rcu, struct cls_bpf_prog, rcu);
+
+	INIT_WORK(&prog->work, cls_bpf_delete_prog_work);
+	tcf_queue_work(&prog->work);
}
 
 static void __cls_bpf_delete(struct tcf_proto *tp, struct cls_bpf_prog *prog)
 {
+	struct cls_bpf_head *head = rtnl_dereference(tp->root);
+
+	idr_remove_ext(&head->handle_idr, prog->handle);
 	cls_bpf_stop_offload(tp, prog);
 	list_del_rcu(&prog->link);
 	tcf_unbind_filter(tp, &prog->res);
-	call_rcu(&prog->rcu, cls_bpf_delete_prog_rcu);
+	if (tcf_exts_get_net(&prog->exts))
+		call_rcu(&prog->rcu, cls_bpf_delete_prog_rcu);
+	else
+		__cls_bpf_delete_prog(prog);
 }
 
-static int cls_bpf_delete(struct tcf_proto *tp, unsigned long arg, bool *last)
+static int cls_bpf_delete(struct tcf_proto *tp, void *arg, bool *last)
 {
 	struct cls_bpf_head *head = rtnl_dereference(tp->root);
 
-	__cls_bpf_delete(tp, (struct cls_bpf_prog *) arg);
+	__cls_bpf_delete(tp, arg);
 	*last = list_empty(&head->plist);
 	return 0;
 }
@@ -293,23 +321,21 @@ static void cls_bpf_destroy(struct tcf_proto *tp)
 	list_for_each_entry_safe(prog, tmp, &head->plist, link)
 		__cls_bpf_delete(tp, prog);
 
+	idr_destroy(&head->handle_idr);
 	kfree_rcu(head, rcu);
 }
 
-static unsigned long cls_bpf_get(struct tcf_proto *tp, u32 handle)
+static void *cls_bpf_get(struct tcf_proto *tp, u32 handle)
 {
 	struct cls_bpf_head *head = rtnl_dereference(tp->root);
 	struct cls_bpf_prog *prog;
-	unsigned long ret = 0UL;
 
 	list_for_each_entry(prog, &head->plist, link) {
-		if (prog->handle == handle) {
-			ret = (unsigned long) prog;
-			break;
-		}
+		if (prog->handle == handle)
+			return prog;
 	}
 
-	return ret;
+	return NULL;
 }
 
 static int cls_bpf_prog_from_ops(struct nlattr **tb, struct cls_bpf_prog *prog)
@@ -352,15 +378,17 @@ static int cls_bpf_prog_from_ops(struct nlattr **tb, struct cls_bpf_prog *prog)
 }
 
 static int cls_bpf_prog_from_efd(struct nlattr **tb, struct cls_bpf_prog *prog,
-				 const struct tcf_proto *tp)
+				 u32 gen_flags, const struct tcf_proto *tp)
 {
 	struct bpf_prog *fp;
 	char *name = NULL;
+	bool skip_sw;
 	u32 bpf_fd;
 
 	bpf_fd = nla_get_u32(tb[TCA_BPF_FD]);
+	skip_sw = gen_flags & TCA_CLS_FLAGS_SKIP_SW;
 
-	fp = bpf_prog_get_type(bpf_fd, BPF_PROG_TYPE_SCHED_CLS);
+	fp = bpf_prog_get_type_dev(bpf_fd, BPF_PROG_TYPE_SCHED_CLS, skip_sw);
 	if (IS_ERR(fp))
 		return PTR_ERR(fp);
 
@@ -382,13 +410,11 @@ static int cls_bpf_prog_from_efd(struct nlattr **tb, struct cls_bpf_prog *prog,
 	return 0;
 }
 
-static int cls_bpf_modify_existing(struct net *net, struct tcf_proto *tp,
-				   struct cls_bpf_prog *prog,
-				   unsigned long base, struct nlattr **tb,
-				   struct nlattr *est, bool ovr)
+static int cls_bpf_set_parms(struct net *net, struct tcf_proto *tp,
+			     struct cls_bpf_prog *prog, unsigned long base,
+			     struct nlattr **tb, struct nlattr *est, bool ovr)
 {
 	bool is_bpf, is_ebpf, have_exts = false;
-	struct tcf_exts exts;
 	u32 gen_flags = 0;
 	int ret;
 
@@ -397,83 +423,51 @@ static int cls_bpf_modify_existing(struct net *net, struct tcf_proto *tp,
 	if ((!is_bpf && !is_ebpf) || (is_bpf && is_ebpf))
 		return -EINVAL;
 
-	ret = tcf_exts_init(&exts, TCA_BPF_ACT, TCA_BPF_POLICE);
+	ret = tcf_exts_validate(net, tp, tb, est, &prog->exts, ovr);
 	if (ret < 0)
 		return ret;
-	ret = tcf_exts_validate(net, tp, tb, est, &exts, ovr);
-	if (ret < 0)
-		goto errout;
 
 	if (tb[TCA_BPF_FLAGS]) {
 		u32 bpf_flags = nla_get_u32(tb[TCA_BPF_FLAGS]);
 
-		if (bpf_flags & ~TCA_BPF_FLAG_ACT_DIRECT) {
-			ret = -EINVAL;
-			goto errout;
-		}
+		if (bpf_flags & ~TCA_BPF_FLAG_ACT_DIRECT)
+			return -EINVAL;
 
 		have_exts = bpf_flags & TCA_BPF_FLAG_ACT_DIRECT;
 	}
 	if (tb[TCA_BPF_FLAGS_GEN]) {
 		gen_flags = nla_get_u32(tb[TCA_BPF_FLAGS_GEN]);
 		if (gen_flags & ~CLS_BPF_SUPPORTED_GEN_FLAGS ||
-		    !tc_flags_valid(gen_flags)) {
-			ret = -EINVAL;
-			goto errout;
-		}
+		    !tc_flags_valid(gen_flags))
+			return -EINVAL;
 	}
 
 	prog->exts_integrated = have_exts;
 	prog->gen_flags = gen_flags;
 
 	ret = is_bpf ? cls_bpf_prog_from_ops(tb, prog) :
-		       cls_bpf_prog_from_efd(tb, prog, tp);
+		       cls_bpf_prog_from_efd(tb, prog, gen_flags, tp);
 	if (ret < 0)
-		goto errout;
+		return ret;
 
 	if (tb[TCA_BPF_CLASSID]) {
 		prog->res.classid = nla_get_u32(tb[TCA_BPF_CLASSID]);
 		tcf_bind_filter(tp, &prog->res, base);
 	}
 
-	tcf_exts_change(tp, &prog->exts, &exts);
 	return 0;
-
-errout:
-	tcf_exts_destroy(&exts);
-	return ret;
-}
-
-static u32 cls_bpf_grab_new_handle(struct tcf_proto *tp,
-				   struct cls_bpf_head *head)
-{
-	unsigned int i = 0x80000000;
-	u32 handle;
-
-	do {
-		if (++head->hgen == 0x7FFFFFFF)
-			head->hgen = 1;
-	} while (--i > 0 && cls_bpf_get(tp, head->hgen));
-
-	if (unlikely(i == 0)) {
-		pr_err("Insufficient number of handles\n");
-		handle = 0;
-	} else {
-		handle = head->hgen;
-	}
-
-	return handle;
 }
 
 static int cls_bpf_change(struct net *net, struct sk_buff *in_skb,
 			  struct tcf_proto *tp, unsigned long base,
 			  u32 handle, struct nlattr **tca,
-			  unsigned long *arg, bool ovr)
+			  void **arg, bool ovr)
 {
 	struct cls_bpf_head *head = rtnl_dereference(tp->root);
-	struct cls_bpf_prog *oldprog = (struct cls_bpf_prog *) *arg;
+	struct cls_bpf_prog *oldprog = *arg;
 	struct nlattr *tb[TCA_BPF_MAX + 1];
 	struct cls_bpf_prog *prog;
+	unsigned long idr_index;
 	int ret;
 
 	if (tca[TCA_OPTIONS] == NULL)
@@ -499,22 +493,30 @@ static int cls_bpf_change(struct net *net, struct sk_buff *in_skb,
 		}
 	}
 
-	if (handle == 0)
-		prog->handle = cls_bpf_grab_new_handle(tp, head);
-	else
+	if (handle == 0) {
+		ret = idr_alloc_ext(&head->handle_idr, prog, &idr_index,
+				    1, 0x7FFFFFFF, GFP_KERNEL);
+		if (ret)
+			goto errout;
+		prog->handle = idr_index;
+	} else {
+		if (!oldprog) {
+			ret = idr_alloc_ext(&head->handle_idr, prog, &idr_index,
+					    handle, handle + 1, GFP_KERNEL);
+			if (ret)
+				goto errout;
+		}
 		prog->handle = handle;
-	if (prog->handle == 0) {
-		ret = -EINVAL;
-		goto errout;
 	}
 
-	ret = cls_bpf_modify_existing(net, tp, prog, base, tb, tca[TCA_RATE],
-				      ovr);
+	ret = cls_bpf_set_parms(net, tp, prog, base, tb, tca[TCA_RATE], ovr);
 	if (ret < 0)
-		goto errout;
+		goto errout_idr;
 
 	ret = cls_bpf_offload(tp, prog, oldprog);
 	if (ret) {
+		if (!oldprog)
+			idr_remove_ext(&head->handle_idr, prog->handle);
 		__cls_bpf_delete_prog(prog);
 		return ret;
 	}
@@ -523,16 +525,21 @@ static int cls_bpf_change(struct net *net, struct sk_buff *in_skb,
 		prog->gen_flags |= TCA_CLS_FLAGS_NOT_IN_HW;
 
 	if (oldprog) {
+		idr_replace_ext(&head->handle_idr, prog, handle);
 		list_replace_rcu(&oldprog->link, &prog->link);
 		tcf_unbind_filter(tp, &oldprog->res);
+		tcf_exts_get_net(&oldprog->exts);
 		call_rcu(&oldprog->rcu, cls_bpf_delete_prog_rcu);
 	} else {
 		list_add_rcu(&prog->link, &head->plist);
 	}
 
-	*arg = (unsigned long) prog;
+	*arg = prog;
 	return 0;
 
+errout_idr:
+	if (!oldprog)
+		idr_remove_ext(&head->handle_idr, prog->handle);
 errout:
 	tcf_exts_destroy(&prog->exts);
 	kfree(prog);
@@ -578,10 +585,10 @@ static int cls_bpf_dump_ebpf_info(const struct cls_bpf_prog *prog,
 	return 0;
 }
 
-static int cls_bpf_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
+static int cls_bpf_dump(struct net *net, struct tcf_proto *tp, void *fh,
 			struct sk_buff *skb, struct tcmsg *tm)
 {
-	struct cls_bpf_prog *prog = (struct cls_bpf_prog *) fh;
+	struct cls_bpf_prog *prog = fh;
 	struct nlattr *nest;
 	u32 bpf_flags = 0;
 	int ret;
@@ -631,6 +638,14 @@ nla_put_failure:
 	return -1;
 }
 
+static void cls_bpf_bind_class(void *fh, u32 classid, unsigned long cl)
+{
+	struct cls_bpf_prog *prog = fh;
+
+	if (prog && prog->res.classid == classid)
+		prog->res.class = cl;
+}
+
 static void cls_bpf_walk(struct tcf_proto *tp, struct tcf_walker *arg)
 {
 	struct cls_bpf_head *head = rtnl_dereference(tp->root);
@@ -639,7 +654,7 @@ static void cls_bpf_walk(struct tcf_proto *tp, struct tcf_walker *arg)
 	list_for_each_entry(prog, &head->plist, link) {
 		if (arg->count < arg->skip)
 			goto skip;
-		if (arg->fn(tp, (unsigned long) prog, arg) < 0) {
+		if (arg->fn(tp, prog, arg) < 0) {
 			arg->stop = 1;
 			break;
 		}
@@ -659,6 +674,7 @@ static struct tcf_proto_ops cls_bpf_ops __read_mostly = {
 	.delete		=	cls_bpf_delete,
 	.walk		=	cls_bpf_walk,
 	.dump		=	cls_bpf_dump,
+	.bind_class	=	cls_bpf_bind_class,
 };
 
 static int __init cls_bpf_init_mod(void)
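Note on the handle-allocation scheme this diff switches to (an illustrative sketch, not part of the patch): instead of probing an hgen counter with cls_bpf_get(), a filter handle is now reserved directly in the per-classifier IDR, for both kernel-chosen and user-requested handles. The sketch below only mirrors the idr_alloc_ext() calls visible in the hunks above; the foo_* names are made up for illustration, and the idr_*_ext() interface is the one this kernel version provides.

/* Sketch only: mirrors the IDR usage in the patch above. "foo_head" and
 * foo_reserve_handle() are hypothetical names; idr_alloc_ext() is the call
 * the patch itself makes in cls_bpf_change().
 */
#include <linux/idr.h>
#include <linux/slab.h>

struct foo_head {
	struct idr handle_idr;	/* set up with idr_init(), torn down with idr_destroy() */
};

static int foo_reserve_handle(struct foo_head *head, void *filter,
			      u32 requested, u32 *handle)
{
	unsigned long index;
	int err;

	if (requested == 0)
		/* kernel picks the lowest free handle in [1, 0x7FFFFFFF) */
		err = idr_alloc_ext(&head->handle_idr, filter, &index,
				    1, 0x7FFFFFFF, GFP_KERNEL);
	else
		/* reserve exactly the handle the user asked for */
		err = idr_alloc_ext(&head->handle_idr, filter, &index,
				    requested, requested + 1, GFP_KERNEL);
	if (err)
		return err;	/* handle already taken, or no IDs left */

	*handle = index;
	return 0;
}

On the teardown side, the patch releases a reservation with idr_remove_ext(&head->handle_idr, prog->handle) in __cls_bpf_delete() and on the error path of cls_bpf_change(), and a replace points the existing IDR entry at the new filter via idr_replace_ext().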
