Fri, Oct 12, 2018 at 03:53:30PM CEST, amritha.namb...@intel.com wrote: >Added support in tc flower for filtering based on port ranges. >This is a rework of the RFC patch at: >https://patchwork.ozlabs.org/patch/969595/ > >Example: >1. Match on a port range: >------------------------- >$ tc filter add dev enp4s0 protocol ip parent ffff:\ > prio 1 flower ip_proto tcp dst_port range 20-30 skip_hw\ > action drop > >$ tc -s filter show dev enp4s0 parent ffff: >filter protocol ip pref 1 flower chain 0 >filter protocol ip pref 1 flower chain 0 handle 0x1 > eth_type ipv4 > ip_proto tcp > dst_port_min 20 > dst_port_max 30 > skip_hw > not_in_hw > action order 1: gact action drop > random type none pass val 0 > index 1 ref 1 bind 1 installed 181 sec used 5 sec > Action statistics: > Sent 460 bytes 10 pkt (dropped 10, overlimits 0 requeues 0) > backlog 0b 0p requeues 0 > >2. Match on IP address and port range: >-------------------------------------- >$ tc filter add dev enp4s0 protocol ip parent ffff:\ > prio 1 flower dst_ip 192.168.1.1 ip_proto tcp dst_port range 100-200\ > skip_hw action drop > >$ tc -s filter show dev enp4s0 parent ffff: >filter protocol ip pref 1 flower chain 0 handle 0x2 > eth_type ipv4 > ip_proto tcp > dst_ip 192.168.1.1 > dst_port_min 100 > dst_port_max 200 > skip_hw > not_in_hw > action order 1: gact action drop > random type none pass val 0 > index 2 ref 1 bind 1 installed 28 sec used 6 sec > Action statistics: > Sent 460 bytes 10 pkt (dropped 10, overlimits 0 requeues 0) > backlog 0b 0p requeues 0 > >Signed-off-by: Amritha Nambiar <amritha.namb...@intel.com> >--- > include/uapi/linux/pkt_cls.h | 5 ++ > net/sched/cls_flower.c | 134 ++++++++++++++++++++++++++++++++++++++++-- > 2 files changed, 132 insertions(+), 7 deletions(-) > >diff --git a/include/uapi/linux/pkt_cls.h b/include/uapi/linux/pkt_cls.h >index 401d0c1..b569308 100644 >--- a/include/uapi/linux/pkt_cls.h >+++ b/include/uapi/linux/pkt_cls.h >@@ -405,6 +405,11 @@ enum { > TCA_FLOWER_KEY_UDP_SRC, /* be16 */ > TCA_FLOWER_KEY_UDP_DST, /* be16 */ > >+ TCA_FLOWER_KEY_PORT_SRC_MIN, /* be16 */ >+ TCA_FLOWER_KEY_PORT_SRC_MAX, /* be16 */ >+ TCA_FLOWER_KEY_PORT_DST_MIN, /* be16 */ >+ TCA_FLOWER_KEY_PORT_DST_MAX, /* be16 */ >+ > TCA_FLOWER_FLAGS, > TCA_FLOWER_KEY_VLAN_ID, /* be16 */ > TCA_FLOWER_KEY_VLAN_PRIO, /* u8 */ >diff --git a/net/sched/cls_flower.c b/net/sched/cls_flower.c >index 9aada2d..5f135f0 100644 >--- a/net/sched/cls_flower.c >+++ b/net/sched/cls_flower.c >@@ -55,6 +55,9 @@ struct fl_flow_key { > struct flow_dissector_key_ip ip; > struct flow_dissector_key_ip enc_ip; > struct flow_dissector_key_enc_opts enc_opts; >+ >+ struct flow_dissector_key_ports tp_min; >+ struct flow_dissector_key_ports tp_max; > } __aligned(BITS_PER_LONG / 8); /* Ensure that we can do comparisons as > longs. */ > > struct fl_flow_mask_range { >@@ -103,6 +106,11 @@ struct cls_fl_filter { > struct net_device *hw_dev; > }; > >+enum fl_endpoint { >+ FLOWER_ENDPOINT_DST, >+ FLOWER_ENDPOINT_SRC >+}; >+ > static const struct rhashtable_params mask_ht_params = { > .key_offset = offsetof(struct fl_flow_mask, key), > .key_len = sizeof(struct fl_flow_key), >@@ -179,11 +187,86 @@ static void fl_clear_masked_range(struct fl_flow_key >*key, > memset(fl_key_get_start(key, mask), 0, fl_mask_range(mask)); > } > >+static int fl_range_compare_params(struct cls_fl_filter *filter, >+ struct fl_flow_key *key, >+ struct fl_flow_key *mkey, >+ enum fl_endpoint endpoint) >+{ >+ __be16 min_mask, max_mask, min_val, max_val; >+ >+ if (endpoint == FLOWER_ENDPOINT_DST) { >+ min_mask = htons(filter->mask->key.tp_min.dst); >+ max_mask = htons(filter->mask->key.tp_max.dst); >+ min_val = htons(filter->key.tp_min.dst); >+ max_val = htons(filter->key.tp_max.dst); >+ >+ if (min_mask && max_mask) { >+ if (htons(key->tp.dst) < min_val || >+ htons(key->tp.dst) > max_val) >+ return -1; >+ >+ /* skb does not have min and max values */ >+ mkey->tp_min.dst = filter->mkey.tp_min.dst; >+ mkey->tp_max.dst = filter->mkey.tp_max.dst; >+ } >+ } else { >+ min_mask = htons(filter->mask->key.tp_min.src); >+ max_mask = htons(filter->mask->key.tp_max.src); >+ min_val = htons(filter->key.tp_min.src); >+ max_val = htons(filter->key.tp_max.src); >+ >+ if (min_mask && max_mask) { >+ if (htons(key->tp.src) < min_val || >+ htons(key->tp.src) > max_val) >+ return -1; >+ >+ /* skb does not have min and max values */ >+ mkey->tp_min.src = filter->mkey.tp_min.src; >+ mkey->tp_max.src = filter->mkey.tp_max.src; >+ }
You basically have 2 functions in 1 here. Just have 2 functions: fl_port_range_dst_cmp() and fl_port_range_src_cmp() And avoid the "endpoint enum. Also, as you return -1 or 0, just make it bool. >+ } >+ return 0; >+} >+ >+static struct cls_fl_filter *fl_lookup_range(struct fl_flow_mask *mask, >+ struct fl_flow_key *mkey, >+ struct fl_flow_key *key) >+{ >+ struct cls_fl_filter *filter, *f; >+ int ret; >+ >+ list_for_each_entry_rcu(filter, &mask->filters, list) { >+ ret = fl_range_compare_params(filter, key, mkey, >+ FLOWER_ENDPOINT_DST); >+ if (ret < 0) >+ continue; >+ >+ ret = fl_range_compare_params(filter, key, mkey, >+ FLOWER_ENDPOINT_SRC); >+ if (ret < 0) >+ continue; >+ >+ f = rhashtable_lookup_fast(&mask->ht, >+ fl_key_get_start(mkey, mask), >+ mask->filter_ht_params); >+ if (f) >+ return f; >+ } >+ return NULL; >+} >+ > static struct cls_fl_filter *fl_lookup(struct fl_flow_mask *mask, >- struct fl_flow_key *mkey) >+ struct fl_flow_key *mkey, >+ struct fl_flow_key *key, bool is_skb) > { >- return rhashtable_lookup_fast(&mask->ht, fl_key_get_start(mkey, mask), >- mask->filter_ht_params); >+ if ((!(mask->key.tp_min.dst && mask->key.tp_max.dst) && >+ !(mask->key.tp_min.src && mask->key.tp_max.src)) || !is_skb) { Would be probably good to have a dedicated bit to check for and decide if you do normal/range lookup. This is fast path. >+ return rhashtable_lookup_fast(&mask->ht, Remove double space ^^ >+ fl_key_get_start(mkey, mask), >+ mask->filter_ht_params); >+ } >+ /* Classify based on range */ >+ return fl_lookup_range(mask, mkey, key); > } > > static int fl_classify(struct sk_buff *skb, const struct tcf_proto *tp, >@@ -207,8 +290,8 @@ static int fl_classify(struct sk_buff *skb, const struct >tcf_proto *tp, > skb_flow_dissect(skb, &mask->dissector, &skb_key, 0); > > fl_set_masked_key(&skb_mkey, &skb_key, mask); >+ f = fl_lookup(mask, &skb_mkey, &skb_key, true); > >- f = fl_lookup(mask, &skb_mkey); > if (f && !tc_skip_sw(f->flags)) { > *res = f->res; > return tcf_exts_exec(skb, &f->exts, res); >@@ -909,6 +992,23 @@ static int fl_set_key(struct net *net, struct nlattr **tb, > sizeof(key->arp.tha)); > } > >+ if (key->basic.ip_proto == IPPROTO_TCP || >+ key->basic.ip_proto == IPPROTO_UDP || >+ key->basic.ip_proto == IPPROTO_SCTP) { >+ fl_set_key_val(tb, &key->tp_min.dst, >+ TCA_FLOWER_KEY_PORT_DST_MIN, &mask->tp_min.dst, >+ TCA_FLOWER_UNSPEC, sizeof(key->tp_min.dst)); >+ fl_set_key_val(tb, &key->tp_max.dst, >+ TCA_FLOWER_KEY_PORT_DST_MAX, &mask->tp_max.dst, >+ TCA_FLOWER_UNSPEC, sizeof(key->tp_max.dst)); >+ fl_set_key_val(tb, &key->tp_min.src, >+ TCA_FLOWER_KEY_PORT_SRC_MIN, &mask->tp_min.src, >+ TCA_FLOWER_UNSPEC, sizeof(key->tp_min.src)); >+ fl_set_key_val(tb, &key->tp_max.src, >+ TCA_FLOWER_KEY_PORT_SRC_MAX, &mask->tp_max.src, >+ TCA_FLOWER_UNSPEC, sizeof(key->tp_max.src)); >+ } >+ > if (tb[TCA_FLOWER_KEY_ENC_IPV4_SRC] || > tb[TCA_FLOWER_KEY_ENC_IPV4_DST]) { > key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS; >@@ -1026,8 +1126,7 @@ static void fl_init_dissector(struct flow_dissector >*dissector, > FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4); > FL_KEY_SET_IF_MASKED(mask, keys, cnt, > FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6); >- FL_KEY_SET_IF_MASKED(mask, keys, cnt, >- FLOW_DISSECTOR_KEY_PORTS, tp); >+ FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_PORTS, tp); > FL_KEY_SET_IF_MASKED(mask, keys, cnt, > FLOW_DISSECTOR_KEY_IP, ip); > FL_KEY_SET_IF_MASKED(mask, keys, cnt, >@@ -1227,7 +1326,7 @@ static int fl_change(struct net *net, struct sk_buff >*in_skb, > goto errout_idr; > > if (!tc_skip_sw(fnew->flags)) { >- if (!fold && fl_lookup(fnew->mask, &fnew->mkey)) { >+ if (!fold && fl_lookup(fnew->mask, &fnew->mkey, NULL, false)) { I don't undestand why do you need the "is_skb" arg here. Could you please explain? Thanks! > err = -EEXIST; > goto errout_mask; > } >@@ -1800,6 +1899,27 @@ static int fl_dump_key(struct sk_buff *skb, struct net >*net, > sizeof(key->arp.tha)))) > goto nla_put_failure; > >+ if ((key->basic.ip_proto == IPPROTO_TCP || >+ key->basic.ip_proto == IPPROTO_UDP || >+ key->basic.ip_proto == IPPROTO_SCTP) && >+ (fl_dump_key_val(skb, &key->tp_min.dst, >+ TCA_FLOWER_KEY_PORT_DST_MIN, >+ &mask->tp_min.dst, TCA_FLOWER_UNSPEC, >+ sizeof(key->tp_min.dst)) || >+ fl_dump_key_val(skb, &key->tp_max.dst, >+ TCA_FLOWER_KEY_PORT_DST_MAX, >+ &mask->tp_max.dst, TCA_FLOWER_UNSPEC, >+ sizeof(key->tp_max.dst)) || >+ fl_dump_key_val(skb, &key->tp_min.src, >+ TCA_FLOWER_KEY_PORT_SRC_MIN, >+ &mask->tp_min.src, TCA_FLOWER_UNSPEC, >+ sizeof(key->tp_min.src)) || >+ fl_dump_key_val(skb, &key->tp_max.src, >+ TCA_FLOWER_KEY_PORT_SRC_MAX, >+ &mask->tp_max.src, TCA_FLOWER_UNSPEC, >+ sizeof(key->tp_max.src)))) >+ goto nla_put_failure; >+ > if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS && > (fl_dump_key_val(skb, &key->enc_ipv4.src, > TCA_FLOWER_KEY_ENC_IPV4_SRC, &mask->enc_ipv4.src, >