Hi, Jiri On 2017/9/25 1:22, Jiri Pirko wrote: > From: Yotam Gigi <yot...@mellanox.com> > > Make the ipmr module register as a FIB notifier. To do that, implement both > the ipmr_seq_read and ipmr_dump ops. > > The ipmr_seq_read op returns a sequence counter that is incremented on > every notification related operation done by the ipmr. To implement that, > add a sequence counter in the netns_ipv4 struct and increment it whenever a > new MFC route or VIF are added or deleted. The sequence operations are > protected by the RTNL lock. > > The ipmr_dump iterates the list of MFC routes and the list of VIF entries > and sends notifications about them. The entries dump is done under RCU > where the VIF dump uses the mrt_lock too, as the vif->dev field can change > under RCU. > > Signed-off-by: Yotam Gigi <yot...@mellanox.com> > Reviewed-by: Ido Schimmel <ido...@mellanox.com> > Signed-off-by: Jiri Pirko <j...@mellanox.com> > --- > v1->v2: > - Take the mrt_lock when dumping VIF entries. > --- > include/linux/mroute.h | 15 ++++++ > include/net/netns/ipv4.h | 3 ++ > net/ipv4/ipmr.c | 137 > ++++++++++++++++++++++++++++++++++++++++++++++- > 3 files changed, 153 insertions(+), 2 deletions(-) > > diff --git a/include/linux/mroute.h b/include/linux/mroute.h > index 10028f2..54c5cb8 100644 > --- a/include/linux/mroute.h > +++ b/include/linux/mroute.h > @@ -5,6 +5,7 @@ > #include <linux/pim.h> > #include <linux/rhashtable.h> > #include <net/sock.h> > +#include <net/fib_notifier.h> > #include <uapi/linux/mroute.h> > > #ifdef CONFIG_IP_MROUTE > @@ -58,6 +59,14 @@ struct vif_device { > int link; /* Physical interface index > */ > }; > > +struct vif_entry_notifier_info { > + struct fib_notifier_info info; > + struct net_device *dev; > + vifi_t vif_index; > + unsigned short vif_flags; > + u32 tb_id; > +}; > + > #define VIFF_STATIC 0x8000 > > #define VIF_EXISTS(_mrt, _idx) ((_mrt)->vif_table[_idx].dev != NULL) > @@ -146,6 +155,12 @@ struct mfc_cache { > struct rcu_head rcu; > }; > > +struct mfc_entry_notifier_info { > + struct fib_notifier_info info; > + struct mfc_cache *mfc; > + u32 tb_id; > +}; > + > struct rtmsg; > int ipmr_get_route(struct net *net, struct sk_buff *skb, > __be32 saddr, __be32 daddr, > diff --git a/include/net/netns/ipv4.h b/include/net/netns/ipv4.h > index 8387f09..abc84d9 100644 > --- a/include/net/netns/ipv4.h > +++ b/include/net/netns/ipv4.h > @@ -163,6 +163,9 @@ struct netns_ipv4 { > struct fib_notifier_ops *notifier_ops; > unsigned int fib_seq; /* protected by rtnl_mutex */ > > + struct fib_notifier_ops *ipmr_notifier_ops;
Can we add a const here? > + unsigned int ipmr_seq; /* protected by rtnl_mutex */ > + > atomic_t rt_genid; > }; > #endif > diff --git a/net/ipv4/ipmr.c b/net/ipv4/ipmr.c > index 86dc5f9..49879c3 100644 > --- a/net/ipv4/ipmr.c > +++ b/net/ipv4/ipmr.c > @@ -264,6 +264,16 @@ static void __net_exit ipmr_rules_exit(struct net *net) > fib_rules_unregister(net->ipv4.mr_rules_ops); > rtnl_unlock(); > } > + > +static int ipmr_rules_dump(struct net *net, struct notifier_block *nb) > +{ > + return fib_rules_dump(net, nb, RTNL_FAMILY_IPMR); > +} > + > +static unsigned int ipmr_rules_seq_read(struct net *net) > +{ > + return fib_rules_seq_read(net, RTNL_FAMILY_IPMR); > +} > #else > #define ipmr_for_each_table(mrt, net) \ > for (mrt = net->ipv4.mrt; mrt; mrt = NULL) > @@ -298,6 +308,16 @@ static void __net_exit ipmr_rules_exit(struct net *net) > net->ipv4.mrt = NULL; > rtnl_unlock(); > } > + > +static int ipmr_rules_dump(struct net *net, struct notifier_block *nb) > +{ > + return 0; > +} > + > +static unsigned int ipmr_rules_seq_read(struct net *net) > +{ > + return 0; > +} > #endif > > static inline int ipmr_hash_cmp(struct rhashtable_compare_arg *arg, > @@ -587,6 +607,43 @@ static struct net_device *ipmr_reg_vif(struct net *net, > struct mr_table *mrt) > } > #endif > > +static int call_ipmr_vif_entry_notifier(struct notifier_block *nb, > + struct net *net, > + enum fib_event_type event_type, > + struct vif_device *vif, > + vifi_t vif_index, u32 tb_id) > +{ > + struct vif_entry_notifier_info info = { > + .info = { > + .family = RTNL_FAMILY_IPMR, > + .net = net, > + }, > + .dev = vif->dev, > + .vif_index = vif_index, > + .vif_flags = vif->flags, > + .tb_id = tb_id, > + }; We only use info.info which is fib_notifier_info, the vif_entry_notifier_info seems to be not needed, why not just use fib_notifier_info? > + > + return call_fib_notifier(nb, net, event_type, &info.info); > +} > + > +static int call_ipmr_mfc_entry_notifier(struct notifier_block *nb, > + struct net *net, > + enum fib_event_type event_type, > + struct mfc_cache *mfc, u32 tb_id) > +{ > + struct mfc_entry_notifier_info info = { > + .info = { > + .family = RTNL_FAMILY_IPMR, > + .net = net, > + }, > + .mfc = mfc, > + .tb_id = tb_id > + }; > + As above. > + return call_fib_notifier(nb, net, event_type, &info.info); > +} > + > /** > * vif_delete - Delete a VIF entry > * @notify: Set to 1, if the caller is a notifier_call > @@ -3050,14 +3107,87 @@ static const struct net_protocol pim_protocol = { > }; > #endif > > +static unsigned int ipmr_seq_read(struct net *net) > +{ > + ASSERT_RTNL(); > + > + return net->ipv4.ipmr_seq + ipmr_rules_seq_read(net); > +} > + > +static int ipmr_dump(struct net *net, struct notifier_block *nb) > +{ > + struct mr_table *mrt; > + int err; > + > + err = ipmr_rules_dump(net, nb); > + if (err) > + return err; > + > + ipmr_for_each_table(mrt, net) { > + struct vif_device *v = &mrt->vif_table[0]; > + struct mfc_cache *mfc; > + int vifi; > + > + /* Notifiy on table VIF entries */ > + read_lock(&mrt_lock); > + for (vifi = 0; vifi < mrt->maxvif; vifi++, v++) { > + if (!v->dev) > + continue; > + > + call_ipmr_vif_entry_notifier(nb, net, FIB_EVENT_VIF_ADD, > + v, vifi, mrt->id); > + } > + read_unlock(&mrt_lock); > + > + /* Notify on table MFC entries */ > + list_for_each_entry_rcu(mfc, &mrt->mfc_cache_list, list) > + call_ipmr_mfc_entry_notifier(nb, net, > + FIB_EVENT_ENTRY_ADD, mfc, > + mrt->id); > + } > + > + return 0; > +} > + > +static const struct fib_notifier_ops ipmr_notifier_ops_template = { > + .family = RTNL_FAMILY_IPMR, > + .fib_seq_read = ipmr_seq_read, > + .fib_dump = ipmr_dump, > + .owner = THIS_MODULE, > +}; > + > +int __net_init ipmr_notifier_init(struct net *net) > +{ > + struct fib_notifier_ops *ops; > + > + net->ipv4.ipmr_seq = 0; > + > + ops = fib_notifier_ops_register(&ipmr_notifier_ops_template, net); > + if (IS_ERR(ops)) > + return PTR_ERR(ops); > + net->ipv4.ipmr_notifier_ops = ops; > + > + return 0; > +} > + > +static void __net_exit ipmr_notifier_exit(struct net *net) > +{ > + fib_notifier_ops_unregister(net->ipv4.ipmr_notifier_ops); > + net->ipv4.ipmr_notifier_ops = NULL; > +} > + > /* Setup for IP multicast routing */ > static int __net_init ipmr_net_init(struct net *net) > { > int err; > > + err = ipmr_notifier_init(net); > + if (err) > + goto ipmr_notifier_fail; > + > err = ipmr_rules_init(net); > if (err < 0) > - goto fail; > + goto ipmr_rules_fail; > > #ifdef CONFIG_PROC_FS > err = -ENOMEM; > @@ -3074,7 +3204,9 @@ static int __net_init ipmr_net_init(struct net *net) > proc_vif_fail: > ipmr_rules_exit(net); > #endif > -fail: > +ipmr_rules_fail: > + ipmr_notifier_exit(net); > +ipmr_notifier_fail: > return err; > } > > @@ -3084,6 +3216,7 @@ static void __net_exit ipmr_net_exit(struct net *net) > remove_proc_entry("ip_mr_cache", net->proc_net); > remove_proc_entry("ip_mr_vif", net->proc_net); > #endif > + ipmr_notifier_exit(net); > ipmr_rules_exit(net); > } > >