From: martin Zhang <zhangjunweimar...@didichuxing.com>

Every net namespace now has its own trace_state, and a reference
count is used to control the trace state of the whole kernel.

trace_state in struct per_ns_dm_cb:
Like the previous global trace state, but recorded separately for
every net namespace. Possible values are TRACE_ON/TRACE_OFF.

dm_trace_ref: records how many net namespaces are set to
TRACE_ON. It is incremented when a net namespace changes to
TRACE_ON and decremented when it changes to TRACE_OFF.

Signed-off-by: martin Zhang <zhangjunweimar...@didichuxing.com>
---
 net/core/drop_monitor.c | 88 +++++++++++++++++++++++++++++++++++++++++--------
 1 file changed, 75 insertions(+), 13 deletions(-)

diff --git a/net/core/drop_monitor.c b/net/core/drop_monitor.c
index 6a75e04..0cf25c3 100644
--- a/net/core/drop_monitor.c
+++ b/net/core/drop_monitor.c
@@ -49,10 +49,16 @@
 struct ns_pcpu_dm_data {
 };
 
+/**
+ * struct per_ns_dm_cb  - drop monitor control block in per net ns.
+ * @trace_state:    the trace state.
+ * @ns_dm_mutex:    protect whole per_ns_dm_cb.
+ */
 struct per_ns_dm_cb {
+       int trace_state;
+       struct mutex ns_dm_mutex;
 };
 
-static int trace_state = TRACE_OFF;
 static DEFINE_MUTEX(trace_state_mutex);
 
 struct per_cpu_dm_data {
@@ -70,6 +76,7 @@ struct dm_hw_stat_delta {
        unsigned long last_drop_val;
 };
 
+int dm_trace_ref;
 static int dm_net_id __read_mostly;
 static struct genl_family net_drop_monitor_family;
 
@@ -254,9 +261,16 @@ static int set_all_monitor_traces(int state)
 
        mutex_lock(&trace_state_mutex);
 
-       if (state == trace_state) {
-               rc = -EAGAIN;
-               goto out_unlock;
+       //Cases: Only inc/dec reference value.
+       if (state == TRACE_ON && dm_trace_ref > 0)
+               goto skip_register_trace;
+       else if (state == TRACE_OFF && dm_trace_ref > 1)
+               goto skip_register_trace;
+
+       //Bad cases.
+       if (dm_trace_ref < 0 || (dm_trace_ref == 0 && state == TRACE_OFF)) {
+               rc = -EINPROGRESS;
+               goto skip_register_trace;
        }
 
        switch (state) {
@@ -294,12 +308,15 @@ static int set_all_monitor_traces(int state)
                break;
        }
 
-       if (!rc)
-               trace_state = state;
-       else
+skip_register_trace:
+       if (!rc) {
+               if (state == TRACE_ON)
+                       dm_trace_ref++;
+               else if (state == TRACE_OFF)
+                       dm_trace_ref--;
+       } else
                rc = -EINPROGRESS;
 
-out_unlock:
        mutex_unlock(&trace_state_mutex);
 
        return rc;
@@ -315,22 +332,65 @@ static int net_dm_cmd_config(struct sk_buff *skb,
 static int net_dm_cmd_trace(struct sk_buff *skb,
                        struct genl_info *info)
 {
+       int state;
+       struct net *net;
+       struct per_ns_dm_cb *ns_dm_cb;
+
+       if (!skb->sk)
+               return -ENOTSUPP;
+       net = sock_net(skb->sk);
+       ns_dm_cb = net_generic(net, dm_net_id);
+
+       if (!ns_dm_cb)
+               return -ENOMEM;
+
        switch (info->genlhdr->cmd) {
        case NET_DM_CMD_START:
-               return set_all_monitor_traces(TRACE_ON);
+               state = TRACE_ON;
+               break;
+
        case NET_DM_CMD_STOP:
-               return set_all_monitor_traces(TRACE_OFF);
+               state = TRACE_OFF;
+               break;
+
+       default:
+               return -ENOTSUPP;
        }
 
-       return -ENOTSUPP;
+       mutex_lock(&ns_dm_cb->ns_dm_mutex);
+       if (state == ns_dm_cb->trace_state) {
+               mutex_unlock(&ns_dm_cb->ns_dm_mutex);
+               return -EAGAIN;
+       }
+
+       if (set_all_monitor_traces(state) != 0) {
+               mutex_unlock(&ns_dm_cb->ns_dm_mutex);
+               return -ENOTSUPP;
+       }
+
+       ns_dm_cb->trace_state = state;
+       mutex_unlock(&ns_dm_cb->ns_dm_mutex);
+
+       return 0;
 }
 
 static int dropmon_net_event(struct notifier_block *ev_block,
                             unsigned long event, void *ptr)
 {
-       struct net_device *dev = netdev_notifier_info_to_dev(ptr);
+       struct net *net;
+       struct net_device *dev;
        struct dm_hw_stat_delta *new_stat = NULL;
        struct dm_hw_stat_delta *tmp;
+       struct per_ns_dm_cb *ns_dm_cb;
+
+       dev = netdev_notifier_info_to_dev(ptr);
+       if (!dev)
+               goto out;
+
+       net = dev_net(dev);
+       ns_dm_cb = net_generic(net, dm_net_id);
+       if (!ns_dm_cb)
+               goto out;
 
        switch (event) {
        case NETDEV_REGISTER:
@@ -350,7 +410,7 @@ static int dropmon_net_event(struct notifier_block *ev_block,
                list_for_each_entry_safe(new_stat, tmp, &hw_stats_list, list) {
                        if (new_stat->dev == dev) {
                                new_stat->dev = NULL;
-                               if (trace_state == TRACE_OFF) {
+                               if (ns_dm_cb->trace_state == TRACE_OFF) {
                                        list_del_rcu(&new_stat->list);
                                        kfree_rcu(new_stat, rcu);
                                        break;
@@ -402,6 +462,7 @@ static int __net_init dm_net_init(struct net *net)
        if (!ns_dm_cb)
                return -ENOMEM;
 
+       ns_dm_cb->trace_state = TRACE_OFF;
        return 0;
 }
 
@@ -432,6 +493,7 @@ static int __init init_net_drop_monitor(void)
                pr_err("Unable to store program counters on this arch, Drop 
monitor failed\n");
                return -ENOSPC;
        }
+       dm_trace_ref = 0;
        rc = register_pernet_subsys(&dm_net_ops);
 
        rc = genl_register_family(&net_drop_monitor_family);
-- 
1.8.3.1

Reply via email to