From: Mark Zhang <ma...@mellanox.com>

Since a QP can only be bound to one counter, then if it is bound to a
separate counter, for backward compatibility purpose, the statistic
value must be:
* stat of default counter
+ stat of all running allocated counters
+ stat of all deallocated counters (history stats)

Signed-off-by: Mark Zhang <ma...@mellanox.com>
Reviewed-by: Majd Dibbiny <m...@mellanox.com>
Signed-off-by: Leon Romanovsky <leo...@mellanox.com>
---
 drivers/infiniband/core/counters.c | 99 +++++++++++++++++++++++++++++-
 drivers/infiniband/core/device.c   |  8 ++-
 drivers/infiniband/core/sysfs.c    | 10 ++-
 include/rdma/rdma_counter.h        |  5 +-
 4 files changed, 113 insertions(+), 9 deletions(-)

diff --git a/drivers/infiniband/core/counters.c 
b/drivers/infiniband/core/counters.c
index 36cd9eca1e46..f598b1cdb241 100644
--- a/drivers/infiniband/core/counters.c
+++ b/drivers/infiniband/core/counters.c
@@ -146,6 +146,20 @@ static int __rdma_counter_bind_qp(struct rdma_counter 
*counter,
        return ret;
 }
 
+static void counter_history_stat_update(const struct rdma_counter *counter)
+{
+       struct ib_device *dev = counter->device;
+       struct rdma_port_counter *port_counter;
+       int i;
+
+       port_counter = &dev->port_data[counter->port].port_counter;
+       if (!port_counter->hstats)
+               return;
+
+       for (i = 0; i < counter->stats->num_counters; i++)
+               port_counter->hstats->value[i] += counter->stats->value[i];
+}
+
 static int __rdma_counter_unbind_qp(struct ib_qp *qp, bool force)
 {
        struct rdma_counter *counter = qp->counter;
@@ -285,8 +299,10 @@ int rdma_counter_unbind_qp(struct ib_qp *qp, bool force)
                return ret;
 
        rdma_restrack_put(&counter->res);
-       if (atomic_dec_and_test(&counter->usecnt))
+       if (atomic_dec_and_test(&counter->usecnt)) {
+               counter_history_stat_update(counter);
                rdma_counter_dealloc(counter);
+       }
 
        return 0;
 }
@@ -307,21 +323,98 @@ int rdma_counter_query_stats(struct rdma_counter *counter)
        return ret;
 }
 
-void rdma_counter_init(struct ib_device *dev)
+static u64 get_running_counters_hwstat_sum(struct ib_device *dev,
+                                          u8 port, u32 index)
+{
+       struct rdma_restrack_entry *res;
+       struct rdma_restrack_root *rt;
+       struct rdma_counter *counter;
+       unsigned long id = 0;
+       u64 sum = 0;
+
+       rt = &dev->res[RDMA_RESTRACK_COUNTER];
+       xa_lock(&rt->xa);
+       xa_for_each(&rt->xa, id, res) {
+               if (!rdma_restrack_get(res))
+                       continue;
+
+               counter = container_of(res, struct rdma_counter, res);
+               if ((counter->device != dev) || (counter->port != port))
+                       goto next;
+
+               if (rdma_counter_query_stats(counter))
+                       goto next;
+
+               sum += counter->stats->value[index];
+next:
+               rdma_restrack_put(res);
+       }
+
+       xa_unlock(&rt->xa);
+       return sum;
+}
+
+/**
+ * rdma_counter_get_hwstat_value() - Get the sum value of all counters on a
+ *   specific port, including the running ones and history data
+ */
+u64 rdma_counter_get_hwstat_value(struct ib_device *dev, u8 port, u32 index)
+{
+       struct rdma_port_counter *port_counter;
+       u64 sum;
+
+       if (!rdma_is_port_valid(dev, port))
+               return -EINVAL;
+
+       port_counter = &dev->port_data[port].port_counter;
+       if (index >= port_counter->hstats->num_counters)
+               return -EINVAL;
+
+       sum = get_running_counters_hwstat_sum(dev, port, index);
+       sum += port_counter->hstats->value[index];
+
+       return sum;
+}
+
+int rdma_counter_init(struct ib_device *dev)
 {
        struct rdma_port_counter *port_counter;
        u32 port;
 
        if (!dev->ops.alloc_hw_stats)
-               return;
+               return 0;
 
        rdma_for_each_port(dev, port) {
                port_counter = &dev->port_data[port].port_counter;
                port_counter->mode.mode = RDMA_COUNTER_MODE_NONE;
                mutex_init(&port_counter->lock);
+
+               port_counter->hstats = dev->ops.alloc_hw_stats(dev, port);
+               if (!port_counter->hstats)
+                       goto fail;
        }
+
+       return 0;
+
+fail:
+       rdma_for_each_port(dev, port) {
+               port_counter = &dev->port_data[port].port_counter;
+               kfree(port_counter->hstats);
+       }
+
+       return -ENOMEM;
 }
 
 void rdma_counter_cleanup(struct ib_device *dev)
 {
+       struct rdma_port_counter *port_counter;
+       u32 port;
+
+       if (!dev->ops.alloc_hw_stats)
+               return;
+
+       rdma_for_each_port(dev, port) {
+               port_counter = &dev->port_data[port].port_counter;
+               kfree(port_counter->hstats);
+       }
 }
diff --git a/drivers/infiniband/core/device.c b/drivers/infiniband/core/device.c
index b24a15d7c0c6..82437eb2d1df 100644
--- a/drivers/infiniband/core/device.c
+++ b/drivers/infiniband/core/device.c
@@ -1276,7 +1276,11 @@ int ib_register_device(struct ib_device *device, const 
char *name)
                goto dev_cleanup;
        }
 
-       rdma_counter_init(device);
+       ret = rdma_counter_init(device);
+       if (ret) {
+               dev_warn(&device->dev, "Couldn't initialize counter\n");
+               goto sysfs_cleanup;
+       }
 
        ret = enable_device_and_get(device);
        if (ret) {
@@ -1304,6 +1308,8 @@ int ib_register_device(struct ib_device *device, const 
char *name)
 
        return 0;
 
+sysfs_cleanup:
+       ib_device_unregister_sysfs(device);
 dev_cleanup:
        device_del(&device->dev);
 cg_cleanup:
diff --git a/drivers/infiniband/core/sysfs.c b/drivers/infiniband/core/sysfs.c
index 2fe89754e592..8d1cf1bbb5f5 100644
--- a/drivers/infiniband/core/sysfs.c
+++ b/drivers/infiniband/core/sysfs.c
@@ -43,6 +43,7 @@
 #include <rdma/ib_mad.h>
 #include <rdma/ib_pma.h>
 #include <rdma/ib_cache.h>
+#include <rdma/rdma_counter.h>
 
 struct ib_port;
 
@@ -795,9 +796,12 @@ static int update_hw_stats(struct ib_device *dev, struct 
rdma_hw_stats *stats,
        return 0;
 }
 
-static ssize_t print_hw_stat(struct rdma_hw_stats *stats, int index, char *buf)
+static ssize_t print_hw_stat(struct ib_device *dev, int port_num,
+                            struct rdma_hw_stats *stats, int index, char *buf)
 {
-       return sprintf(buf, "%llu\n", stats->value[index]);
+       u64 v = rdma_counter_get_hwstat_value(dev, port_num, index);
+
+       return sprintf(buf, "%llu\n", stats->value[index] + v);
 }
 
 static ssize_t show_hw_stats(struct kobject *kobj, struct attribute *attr,
@@ -823,7 +827,7 @@ static ssize_t show_hw_stats(struct kobject *kobj, struct 
attribute *attr,
        ret = update_hw_stats(dev, stats, hsa->port_num, hsa->index);
        if (ret)
                goto unlock;
-       ret = print_hw_stat(stats, hsa->index, buf);
+       ret = print_hw_stat(dev, hsa->port_num, stats, hsa->index, buf);
 unlock:
        mutex_unlock(&stats->lock);
 
diff --git a/include/rdma/rdma_counter.h b/include/rdma/rdma_counter.h
index 4bc62909a638..5ad86ae67cc5 100644
--- a/include/rdma/rdma_counter.h
+++ b/include/rdma/rdma_counter.h
@@ -27,6 +27,7 @@ struct rdma_counter_mode {
 
 struct rdma_port_counter {
        struct rdma_counter_mode mode;
+       struct rdma_hw_stats *hstats;
        struct mutex lock;
 };
 
@@ -41,13 +42,13 @@ struct rdma_counter {
        u8                              port;
 };
 
-void rdma_counter_init(struct ib_device *dev);
+int rdma_counter_init(struct ib_device *dev);
 void rdma_counter_cleanup(struct ib_device *dev);
 int rdma_counter_set_auto_mode(struct ib_device *dev, u8 port,
                               bool on, enum rdma_nl_counter_mask mask);
 int rdma_counter_bind_qp_auto(struct ib_qp *qp, u8 port);
 int rdma_counter_unbind_qp(struct ib_qp *qp, bool force);
-
 int rdma_counter_query_stats(struct rdma_counter *counter);
+u64 rdma_counter_get_hwstat_value(struct ib_device *dev, u8 port, u32 index);
 
 #endif /* _RDMA_COUNTER_H_ */
-- 
2.20.1

Reply via email to