xref: /linux/drivers/infiniband/hw/mana/counters.c (revision baa640d924e55eee9210164ac068ad32dbd69c20)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * Copyright (c) 2024, Microsoft Corporation. All rights reserved.
4  */
5 
6 #include "counters.h"
7 
8 static const struct rdma_stat_desc mana_ib_port_stats_desc[] = {
9 	[MANA_IB_REQUESTER_TIMEOUT].name = "requester_timeout",
10 	[MANA_IB_REQUESTER_OOS_NAK].name = "requester_oos_nak",
11 	[MANA_IB_REQUESTER_RNR_NAK].name = "requester_rnr_nak",
12 	[MANA_IB_RESPONDER_RNR_NAK].name = "responder_rnr_nak",
13 	[MANA_IB_RESPONDER_OOS].name = "responder_oos",
14 	[MANA_IB_RESPONDER_DUP_REQUEST].name = "responder_dup_request",
15 	[MANA_IB_REQUESTER_IMPLICIT_NAK].name = "requester_implicit_nak",
16 	[MANA_IB_REQUESTER_READRESP_PSN_MISMATCH].name = "requester_readresp_psn_mismatch",
17 	[MANA_IB_NAK_INV_REQ].name = "nak_inv_req",
18 	[MANA_IB_NAK_ACCESS_ERR].name = "nak_access_error",
19 	[MANA_IB_NAK_OPP_ERR].name = "nak_opp_error",
20 	[MANA_IB_NAK_INV_READ].name = "nak_inv_read",
21 	[MANA_IB_RESPONDER_LOCAL_LEN_ERR].name = "responder_local_len_error",
22 	[MANA_IB_REQUESTOR_LOCAL_PROT_ERR].name = "requestor_local_prot_error",
23 	[MANA_IB_RESPONDER_REM_ACCESS_ERR].name = "responder_rem_access_error",
24 	[MANA_IB_RESPONDER_LOCAL_QP_ERR].name = "responder_local_qp_error",
25 	[MANA_IB_RESPONDER_MALFORMED_WQE].name = "responder_malformed_wqe",
26 	[MANA_IB_GENERAL_HW_ERR].name = "general_hw_error",
27 	[MANA_IB_REQUESTER_RNR_NAK_RETRIES_EXCEEDED].name = "requester_rnr_nak_retries_exceeded",
28 	[MANA_IB_REQUESTER_RETRIES_EXCEEDED].name = "requester_retries_exceeded",
29 	[MANA_IB_TOTAL_FATAL_ERR].name = "total_fatal_error",
30 	[MANA_IB_RECEIVED_CNPS].name = "received_cnps",
31 	[MANA_IB_NUM_QPS_CONGESTED].name = "num_qps_congested",
32 	[MANA_IB_RATE_INC_EVENTS].name = "rate_inc_events",
33 	[MANA_IB_NUM_QPS_RECOVERED].name = "num_qps_recovered",
34 	[MANA_IB_CURRENT_RATE].name = "current_rate",
35 };
36 
37 static const struct rdma_stat_desc mana_ib_device_stats_desc[] = {
38 	[MANA_IB_SENT_CNPS].name = "sent_cnps",
39 	[MANA_IB_RECEIVED_ECNS].name = "received_ecns",
40 	[MANA_IB_RECEIVED_CNP_COUNT].name = "received_cnp_count",
41 	[MANA_IB_QP_CONGESTED_EVENTS].name = "qp_congested_events",
42 	[MANA_IB_QP_RECOVERED_EVENTS].name = "qp_recovered_events",
43 	[MANA_IB_DEV_RATE_INC_EVENTS].name = "rate_inc_events",
44 };
45 
46 struct rdma_hw_stats *mana_ib_alloc_hw_device_stats(struct ib_device *ibdev)
47 {
48 	return rdma_alloc_hw_stats_struct(mana_ib_device_stats_desc,
49 					  ARRAY_SIZE(mana_ib_device_stats_desc),
50 					  RDMA_HW_STATS_DEFAULT_LIFESPAN);
51 }
52 
53 struct rdma_hw_stats *mana_ib_alloc_hw_port_stats(struct ib_device *ibdev,
54 						  u32 port_num)
55 {
56 	return rdma_alloc_hw_stats_struct(mana_ib_port_stats_desc,
57 					  ARRAY_SIZE(mana_ib_port_stats_desc),
58 					  RDMA_HW_STATS_DEFAULT_LIFESPAN);
59 }
60 
61 static int mana_ib_get_hw_device_stats(struct ib_device *ibdev, struct rdma_hw_stats *stats)
62 {
63 	struct mana_ib_dev *mdev = container_of(ibdev, struct mana_ib_dev,
64 						ib_dev);
65 	struct mana_rnic_query_device_cntrs_resp resp = {};
66 	struct mana_rnic_query_device_cntrs_req req = {};
67 	int err;
68 
69 	mana_gd_init_req_hdr(&req.hdr, MANA_IB_QUERY_DEVICE_COUNTERS,
70 			     sizeof(req), sizeof(resp));
71 	req.hdr.dev_id = mdev->gdma_dev->dev_id;
72 	req.adapter = mdev->adapter_handle;
73 
74 	err = mana_gd_send_request(mdev_to_gc(mdev), sizeof(req), &req,
75 				   sizeof(resp), &resp);
76 	if (err) {
77 		ibdev_err(&mdev->ib_dev, "Failed to query device counters err %d",
78 			  err);
79 		return err;
80 	}
81 
82 	stats->value[MANA_IB_SENT_CNPS] = resp.sent_cnps;
83 	stats->value[MANA_IB_RECEIVED_ECNS] = resp.received_ecns;
84 	stats->value[MANA_IB_RECEIVED_CNP_COUNT] = resp.received_cnp_count;
85 	stats->value[MANA_IB_QP_CONGESTED_EVENTS] = resp.qp_congested_events;
86 	stats->value[MANA_IB_QP_RECOVERED_EVENTS] = resp.qp_recovered_events;
87 	stats->value[MANA_IB_DEV_RATE_INC_EVENTS] = resp.rate_inc_events;
88 
89 	return ARRAY_SIZE(mana_ib_device_stats_desc);
90 }
91 
92 static int mana_ib_get_hw_port_stats(struct ib_device *ibdev, struct rdma_hw_stats *stats,
93 				     u32 port_num)
94 {
95 	struct mana_ib_dev *mdev = container_of(ibdev, struct mana_ib_dev,
96 						ib_dev);
97 	struct mana_rnic_query_vf_cntrs_resp resp = {};
98 	struct mana_rnic_query_vf_cntrs_req req = {};
99 	int err;
100 
101 	mana_gd_init_req_hdr(&req.hdr, MANA_IB_QUERY_VF_COUNTERS,
102 			     sizeof(req), sizeof(resp));
103 	req.hdr.dev_id = mdev->gdma_dev->dev_id;
104 	req.adapter = mdev->adapter_handle;
105 
106 	err = mana_gd_send_request(mdev_to_gc(mdev), sizeof(req), &req,
107 				   sizeof(resp), &resp);
108 	if (err) {
109 		ibdev_err(&mdev->ib_dev, "Failed to query vf counters err %d",
110 			  err);
111 		return err;
112 	}
113 
114 	stats->value[MANA_IB_REQUESTER_TIMEOUT] = resp.requester_timeout;
115 	stats->value[MANA_IB_REQUESTER_OOS_NAK] = resp.requester_oos_nak;
116 	stats->value[MANA_IB_REQUESTER_RNR_NAK] = resp.requester_rnr_nak;
117 	stats->value[MANA_IB_RESPONDER_RNR_NAK] = resp.responder_rnr_nak;
118 	stats->value[MANA_IB_RESPONDER_OOS] = resp.responder_oos;
119 	stats->value[MANA_IB_RESPONDER_DUP_REQUEST] = resp.responder_dup_request;
120 	stats->value[MANA_IB_REQUESTER_IMPLICIT_NAK] =
121 					resp.requester_implicit_nak;
122 	stats->value[MANA_IB_REQUESTER_READRESP_PSN_MISMATCH] =
123 					resp.requester_readresp_psn_mismatch;
124 	stats->value[MANA_IB_NAK_INV_REQ] = resp.nak_inv_req;
125 	stats->value[MANA_IB_NAK_ACCESS_ERR] = resp.nak_access_err;
126 	stats->value[MANA_IB_NAK_OPP_ERR] = resp.nak_opp_err;
127 	stats->value[MANA_IB_NAK_INV_READ] = resp.nak_inv_read;
128 	stats->value[MANA_IB_RESPONDER_LOCAL_LEN_ERR] =
129 					resp.responder_local_len_err;
130 	stats->value[MANA_IB_REQUESTOR_LOCAL_PROT_ERR] =
131 					resp.requestor_local_prot_err;
132 	stats->value[MANA_IB_RESPONDER_REM_ACCESS_ERR] =
133 					resp.responder_rem_access_err;
134 	stats->value[MANA_IB_RESPONDER_LOCAL_QP_ERR] =
135 					resp.responder_local_qp_err;
136 	stats->value[MANA_IB_RESPONDER_MALFORMED_WQE] =
137 					resp.responder_malformed_wqe;
138 	stats->value[MANA_IB_GENERAL_HW_ERR] = resp.general_hw_err;
139 	stats->value[MANA_IB_REQUESTER_RNR_NAK_RETRIES_EXCEEDED] =
140 					resp.requester_rnr_nak_retries_exceeded;
141 	stats->value[MANA_IB_REQUESTER_RETRIES_EXCEEDED] =
142 					resp.requester_retries_exceeded;
143 	stats->value[MANA_IB_TOTAL_FATAL_ERR] = resp.total_fatal_err;
144 
145 	stats->value[MANA_IB_RECEIVED_CNPS] = resp.received_cnps;
146 	stats->value[MANA_IB_NUM_QPS_CONGESTED] = resp.num_qps_congested;
147 	stats->value[MANA_IB_RATE_INC_EVENTS] = resp.rate_inc_events;
148 	stats->value[MANA_IB_NUM_QPS_RECOVERED] = resp.num_qps_recovered;
149 	stats->value[MANA_IB_CURRENT_RATE] = resp.current_rate;
150 
151 	return ARRAY_SIZE(mana_ib_port_stats_desc);
152 }
153 
154 int mana_ib_get_hw_stats(struct ib_device *ibdev, struct rdma_hw_stats *stats,
155 			 u32 port_num, int index)
156 {
157 	if (!port_num)
158 		return mana_ib_get_hw_device_stats(ibdev, stats);
159 	else
160 		return mana_ib_get_hw_port_stats(ibdev, stats, port_num);
161 }
162