1085 lines
		
	
	
		
			30 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			1085 lines
		
	
	
		
			30 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| // SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
 | |
| /*
 | |
|  * Copyright (c) 2013-2020, Mellanox Technologies inc. All rights reserved.
 | |
|  */
 | |
| 
 | |
| #include "mlx5_ib.h"
 | |
| #include <linux/mlx5/eswitch.h>
 | |
| #include <linux/mlx5/vport.h>
 | |
| #include "counters.h"
 | |
| #include "ib_rep.h"
 | |
| #include "qp.h"
 | |
| 
 | |
| struct mlx5_ib_counter {
 | |
| 	const char *name;
 | |
| 	size_t offset;
 | |
| 	u32 type;
 | |
| };
 | |
| 
 | |
| #define INIT_Q_COUNTER(_name)		\
 | |
| 	{ .name = #_name, .offset = MLX5_BYTE_OFF(query_q_counter_out, _name)}
 | |
| 
 | |
| #define INIT_VPORT_Q_COUNTER(_name)		\
 | |
| 	{ .name = "vport_" #_name, .offset =	\
 | |
| 		MLX5_BYTE_OFF(query_q_counter_out, _name)}
 | |
| 
 | |
| static const struct mlx5_ib_counter basic_q_cnts[] = {
 | |
| 	INIT_Q_COUNTER(rx_write_requests),
 | |
| 	INIT_Q_COUNTER(rx_read_requests),
 | |
| 	INIT_Q_COUNTER(rx_atomic_requests),
 | |
| 	INIT_Q_COUNTER(rx_dct_connect),
 | |
| 	INIT_Q_COUNTER(out_of_buffer),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter out_of_seq_q_cnts[] = {
 | |
| 	INIT_Q_COUNTER(out_of_sequence),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter retrans_q_cnts[] = {
 | |
| 	INIT_Q_COUNTER(duplicate_request),
 | |
| 	INIT_Q_COUNTER(rnr_nak_retry_err),
 | |
| 	INIT_Q_COUNTER(packet_seq_err),
 | |
| 	INIT_Q_COUNTER(implied_nak_seq_err),
 | |
| 	INIT_Q_COUNTER(local_ack_timeout_err),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter vport_basic_q_cnts[] = {
 | |
| 	INIT_VPORT_Q_COUNTER(rx_write_requests),
 | |
| 	INIT_VPORT_Q_COUNTER(rx_read_requests),
 | |
| 	INIT_VPORT_Q_COUNTER(rx_atomic_requests),
 | |
| 	INIT_VPORT_Q_COUNTER(rx_dct_connect),
 | |
| 	INIT_VPORT_Q_COUNTER(out_of_buffer),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter vport_out_of_seq_q_cnts[] = {
 | |
| 	INIT_VPORT_Q_COUNTER(out_of_sequence),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter vport_retrans_q_cnts[] = {
 | |
| 	INIT_VPORT_Q_COUNTER(duplicate_request),
 | |
| 	INIT_VPORT_Q_COUNTER(rnr_nak_retry_err),
 | |
| 	INIT_VPORT_Q_COUNTER(packet_seq_err),
 | |
| 	INIT_VPORT_Q_COUNTER(implied_nak_seq_err),
 | |
| 	INIT_VPORT_Q_COUNTER(local_ack_timeout_err),
 | |
| };
 | |
| 
 | |
| #define INIT_CONG_COUNTER(_name)		\
 | |
| 	{ .name = #_name, .offset =	\
 | |
| 		MLX5_BYTE_OFF(query_cong_statistics_out, _name ## _high)}
 | |
| 
 | |
| static const struct mlx5_ib_counter cong_cnts[] = {
 | |
| 	INIT_CONG_COUNTER(rp_cnp_ignored),
 | |
| 	INIT_CONG_COUNTER(rp_cnp_handled),
 | |
| 	INIT_CONG_COUNTER(np_ecn_marked_roce_packets),
 | |
| 	INIT_CONG_COUNTER(np_cnp_sent),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter extended_err_cnts[] = {
 | |
| 	INIT_Q_COUNTER(resp_local_length_error),
 | |
| 	INIT_Q_COUNTER(resp_cqe_error),
 | |
| 	INIT_Q_COUNTER(req_cqe_error),
 | |
| 	INIT_Q_COUNTER(req_remote_invalid_request),
 | |
| 	INIT_Q_COUNTER(req_remote_access_errors),
 | |
| 	INIT_Q_COUNTER(resp_remote_access_errors),
 | |
| 	INIT_Q_COUNTER(resp_cqe_flush_error),
 | |
| 	INIT_Q_COUNTER(req_cqe_flush_error),
 | |
| 	INIT_Q_COUNTER(req_transport_retries_exceeded),
 | |
| 	INIT_Q_COUNTER(req_rnr_retries_exceeded),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter roce_accl_cnts[] = {
 | |
| 	INIT_Q_COUNTER(roce_adp_retrans),
 | |
| 	INIT_Q_COUNTER(roce_adp_retrans_to),
 | |
| 	INIT_Q_COUNTER(roce_slow_restart),
 | |
| 	INIT_Q_COUNTER(roce_slow_restart_cnps),
 | |
| 	INIT_Q_COUNTER(roce_slow_restart_trans),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter vport_extended_err_cnts[] = {
 | |
| 	INIT_VPORT_Q_COUNTER(resp_local_length_error),
 | |
| 	INIT_VPORT_Q_COUNTER(resp_cqe_error),
 | |
| 	INIT_VPORT_Q_COUNTER(req_cqe_error),
 | |
| 	INIT_VPORT_Q_COUNTER(req_remote_invalid_request),
 | |
| 	INIT_VPORT_Q_COUNTER(req_remote_access_errors),
 | |
| 	INIT_VPORT_Q_COUNTER(resp_remote_access_errors),
 | |
| 	INIT_VPORT_Q_COUNTER(resp_cqe_flush_error),
 | |
| 	INIT_VPORT_Q_COUNTER(req_cqe_flush_error),
 | |
| 	INIT_VPORT_Q_COUNTER(req_transport_retries_exceeded),
 | |
| 	INIT_VPORT_Q_COUNTER(req_rnr_retries_exceeded),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter vport_roce_accl_cnts[] = {
 | |
| 	INIT_VPORT_Q_COUNTER(roce_adp_retrans),
 | |
| 	INIT_VPORT_Q_COUNTER(roce_adp_retrans_to),
 | |
| 	INIT_VPORT_Q_COUNTER(roce_slow_restart),
 | |
| 	INIT_VPORT_Q_COUNTER(roce_slow_restart_cnps),
 | |
| 	INIT_VPORT_Q_COUNTER(roce_slow_restart_trans),
 | |
| };
 | |
| 
 | |
| #define INIT_EXT_PPCNT_COUNTER(_name)		\
 | |
| 	{ .name = #_name, .offset =	\
 | |
| 	MLX5_BYTE_OFF(ppcnt_reg, \
 | |
| 		      counter_set.eth_extended_cntrs_grp_data_layout._name##_high)}
 | |
| 
 | |
| static const struct mlx5_ib_counter ext_ppcnt_cnts[] = {
 | |
| 	INIT_EXT_PPCNT_COUNTER(rx_icrc_encapsulated),
 | |
| };
 | |
| 
 | |
| #define INIT_OP_COUNTER(_name, _type)		\
 | |
| 	{ .name = #_name, .type = MLX5_IB_OPCOUNTER_##_type}
 | |
| 
 | |
| static const struct mlx5_ib_counter basic_op_cnts[] = {
 | |
| 	INIT_OP_COUNTER(cc_rx_ce_pkts, CC_RX_CE_PKTS),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter rdmarx_cnp_op_cnts[] = {
 | |
| 	INIT_OP_COUNTER(cc_rx_cnp_pkts, CC_RX_CNP_PKTS),
 | |
| };
 | |
| 
 | |
| static const struct mlx5_ib_counter rdmatx_cnp_op_cnts[] = {
 | |
| 	INIT_OP_COUNTER(cc_tx_cnp_pkts, CC_TX_CNP_PKTS),
 | |
| };
 | |
| 
 | |
| static int mlx5_ib_read_counters(struct ib_counters *counters,
 | |
| 				 struct ib_counters_read_attr *read_attr,
 | |
| 				 struct uverbs_attr_bundle *attrs)
 | |
| {
 | |
| 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
 | |
| 	struct mlx5_read_counters_attr mread_attr = {};
 | |
| 	struct mlx5_ib_flow_counters_desc *desc;
 | |
| 	int ret, i;
 | |
| 
 | |
| 	mutex_lock(&mcounters->mcntrs_mutex);
 | |
| 	if (mcounters->cntrs_max_index > read_attr->ncounters) {
 | |
| 		ret = -EINVAL;
 | |
| 		goto err_bound;
 | |
| 	}
 | |
| 
 | |
| 	mread_attr.out = kcalloc(mcounters->counters_num, sizeof(u64),
 | |
| 				 GFP_KERNEL);
 | |
| 	if (!mread_attr.out) {
 | |
| 		ret = -ENOMEM;
 | |
| 		goto err_bound;
 | |
| 	}
 | |
| 
 | |
| 	mread_attr.hw_cntrs_hndl = mcounters->hw_cntrs_hndl;
 | |
| 	mread_attr.flags = read_attr->flags;
 | |
| 	ret = mcounters->read_counters(counters->device, &mread_attr);
 | |
| 	if (ret)
 | |
| 		goto err_read;
 | |
| 
 | |
| 	/* do the pass over the counters data array to assign according to the
 | |
| 	 * descriptions and indexing pairs
 | |
| 	 */
 | |
| 	desc = mcounters->counters_data;
 | |
| 	for (i = 0; i < mcounters->ncounters; i++)
 | |
| 		read_attr->counters_buff[desc[i].index] += mread_attr.out[desc[i].description];
 | |
| 
 | |
| err_read:
 | |
| 	kfree(mread_attr.out);
 | |
| err_bound:
 | |
| 	mutex_unlock(&mcounters->mcntrs_mutex);
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_destroy_counters(struct ib_counters *counters)
 | |
| {
 | |
| 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
 | |
| 
 | |
| 	mlx5_ib_counters_clear_description(counters);
 | |
| 	if (mcounters->hw_cntrs_hndl)
 | |
| 		mlx5_fc_destroy(to_mdev(counters->device)->mdev,
 | |
| 				mcounters->hw_cntrs_hndl);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_create_counters(struct ib_counters *counters,
 | |
| 				   struct uverbs_attr_bundle *attrs)
 | |
| {
 | |
| 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
 | |
| 
 | |
| 	mutex_init(&mcounters->mcntrs_mutex);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static bool vport_qcounters_supported(struct mlx5_ib_dev *dev)
 | |
| {
 | |
| 	return MLX5_CAP_GEN(dev->mdev, q_counter_other_vport) &&
 | |
| 	       MLX5_CAP_GEN(dev->mdev, q_counter_aggregation);
 | |
| }
 | |
| 
 | |
| static const struct mlx5_ib_counters *get_counters(struct mlx5_ib_dev *dev,
 | |
| 						   u32 port_num)
 | |
| {
 | |
| 	if ((is_mdev_switchdev_mode(dev->mdev) &&
 | |
| 	     !vport_qcounters_supported(dev)) || !port_num)
 | |
| 		return &dev->port[0].cnts;
 | |
| 
 | |
| 	return is_mdev_switchdev_mode(dev->mdev) ?
 | |
| 	       &dev->port[1].cnts : &dev->port[port_num - 1].cnts;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * mlx5_ib_get_counters_id - Returns counters id to use for device+port
 | |
|  * @dev:	Pointer to mlx5 IB device
 | |
|  * @port_num:	Zero based port number
 | |
|  *
 | |
|  * mlx5_ib_get_counters_id() Returns counters set id to use for given
 | |
|  * device port combination in switchdev and non switchdev mode of the
 | |
|  * parent device.
 | |
|  */
 | |
| u16 mlx5_ib_get_counters_id(struct mlx5_ib_dev *dev, u32 port_num)
 | |
| {
 | |
| 	const struct mlx5_ib_counters *cnts = get_counters(dev, port_num + 1);
 | |
| 
 | |
| 	return cnts->set_id;
 | |
| }
 | |
| 
 | |
| static struct rdma_hw_stats *do_alloc_stats(const struct mlx5_ib_counters *cnts)
 | |
| {
 | |
| 	struct rdma_hw_stats *stats;
 | |
| 	u32 num_hw_counters;
 | |
| 	int i;
 | |
| 
 | |
| 	num_hw_counters = cnts->num_q_counters + cnts->num_cong_counters +
 | |
| 			  cnts->num_ext_ppcnt_counters;
 | |
| 	stats = rdma_alloc_hw_stats_struct(cnts->descs,
 | |
| 					   num_hw_counters +
 | |
| 					   cnts->num_op_counters,
 | |
| 					   RDMA_HW_STATS_DEFAULT_LIFESPAN);
 | |
| 	if (!stats)
 | |
| 		return NULL;
 | |
| 
 | |
| 	for (i = 0; i < cnts->num_op_counters; i++)
 | |
| 		set_bit(num_hw_counters + i, stats->is_disabled);
 | |
| 
 | |
| 	return stats;
 | |
| }
 | |
| 
 | |
| static struct rdma_hw_stats *
 | |
| mlx5_ib_alloc_hw_device_stats(struct ib_device *ibdev)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
 | |
| 	const struct mlx5_ib_counters *cnts = &dev->port[0].cnts;
 | |
| 
 | |
| 	return do_alloc_stats(cnts);
 | |
| }
 | |
| 
 | |
| static struct rdma_hw_stats *
 | |
| mlx5_ib_alloc_hw_port_stats(struct ib_device *ibdev, u32 port_num)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
 | |
| 	const struct mlx5_ib_counters *cnts = get_counters(dev, port_num);
 | |
| 
 | |
| 	return do_alloc_stats(cnts);
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_query_q_counters(struct mlx5_core_dev *mdev,
 | |
| 				    const struct mlx5_ib_counters *cnts,
 | |
| 				    struct rdma_hw_stats *stats,
 | |
| 				    u16 set_id)
 | |
| {
 | |
| 	u32 out[MLX5_ST_SZ_DW(query_q_counter_out)] = {};
 | |
| 	u32 in[MLX5_ST_SZ_DW(query_q_counter_in)] = {};
 | |
| 	__be32 val;
 | |
| 	int ret, i;
 | |
| 
 | |
| 	MLX5_SET(query_q_counter_in, in, opcode, MLX5_CMD_OP_QUERY_Q_COUNTER);
 | |
| 	MLX5_SET(query_q_counter_in, in, counter_set_id, set_id);
 | |
| 	ret = mlx5_cmd_exec_inout(mdev, query_q_counter, in, out);
 | |
| 	if (ret)
 | |
| 		return ret;
 | |
| 
 | |
| 	for (i = 0; i < cnts->num_q_counters; i++) {
 | |
| 		val = *(__be32 *)((void *)out + cnts->offsets[i]);
 | |
| 		stats->value[i] = (u64)be32_to_cpu(val);
 | |
| 	}
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_query_ext_ppcnt_counters(struct mlx5_ib_dev *dev,
 | |
| 					    const struct mlx5_ib_counters *cnts,
 | |
| 					    struct rdma_hw_stats *stats)
 | |
| {
 | |
| 	int offset = cnts->num_q_counters + cnts->num_cong_counters;
 | |
| 	u32 in[MLX5_ST_SZ_DW(ppcnt_reg)] = {};
 | |
| 	int sz = MLX5_ST_SZ_BYTES(ppcnt_reg);
 | |
| 	int ret, i;
 | |
| 	void *out;
 | |
| 
 | |
| 	out = kvzalloc(sz, GFP_KERNEL);
 | |
| 	if (!out)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	MLX5_SET(ppcnt_reg, in, local_port, 1);
 | |
| 	MLX5_SET(ppcnt_reg, in, grp, MLX5_ETHERNET_EXTENDED_COUNTERS_GROUP);
 | |
| 	ret = mlx5_core_access_reg(dev->mdev, in, sz, out, sz, MLX5_REG_PPCNT,
 | |
| 				   0, 0);
 | |
| 	if (ret)
 | |
| 		goto free;
 | |
| 
 | |
| 	for (i = 0; i < cnts->num_ext_ppcnt_counters; i++)
 | |
| 		stats->value[i + offset] =
 | |
| 			be64_to_cpup((__be64 *)(out +
 | |
| 				    cnts->offsets[i + offset]));
 | |
| free:
 | |
| 	kvfree(out);
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_query_q_counters_vport(struct mlx5_ib_dev *dev,
 | |
| 					  u32 port_num,
 | |
| 					  const struct mlx5_ib_counters *cnts,
 | |
| 					  struct rdma_hw_stats *stats)
 | |
| 
 | |
| {
 | |
| 	u32 out[MLX5_ST_SZ_DW(query_q_counter_out)] = {};
 | |
| 	u32 in[MLX5_ST_SZ_DW(query_q_counter_in)] = {};
 | |
| 	struct mlx5_core_dev *mdev;
 | |
| 	__be32 val;
 | |
| 	int ret, i;
 | |
| 
 | |
| 	if (!dev->port[port_num].rep ||
 | |
| 	    dev->port[port_num].rep->vport == MLX5_VPORT_UPLINK)
 | |
| 		return 0;
 | |
| 
 | |
| 	mdev = mlx5_eswitch_get_core_dev(dev->port[port_num].rep->esw);
 | |
| 	if (!mdev)
 | |
| 		return -EOPNOTSUPP;
 | |
| 
 | |
| 	MLX5_SET(query_q_counter_in, in, opcode, MLX5_CMD_OP_QUERY_Q_COUNTER);
 | |
| 	MLX5_SET(query_q_counter_in, in, other_vport, 1);
 | |
| 	MLX5_SET(query_q_counter_in, in, vport_number,
 | |
| 		 dev->port[port_num].rep->vport);
 | |
| 	MLX5_SET(query_q_counter_in, in, aggregate, 1);
 | |
| 	ret = mlx5_cmd_exec_inout(mdev, query_q_counter, in, out);
 | |
| 	if (ret)
 | |
| 		return ret;
 | |
| 
 | |
| 	for (i = 0; i < cnts->num_q_counters; i++) {
 | |
| 		val = *(__be32 *)((void *)out + cnts->offsets[i]);
 | |
| 		stats->value[i] = (u64)be32_to_cpu(val);
 | |
| 	}
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int do_get_hw_stats(struct ib_device *ibdev,
 | |
| 			   struct rdma_hw_stats *stats,
 | |
| 			   u32 port_num, int index)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
 | |
| 	const struct mlx5_ib_counters *cnts = get_counters(dev, port_num);
 | |
| 	struct mlx5_core_dev *mdev;
 | |
| 	int ret, num_counters;
 | |
| 
 | |
| 	if (!stats)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	num_counters = cnts->num_q_counters +
 | |
| 		       cnts->num_cong_counters +
 | |
| 		       cnts->num_ext_ppcnt_counters;
 | |
| 
 | |
| 	if (is_mdev_switchdev_mode(dev->mdev) && dev->is_rep && port_num != 0)
 | |
| 		ret = mlx5_ib_query_q_counters_vport(dev, port_num - 1, cnts,
 | |
| 						     stats);
 | |
| 	else
 | |
| 		ret = mlx5_ib_query_q_counters(dev->mdev, cnts, stats,
 | |
| 					       cnts->set_id);
 | |
| 	if (ret)
 | |
| 		return ret;
 | |
| 
 | |
| 	/* We don't expose device counters over Vports */
 | |
| 	if (is_mdev_switchdev_mode(dev->mdev) && port_num != 0)
 | |
| 		goto done;
 | |
| 
 | |
| 	if (MLX5_CAP_PCAM_FEATURE(dev->mdev, rx_icrc_encapsulated_counter)) {
 | |
| 		ret =  mlx5_ib_query_ext_ppcnt_counters(dev, cnts, stats);
 | |
| 		if (ret)
 | |
| 			return ret;
 | |
| 	}
 | |
| 
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, cc_query_allowed)) {
 | |
| 		if (!port_num)
 | |
| 			port_num = 1;
 | |
| 		mdev = mlx5_ib_get_native_port_mdev(dev, port_num, NULL);
 | |
| 		if (!mdev) {
 | |
| 			/* If port is not affiliated yet, its in down state
 | |
| 			 * which doesn't have any counters yet, so it would be
 | |
| 			 * zero. So no need to read from the HCA.
 | |
| 			 */
 | |
| 			goto done;
 | |
| 		}
 | |
| 		ret = mlx5_lag_query_cong_counters(dev->mdev,
 | |
| 						   stats->value +
 | |
| 						   cnts->num_q_counters,
 | |
| 						   cnts->num_cong_counters,
 | |
| 						   cnts->offsets +
 | |
| 						   cnts->num_q_counters);
 | |
| 
 | |
| 		mlx5_ib_put_native_port_mdev(dev, port_num);
 | |
| 		if (ret)
 | |
| 			return ret;
 | |
| 	}
 | |
| 
 | |
| done:
 | |
| 	return num_counters;
 | |
| }
 | |
| 
 | |
| static int do_get_op_stat(struct ib_device *ibdev,
 | |
| 			  struct rdma_hw_stats *stats,
 | |
| 			  u32 port_num, int index)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
 | |
| 	const struct mlx5_ib_counters *cnts;
 | |
| 	const struct mlx5_ib_op_fc *opfcs;
 | |
| 	u64 packets = 0, bytes;
 | |
| 	u32 type;
 | |
| 	int ret;
 | |
| 
 | |
| 	cnts = get_counters(dev, port_num);
 | |
| 
 | |
| 	opfcs = cnts->opfcs;
 | |
| 	type = *(u32 *)cnts->descs[index].priv;
 | |
| 	if (type >= MLX5_IB_OPCOUNTER_MAX)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	if (!opfcs[type].fc)
 | |
| 		goto out;
 | |
| 
 | |
| 	ret = mlx5_fc_query(dev->mdev, opfcs[type].fc,
 | |
| 			    &packets, &bytes);
 | |
| 	if (ret)
 | |
| 		return ret;
 | |
| 
 | |
| out:
 | |
| 	stats->value[index] = packets;
 | |
| 	return index;
 | |
| }
 | |
| 
 | |
| static int do_get_op_stats(struct ib_device *ibdev,
 | |
| 			   struct rdma_hw_stats *stats,
 | |
| 			   u32 port_num)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
 | |
| 	const struct mlx5_ib_counters *cnts;
 | |
| 	int index, ret, num_hw_counters;
 | |
| 
 | |
| 	cnts = get_counters(dev, port_num);
 | |
| 	num_hw_counters = cnts->num_q_counters + cnts->num_cong_counters +
 | |
| 			  cnts->num_ext_ppcnt_counters;
 | |
| 	for (index = num_hw_counters;
 | |
| 	     index < (num_hw_counters + cnts->num_op_counters); index++) {
 | |
| 		ret = do_get_op_stat(ibdev, stats, port_num, index);
 | |
| 		if (ret != index)
 | |
| 			return ret;
 | |
| 	}
 | |
| 
 | |
| 	return cnts->num_op_counters;
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_get_hw_stats(struct ib_device *ibdev,
 | |
| 				struct rdma_hw_stats *stats,
 | |
| 				u32 port_num, int index)
 | |
| {
 | |
| 	int num_counters, num_hw_counters, num_op_counters;
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
 | |
| 	const struct mlx5_ib_counters *cnts;
 | |
| 
 | |
| 	cnts = get_counters(dev, port_num);
 | |
| 	num_hw_counters = cnts->num_q_counters + cnts->num_cong_counters +
 | |
| 		cnts->num_ext_ppcnt_counters;
 | |
| 	num_counters = num_hw_counters + cnts->num_op_counters;
 | |
| 
 | |
| 	if (index < 0 || index > num_counters)
 | |
| 		return -EINVAL;
 | |
| 	else if (index > 0 && index < num_hw_counters)
 | |
| 		return do_get_hw_stats(ibdev, stats, port_num, index);
 | |
| 	else if (index >= num_hw_counters && index < num_counters)
 | |
| 		return do_get_op_stat(ibdev, stats, port_num, index);
 | |
| 
 | |
| 	num_hw_counters = do_get_hw_stats(ibdev, stats, port_num, index);
 | |
| 	if (num_hw_counters < 0)
 | |
| 		return num_hw_counters;
 | |
| 
 | |
| 	num_op_counters = do_get_op_stats(ibdev, stats, port_num);
 | |
| 	if (num_op_counters < 0)
 | |
| 		return num_op_counters;
 | |
| 
 | |
| 	return num_hw_counters + num_op_counters;
 | |
| }
 | |
| 
 | |
| static struct rdma_hw_stats *
 | |
| mlx5_ib_counter_alloc_stats(struct rdma_counter *counter)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(counter->device);
 | |
| 	const struct mlx5_ib_counters *cnts = get_counters(dev, counter->port);
 | |
| 
 | |
| 	return do_alloc_stats(cnts);
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_counter_update_stats(struct rdma_counter *counter)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(counter->device);
 | |
| 	const struct mlx5_ib_counters *cnts = get_counters(dev, counter->port);
 | |
| 
 | |
| 	return mlx5_ib_query_q_counters(dev->mdev, cnts,
 | |
| 					counter->stats, counter->id);
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_counter_dealloc(struct rdma_counter *counter)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(counter->device);
 | |
| 	u32 in[MLX5_ST_SZ_DW(dealloc_q_counter_in)] = {};
 | |
| 
 | |
| 	if (!counter->id)
 | |
| 		return 0;
 | |
| 
 | |
| 	MLX5_SET(dealloc_q_counter_in, in, opcode,
 | |
| 		 MLX5_CMD_OP_DEALLOC_Q_COUNTER);
 | |
| 	MLX5_SET(dealloc_q_counter_in, in, counter_set_id, counter->id);
 | |
| 	return mlx5_cmd_exec_in(dev->mdev, dealloc_q_counter, in);
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_counter_bind_qp(struct rdma_counter *counter,
 | |
| 				   struct ib_qp *qp)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(qp->device);
 | |
| 	int err;
 | |
| 
 | |
| 	if (!counter->id) {
 | |
| 		u32 out[MLX5_ST_SZ_DW(alloc_q_counter_out)] = {};
 | |
| 		u32 in[MLX5_ST_SZ_DW(alloc_q_counter_in)] = {};
 | |
| 
 | |
| 		MLX5_SET(alloc_q_counter_in, in, opcode,
 | |
| 			 MLX5_CMD_OP_ALLOC_Q_COUNTER);
 | |
| 		MLX5_SET(alloc_q_counter_in, in, uid, MLX5_SHARED_RESOURCE_UID);
 | |
| 		err = mlx5_cmd_exec_inout(dev->mdev, alloc_q_counter, in, out);
 | |
| 		if (err)
 | |
| 			return err;
 | |
| 		counter->id =
 | |
| 			MLX5_GET(alloc_q_counter_out, out, counter_set_id);
 | |
| 	}
 | |
| 
 | |
| 	err = mlx5_ib_qp_set_counter(qp, counter);
 | |
| 	if (err)
 | |
| 		goto fail_set_counter;
 | |
| 
 | |
| 	return 0;
 | |
| 
 | |
| fail_set_counter:
 | |
| 	mlx5_ib_counter_dealloc(counter);
 | |
| 	counter->id = 0;
 | |
| 
 | |
| 	return err;
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_counter_unbind_qp(struct ib_qp *qp)
 | |
| {
 | |
| 	return mlx5_ib_qp_set_counter(qp, NULL);
 | |
| }
 | |
| 
 | |
| static void mlx5_ib_fill_counters(struct mlx5_ib_dev *dev,
 | |
| 				  struct rdma_stat_desc *descs, size_t *offsets,
 | |
| 				  u32 port_num)
 | |
| {
 | |
| 	bool is_vport = is_mdev_switchdev_mode(dev->mdev) &&
 | |
| 			port_num != MLX5_VPORT_PF;
 | |
| 	const struct mlx5_ib_counter *names;
 | |
| 	int j = 0, i, size;
 | |
| 
 | |
| 	names = is_vport ? vport_basic_q_cnts : basic_q_cnts;
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_basic_q_cnts) :
 | |
| 			  ARRAY_SIZE(basic_q_cnts);
 | |
| 	for (i = 0; i < size; i++, j++) {
 | |
| 		descs[j].name = names[i].name;
 | |
| 		offsets[j] = names[i].offset;
 | |
| 	}
 | |
| 
 | |
| 	names = is_vport ? vport_out_of_seq_q_cnts : out_of_seq_q_cnts;
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_out_of_seq_q_cnts) :
 | |
| 			  ARRAY_SIZE(out_of_seq_q_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, out_of_seq_cnt)) {
 | |
| 		for (i = 0; i < size; i++, j++) {
 | |
| 			descs[j].name = names[i].name;
 | |
| 			offsets[j] = names[i].offset;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	names = is_vport ? vport_retrans_q_cnts : retrans_q_cnts;
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_retrans_q_cnts) :
 | |
| 			  ARRAY_SIZE(retrans_q_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, retransmission_q_counters)) {
 | |
| 		for (i = 0; i < size; i++, j++) {
 | |
| 			descs[j].name = names[i].name;
 | |
| 			offsets[j] = names[i].offset;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	names = is_vport ? vport_extended_err_cnts : extended_err_cnts;
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_extended_err_cnts) :
 | |
| 			  ARRAY_SIZE(extended_err_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, enhanced_error_q_counters)) {
 | |
| 		for (i = 0; i < size; i++, j++) {
 | |
| 			descs[j].name = names[i].name;
 | |
| 			offsets[j] = names[i].offset;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	names = is_vport ? vport_roce_accl_cnts : roce_accl_cnts;
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_roce_accl_cnts) :
 | |
| 			  ARRAY_SIZE(roce_accl_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, roce_accl)) {
 | |
| 		for (i = 0; i < size; i++, j++) {
 | |
| 			descs[j].name = names[i].name;
 | |
| 			offsets[j] = names[i].offset;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (is_vport)
 | |
| 		return;
 | |
| 
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, cc_query_allowed)) {
 | |
| 		for (i = 0; i < ARRAY_SIZE(cong_cnts); i++, j++) {
 | |
| 			descs[j].name = cong_cnts[i].name;
 | |
| 			offsets[j] = cong_cnts[i].offset;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (MLX5_CAP_PCAM_FEATURE(dev->mdev, rx_icrc_encapsulated_counter)) {
 | |
| 		for (i = 0; i < ARRAY_SIZE(ext_ppcnt_cnts); i++, j++) {
 | |
| 			descs[j].name = ext_ppcnt_cnts[i].name;
 | |
| 			offsets[j] = ext_ppcnt_cnts[i].offset;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	for (i = 0; i < ARRAY_SIZE(basic_op_cnts); i++, j++) {
 | |
| 		descs[j].name = basic_op_cnts[i].name;
 | |
| 		descs[j].flags |= IB_STAT_FLAG_OPTIONAL;
 | |
| 		descs[j].priv = &basic_op_cnts[i].type;
 | |
| 	}
 | |
| 
 | |
| 	if (MLX5_CAP_FLOWTABLE(dev->mdev,
 | |
| 			       ft_field_support_2_nic_receive_rdma.bth_opcode)) {
 | |
| 		for (i = 0; i < ARRAY_SIZE(rdmarx_cnp_op_cnts); i++, j++) {
 | |
| 			descs[j].name = rdmarx_cnp_op_cnts[i].name;
 | |
| 			descs[j].flags |= IB_STAT_FLAG_OPTIONAL;
 | |
| 			descs[j].priv = &rdmarx_cnp_op_cnts[i].type;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (MLX5_CAP_FLOWTABLE(dev->mdev,
 | |
| 			       ft_field_support_2_nic_transmit_rdma.bth_opcode)) {
 | |
| 		for (i = 0; i < ARRAY_SIZE(rdmatx_cnp_op_cnts); i++, j++) {
 | |
| 			descs[j].name = rdmatx_cnp_op_cnts[i].name;
 | |
| 			descs[j].flags |= IB_STAT_FLAG_OPTIONAL;
 | |
| 			descs[j].priv = &rdmatx_cnp_op_cnts[i].type;
 | |
| 		}
 | |
| 	}
 | |
| }
 | |
| 
 | |
| 
 | |
| static int __mlx5_ib_alloc_counters(struct mlx5_ib_dev *dev,
 | |
| 				    struct mlx5_ib_counters *cnts, u32 port_num)
 | |
| {
 | |
| 	bool is_vport = is_mdev_switchdev_mode(dev->mdev) &&
 | |
| 			port_num != MLX5_VPORT_PF;
 | |
| 	u32 num_counters, num_op_counters = 0, size;
 | |
| 
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_basic_q_cnts) :
 | |
| 			  ARRAY_SIZE(basic_q_cnts);
 | |
| 	num_counters = size;
 | |
| 
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_out_of_seq_q_cnts) :
 | |
| 			  ARRAY_SIZE(out_of_seq_q_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, out_of_seq_cnt))
 | |
| 		num_counters += size;
 | |
| 
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_retrans_q_cnts) :
 | |
| 			  ARRAY_SIZE(retrans_q_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, retransmission_q_counters))
 | |
| 		num_counters += size;
 | |
| 
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_extended_err_cnts) :
 | |
| 			  ARRAY_SIZE(extended_err_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, enhanced_error_q_counters))
 | |
| 		num_counters += size;
 | |
| 
 | |
| 	size = is_vport ? ARRAY_SIZE(vport_roce_accl_cnts) :
 | |
| 			  ARRAY_SIZE(roce_accl_cnts);
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, roce_accl))
 | |
| 		num_counters += size;
 | |
| 
 | |
| 	cnts->num_q_counters = num_counters;
 | |
| 
 | |
| 	if (is_vport)
 | |
| 		goto skip_non_qcounters;
 | |
| 
 | |
| 	if (MLX5_CAP_GEN(dev->mdev, cc_query_allowed)) {
 | |
| 		cnts->num_cong_counters = ARRAY_SIZE(cong_cnts);
 | |
| 		num_counters += ARRAY_SIZE(cong_cnts);
 | |
| 	}
 | |
| 	if (MLX5_CAP_PCAM_FEATURE(dev->mdev, rx_icrc_encapsulated_counter)) {
 | |
| 		cnts->num_ext_ppcnt_counters = ARRAY_SIZE(ext_ppcnt_cnts);
 | |
| 		num_counters += ARRAY_SIZE(ext_ppcnt_cnts);
 | |
| 	}
 | |
| 
 | |
| 	num_op_counters = ARRAY_SIZE(basic_op_cnts);
 | |
| 
 | |
| 	if (MLX5_CAP_FLOWTABLE(dev->mdev,
 | |
| 			       ft_field_support_2_nic_receive_rdma.bth_opcode))
 | |
| 		num_op_counters += ARRAY_SIZE(rdmarx_cnp_op_cnts);
 | |
| 
 | |
| 	if (MLX5_CAP_FLOWTABLE(dev->mdev,
 | |
| 			       ft_field_support_2_nic_transmit_rdma.bth_opcode))
 | |
| 		num_op_counters += ARRAY_SIZE(rdmatx_cnp_op_cnts);
 | |
| 
 | |
| skip_non_qcounters:
 | |
| 	cnts->num_op_counters = num_op_counters;
 | |
| 	num_counters += num_op_counters;
 | |
| 	cnts->descs = kcalloc(num_counters,
 | |
| 			      sizeof(struct rdma_stat_desc), GFP_KERNEL);
 | |
| 	if (!cnts->descs)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	cnts->offsets = kcalloc(num_counters,
 | |
| 				sizeof(*cnts->offsets), GFP_KERNEL);
 | |
| 	if (!cnts->offsets)
 | |
| 		goto err;
 | |
| 
 | |
| 	return 0;
 | |
| 
 | |
| err:
 | |
| 	kfree(cnts->descs);
 | |
| 	cnts->descs = NULL;
 | |
| 	return -ENOMEM;
 | |
| }
 | |
| 
 | |
| static void mlx5_ib_dealloc_counters(struct mlx5_ib_dev *dev)
 | |
| {
 | |
| 	u32 in[MLX5_ST_SZ_DW(dealloc_q_counter_in)] = {};
 | |
| 	int num_cnt_ports = dev->num_ports;
 | |
| 	int i, j;
 | |
| 
 | |
| 	if (is_mdev_switchdev_mode(dev->mdev))
 | |
| 		num_cnt_ports = min(2, num_cnt_ports);
 | |
| 
 | |
| 	MLX5_SET(dealloc_q_counter_in, in, opcode,
 | |
| 		 MLX5_CMD_OP_DEALLOC_Q_COUNTER);
 | |
| 
 | |
| 	for (i = 0; i < num_cnt_ports; i++) {
 | |
| 		if (dev->port[i].cnts.set_id) {
 | |
| 			MLX5_SET(dealloc_q_counter_in, in, counter_set_id,
 | |
| 				 dev->port[i].cnts.set_id);
 | |
| 			mlx5_cmd_exec_in(dev->mdev, dealloc_q_counter, in);
 | |
| 		}
 | |
| 		kfree(dev->port[i].cnts.descs);
 | |
| 		kfree(dev->port[i].cnts.offsets);
 | |
| 
 | |
| 		for (j = 0; j < MLX5_IB_OPCOUNTER_MAX; j++) {
 | |
| 			if (!dev->port[i].cnts.opfcs[j].fc)
 | |
| 				continue;
 | |
| 
 | |
| 			if (IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS))
 | |
| 				mlx5_ib_fs_remove_op_fc(dev,
 | |
| 					&dev->port[i].cnts.opfcs[j], j);
 | |
| 			mlx5_fc_destroy(dev->mdev,
 | |
| 					dev->port[i].cnts.opfcs[j].fc);
 | |
| 			dev->port[i].cnts.opfcs[j].fc = NULL;
 | |
| 		}
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_alloc_counters(struct mlx5_ib_dev *dev)
 | |
| {
 | |
| 	u32 out[MLX5_ST_SZ_DW(alloc_q_counter_out)] = {};
 | |
| 	u32 in[MLX5_ST_SZ_DW(alloc_q_counter_in)] = {};
 | |
| 	int num_cnt_ports = dev->num_ports;
 | |
| 	int err = 0;
 | |
| 	int i;
 | |
| 	bool is_shared;
 | |
| 
 | |
| 	MLX5_SET(alloc_q_counter_in, in, opcode, MLX5_CMD_OP_ALLOC_Q_COUNTER);
 | |
| 	is_shared = MLX5_CAP_GEN(dev->mdev, log_max_uctx) != 0;
 | |
| 
 | |
| 	/*
 | |
| 	 * In switchdev we need to allocate two ports, one that is used for
 | |
| 	 * the device Q_counters and it is essentially the real Q_counters of
 | |
| 	 * this device, while the other is used as a helper for PF to be able to
 | |
| 	 * query all other vports.
 | |
| 	 */
 | |
| 	if (is_mdev_switchdev_mode(dev->mdev))
 | |
| 		num_cnt_ports = min(2, num_cnt_ports);
 | |
| 
 | |
| 	for (i = 0; i < num_cnt_ports; i++) {
 | |
| 		err = __mlx5_ib_alloc_counters(dev, &dev->port[i].cnts, i);
 | |
| 		if (err)
 | |
| 			goto err_alloc;
 | |
| 
 | |
| 		mlx5_ib_fill_counters(dev, dev->port[i].cnts.descs,
 | |
| 				      dev->port[i].cnts.offsets, i);
 | |
| 
 | |
| 		MLX5_SET(alloc_q_counter_in, in, uid,
 | |
| 			 is_shared ? MLX5_SHARED_RESOURCE_UID : 0);
 | |
| 
 | |
| 		err = mlx5_cmd_exec_inout(dev->mdev, alloc_q_counter, in, out);
 | |
| 		if (err) {
 | |
| 			mlx5_ib_warn(dev,
 | |
| 				     "couldn't allocate queue counter for port %d, err %d\n",
 | |
| 				     i + 1, err);
 | |
| 			goto err_alloc;
 | |
| 		}
 | |
| 
 | |
| 		dev->port[i].cnts.set_id =
 | |
| 			MLX5_GET(alloc_q_counter_out, out, counter_set_id);
 | |
| 	}
 | |
| 	return 0;
 | |
| 
 | |
| err_alloc:
 | |
| 	mlx5_ib_dealloc_counters(dev);
 | |
| 	return err;
 | |
| }
 | |
| 
 | |
| static int read_flow_counters(struct ib_device *ibdev,
 | |
| 			      struct mlx5_read_counters_attr *read_attr)
 | |
| {
 | |
| 	struct mlx5_fc *fc = read_attr->hw_cntrs_hndl;
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
 | |
| 
 | |
| 	return mlx5_fc_query(dev->mdev, fc,
 | |
| 			     &read_attr->out[IB_COUNTER_PACKETS],
 | |
| 			     &read_attr->out[IB_COUNTER_BYTES]);
 | |
| }
 | |
| 
 | |
| /* flow counters currently expose two counters packets and bytes */
 | |
| #define FLOW_COUNTERS_NUM 2
 | |
| static int counters_set_description(
 | |
| 	struct ib_counters *counters, enum mlx5_ib_counters_type counters_type,
 | |
| 	struct mlx5_ib_flow_counters_desc *desc_data, u32 ncounters)
 | |
| {
 | |
| 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
 | |
| 	u32 cntrs_max_index = 0;
 | |
| 	int i;
 | |
| 
 | |
| 	if (counters_type != MLX5_IB_COUNTERS_FLOW)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	/* init the fields for the object */
 | |
| 	mcounters->type = counters_type;
 | |
| 	mcounters->read_counters = read_flow_counters;
 | |
| 	mcounters->counters_num = FLOW_COUNTERS_NUM;
 | |
| 	mcounters->ncounters = ncounters;
 | |
| 	/* each counter entry have both description and index pair */
 | |
| 	for (i = 0; i < ncounters; i++) {
 | |
| 		if (desc_data[i].description > IB_COUNTER_BYTES)
 | |
| 			return -EINVAL;
 | |
| 
 | |
| 		if (cntrs_max_index <= desc_data[i].index)
 | |
| 			cntrs_max_index = desc_data[i].index + 1;
 | |
| 	}
 | |
| 
 | |
| 	mutex_lock(&mcounters->mcntrs_mutex);
 | |
| 	mcounters->counters_data = desc_data;
 | |
| 	mcounters->cntrs_max_index = cntrs_max_index;
 | |
| 	mutex_unlock(&mcounters->mcntrs_mutex);
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| #define MAX_COUNTERS_NUM (USHRT_MAX / (sizeof(u32) * 2))
 | |
| int mlx5_ib_flow_counters_set_data(struct ib_counters *ibcounters,
 | |
| 				   struct mlx5_ib_create_flow *ucmd)
 | |
| {
 | |
| 	struct mlx5_ib_mcounters *mcounters = to_mcounters(ibcounters);
 | |
| 	struct mlx5_ib_flow_counters_data *cntrs_data = NULL;
 | |
| 	struct mlx5_ib_flow_counters_desc *desc_data = NULL;
 | |
| 	bool hw_hndl = false;
 | |
| 	int ret = 0;
 | |
| 
 | |
| 	if (ucmd && ucmd->ncounters_data != 0) {
 | |
| 		cntrs_data = ucmd->data;
 | |
| 		if (cntrs_data->ncounters > MAX_COUNTERS_NUM)
 | |
| 			return -EINVAL;
 | |
| 
 | |
| 		desc_data = kcalloc(cntrs_data->ncounters,
 | |
| 				    sizeof(*desc_data),
 | |
| 				    GFP_KERNEL);
 | |
| 		if (!desc_data)
 | |
| 			return  -ENOMEM;
 | |
| 
 | |
| 		if (copy_from_user(desc_data,
 | |
| 				   u64_to_user_ptr(cntrs_data->counters_data),
 | |
| 				   sizeof(*desc_data) * cntrs_data->ncounters)) {
 | |
| 			ret = -EFAULT;
 | |
| 			goto free;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (!mcounters->hw_cntrs_hndl) {
 | |
| 		mcounters->hw_cntrs_hndl = mlx5_fc_create(
 | |
| 			to_mdev(ibcounters->device)->mdev, false);
 | |
| 		if (IS_ERR(mcounters->hw_cntrs_hndl)) {
 | |
| 			ret = PTR_ERR(mcounters->hw_cntrs_hndl);
 | |
| 			goto free;
 | |
| 		}
 | |
| 		hw_hndl = true;
 | |
| 	}
 | |
| 
 | |
| 	if (desc_data) {
 | |
| 		/* counters already bound to at least one flow */
 | |
| 		if (mcounters->cntrs_max_index) {
 | |
| 			ret = -EINVAL;
 | |
| 			goto free_hndl;
 | |
| 		}
 | |
| 
 | |
| 		ret = counters_set_description(ibcounters,
 | |
| 					       MLX5_IB_COUNTERS_FLOW,
 | |
| 					       desc_data,
 | |
| 					       cntrs_data->ncounters);
 | |
| 		if (ret)
 | |
| 			goto free_hndl;
 | |
| 
 | |
| 	} else if (!mcounters->cntrs_max_index) {
 | |
| 		/* counters not bound yet, must have udata passed */
 | |
| 		ret = -EINVAL;
 | |
| 		goto free_hndl;
 | |
| 	}
 | |
| 
 | |
| 	return 0;
 | |
| 
 | |
| free_hndl:
 | |
| 	if (hw_hndl) {
 | |
| 		mlx5_fc_destroy(to_mdev(ibcounters->device)->mdev,
 | |
| 				mcounters->hw_cntrs_hndl);
 | |
| 		mcounters->hw_cntrs_hndl = NULL;
 | |
| 	}
 | |
| free:
 | |
| 	kfree(desc_data);
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| void mlx5_ib_counters_clear_description(struct ib_counters *counters)
 | |
| {
 | |
| 	struct mlx5_ib_mcounters *mcounters;
 | |
| 
 | |
| 	if (!counters || atomic_read(&counters->usecnt) != 1)
 | |
| 		return;
 | |
| 
 | |
| 	mcounters = to_mcounters(counters);
 | |
| 
 | |
| 	mutex_lock(&mcounters->mcntrs_mutex);
 | |
| 	kfree(mcounters->counters_data);
 | |
| 	mcounters->counters_data = NULL;
 | |
| 	mcounters->cntrs_max_index = 0;
 | |
| 	mutex_unlock(&mcounters->mcntrs_mutex);
 | |
| }
 | |
| 
 | |
| static int mlx5_ib_modify_stat(struct ib_device *device, u32 port,
 | |
| 			       unsigned int index, bool enable)
 | |
| {
 | |
| 	struct mlx5_ib_dev *dev = to_mdev(device);
 | |
| 	struct mlx5_ib_counters *cnts;
 | |
| 	struct mlx5_ib_op_fc *opfc;
 | |
| 	u32 num_hw_counters, type;
 | |
| 	int ret;
 | |
| 
 | |
| 	cnts = &dev->port[port - 1].cnts;
 | |
| 	num_hw_counters = cnts->num_q_counters + cnts->num_cong_counters +
 | |
| 		cnts->num_ext_ppcnt_counters;
 | |
| 	if (index < num_hw_counters ||
 | |
| 	    index >= (num_hw_counters + cnts->num_op_counters))
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	if (!(cnts->descs[index].flags & IB_STAT_FLAG_OPTIONAL))
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	type = *(u32 *)cnts->descs[index].priv;
 | |
| 	if (type >= MLX5_IB_OPCOUNTER_MAX)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	opfc = &cnts->opfcs[type];
 | |
| 
 | |
| 	if (enable) {
 | |
| 		if (opfc->fc)
 | |
| 			return -EEXIST;
 | |
| 
 | |
| 		opfc->fc = mlx5_fc_create(dev->mdev, false);
 | |
| 		if (IS_ERR(opfc->fc))
 | |
| 			return PTR_ERR(opfc->fc);
 | |
| 
 | |
| 		ret = mlx5_ib_fs_add_op_fc(dev, port, opfc, type);
 | |
| 		if (ret) {
 | |
| 			mlx5_fc_destroy(dev->mdev, opfc->fc);
 | |
| 			opfc->fc = NULL;
 | |
| 		}
 | |
| 		return ret;
 | |
| 	}
 | |
| 
 | |
| 	if (!opfc->fc)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	mlx5_ib_fs_remove_op_fc(dev, opfc, type);
 | |
| 	mlx5_fc_destroy(dev->mdev, opfc->fc);
 | |
| 	opfc->fc = NULL;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static const struct ib_device_ops hw_stats_ops = {
 | |
| 	.alloc_hw_port_stats = mlx5_ib_alloc_hw_port_stats,
 | |
| 	.get_hw_stats = mlx5_ib_get_hw_stats,
 | |
| 	.counter_bind_qp = mlx5_ib_counter_bind_qp,
 | |
| 	.counter_unbind_qp = mlx5_ib_counter_unbind_qp,
 | |
| 	.counter_dealloc = mlx5_ib_counter_dealloc,
 | |
| 	.counter_alloc_stats = mlx5_ib_counter_alloc_stats,
 | |
| 	.counter_update_stats = mlx5_ib_counter_update_stats,
 | |
| 	.modify_hw_stat = IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS) ?
 | |
| 			  mlx5_ib_modify_stat : NULL,
 | |
| };
 | |
| 
 | |
| static const struct ib_device_ops hw_switchdev_vport_op = {
 | |
| 	.alloc_hw_port_stats = mlx5_ib_alloc_hw_port_stats,
 | |
| };
 | |
| 
 | |
| static const struct ib_device_ops hw_switchdev_stats_ops = {
 | |
| 	.alloc_hw_device_stats = mlx5_ib_alloc_hw_device_stats,
 | |
| 	.get_hw_stats = mlx5_ib_get_hw_stats,
 | |
| 	.counter_bind_qp = mlx5_ib_counter_bind_qp,
 | |
| 	.counter_unbind_qp = mlx5_ib_counter_unbind_qp,
 | |
| 	.counter_dealloc = mlx5_ib_counter_dealloc,
 | |
| 	.counter_alloc_stats = mlx5_ib_counter_alloc_stats,
 | |
| 	.counter_update_stats = mlx5_ib_counter_update_stats,
 | |
| };
 | |
| 
 | |
| static const struct ib_device_ops counters_ops = {
 | |
| 	.create_counters = mlx5_ib_create_counters,
 | |
| 	.destroy_counters = mlx5_ib_destroy_counters,
 | |
| 	.read_counters = mlx5_ib_read_counters,
 | |
| 
 | |
| 	INIT_RDMA_OBJ_SIZE(ib_counters, mlx5_ib_mcounters, ibcntrs),
 | |
| };
 | |
| 
 | |
| int mlx5_ib_counters_init(struct mlx5_ib_dev *dev)
 | |
| {
 | |
| 	ib_set_device_ops(&dev->ib_dev, &counters_ops);
 | |
| 
 | |
| 	if (!MLX5_CAP_GEN(dev->mdev, max_qp_cnt))
 | |
| 		return 0;
 | |
| 
 | |
| 	if (is_mdev_switchdev_mode(dev->mdev)) {
 | |
| 		ib_set_device_ops(&dev->ib_dev, &hw_switchdev_stats_ops);
 | |
| 		if (vport_qcounters_supported(dev))
 | |
| 			ib_set_device_ops(&dev->ib_dev, &hw_switchdev_vport_op);
 | |
| 	} else
 | |
| 		ib_set_device_ops(&dev->ib_dev, &hw_stats_ops);
 | |
| 	return mlx5_ib_alloc_counters(dev);
 | |
| }
 | |
| 
 | |
| void mlx5_ib_counters_cleanup(struct mlx5_ib_dev *dev)
 | |
| {
 | |
| 	if (!MLX5_CAP_GEN(dev->mdev, max_qp_cnt))
 | |
| 		return;
 | |
| 
 | |
| 	mlx5_ib_dealloc_counters(dev);
 | |
| }
 |