2013-07-07 22:25:49 +08:00
|
|
|
/*
|
2015-04-02 22:07:29 +08:00
|
|
|
* Copyright (c) 2013-2015, Mellanox Technologies. All rights reserved.
|
2013-07-07 22:25:49 +08:00
|
|
|
*
|
|
|
|
* This software is available to you under a choice of one of two
|
|
|
|
* licenses. You may choose to be licensed under the terms of the GNU
|
|
|
|
* General Public License (GPL) Version 2, available from the file
|
|
|
|
* COPYING in the main directory of this source tree, or the
|
|
|
|
* OpenIB.org BSD license below:
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or
|
|
|
|
* without modification, are permitted provided that the following
|
|
|
|
* conditions are met:
|
|
|
|
*
|
|
|
|
* - Redistributions of source code must retain the above
|
|
|
|
* copyright notice, this list of conditions and the following
|
|
|
|
* disclaimer.
|
|
|
|
*
|
|
|
|
* - Redistributions in binary form must reproduce the above
|
|
|
|
* copyright notice, this list of conditions and the following
|
|
|
|
* disclaimer in the documentation and/or other materials
|
|
|
|
* provided with the distribution.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
|
|
|
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
|
|
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
|
|
|
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
|
|
|
|
* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
|
|
|
|
* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
|
|
|
|
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
|
|
* SOFTWARE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef MLX5_DRIVER_H
|
|
|
|
#define MLX5_DRIVER_H
|
|
|
|
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/completion.h>
|
|
|
|
#include <linux/pci.h>
|
2018-01-04 10:35:51 +08:00
|
|
|
#include <linux/irq.h>
|
2013-07-07 22:25:49 +08:00
|
|
|
#include <linux/spinlock_types.h>
|
|
|
|
#include <linux/semaphore.h>
|
2014-02-14 12:45:17 +08:00
|
|
|
#include <linux/slab.h>
|
2013-07-07 22:25:49 +08:00
|
|
|
#include <linux/vmalloc.h>
|
2019-06-20 15:03:47 +08:00
|
|
|
#include <linux/xarray.h>
|
2016-05-13 20:55:41 +08:00
|
|
|
#include <linux/workqueue.h>
|
2017-01-02 17:37:46 +08:00
|
|
|
#include <linux/mempool.h>
|
net/mlx5_core: Use tasklet for user-space CQ completion events
Previously, we've fired all our completion callbacks straight from
our ISR.
Some of those callbacks were lightweight (for example, mlx5 Ethernet
napi callbacks), but some of them did more work (for example,
the user-space RDMA stack uverbs' completion handler). Besides that,
doing more than the minimal work in ISR is generally considered wrong,
it could even lead to a hard lockup of the system. Since when a lot
of completion events are generated by the hardware, the loop over
those events could be so long, that we'll get into a hard lockup by
the system watchdog.
In order to avoid that, add a new way of invoking completion events
callbacks. In the interrupt itself, we add the CQs which receive
completion event to a per-EQ list and schedule a tasklet. In the
tasklet context we loop over all the CQs in the list and invoke the
user callback.
Signed-off-by: Matan Barak <matanb@mellanox.com>
Signed-off-by: Doug Ledford <dledford@redhat.com>
2016-04-17 22:08:40 +08:00
|
|
|
#include <linux/interrupt.h>
|
2017-03-26 22:01:57 +08:00
|
|
|
#include <linux/idr.h>
|
2018-11-27 06:38:56 +08:00
|
|
|
#include <linux/notifier.h>
|
2019-08-06 09:59:50 +08:00
|
|
|
#include <linux/refcount.h>
|
2020-10-08 21:06:37 +08:00
|
|
|
#include <linux/auxiliary_bus.h>
|
2014-02-14 12:45:17 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
#include <linux/mlx5/device.h>
|
|
|
|
#include <linux/mlx5/doorbell.h>
|
2018-11-21 06:12:21 +08:00
|
|
|
#include <linux/mlx5/eq.h>
|
2017-08-15 18:46:04 +08:00
|
|
|
#include <linux/timecounter.h>
|
|
|
|
#include <linux/ptp_clock_kernel.h>
|
2018-12-11 22:09:53 +08:00
|
|
|
#include <net/devlink.h>
|
2013-07-07 22:25:49 +08:00
|
|
|
|
2020-10-04 19:30:58 +08:00
|
|
|
#define MLX5_ADEV_NAME "mlx5_core"
|
|
|
|
|
2021-08-19 21:18:57 +08:00
|
|
|
#define MLX5_IRQ_EQ_CTRL (U8_MAX)
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/* Board identifier length constant. */
enum {
	MLX5_BOARD_ID_LEN = 64,
};
|
|
|
|
|
|
|
|
/* Command interface limits. */
enum {
	/* one minute for the sake of bringup. Generally, commands must always
	 * complete and we may need to increase this timeout value
	 */
	MLX5_CMD_TIMEOUT_MSEC	= 60 * 1000,
	/* Size of the wq_name[] buffer in struct mlx5_cmd. */
	MLX5_CMD_WQ_MAX_NAME	= 32,
};
|
|
|
|
|
|
|
|
/* Command ownership values and the success status code. */
enum {
	CMD_OWNER_SW		= 0x0,
	CMD_OWNER_HW		= 0x1,
	CMD_STATUS_SUCCESS	= 0,
};
|
|
|
|
|
|
|
|
/* Enumerators of type mlx5_sqp_t; every value is assigned explicitly. */
enum mlx5_sqp_t {
	MLX5_SQP_SMI		= 0,
	MLX5_SQP_GSI		= 1,
	MLX5_SQP_IEEE_1588	= 2,
	MLX5_SQP_SNIFFER	= 3,
	MLX5_SQP_SYNC_UMR	= 4,
};
|
|
|
|
|
|
|
|
/* Port count limit. */
enum {
	MLX5_MAX_PORTS	= 2,
};
|
|
|
|
|
|
|
|
/*
 * Atomic mode constants: MLX5_ATOMIC_MODE_OFFSET plus the individual mode
 * codes. NOTE(review): the offset is presumably a bit shift applied to the
 * mode codes - confirm against the users of these constants.
 */
enum {
	MLX5_ATOMIC_MODE_OFFSET = 16,
	MLX5_ATOMIC_MODE_IB_COMP = 1,
	MLX5_ATOMIC_MODE_CX = 2,
	MLX5_ATOMIC_MODE_8B = 3,
	MLX5_ATOMIC_MODE_16B = 4,
	MLX5_ATOMIC_MODE_32B = 5,
	MLX5_ATOMIC_MODE_64B = 6,
	MLX5_ATOMIC_MODE_128B = 7,
	MLX5_ATOMIC_MODE_256B = 8,
};
|
|
|
|
|
|
|
|
/*
 * Register identifiers (MLX5_REG_*). The order below is the order of the
 * original declaration and is not strictly sorted by numeric value.
 */
enum {
	MLX5_REG_QPTS            = 0x4002,
	MLX5_REG_QETCR		 = 0x4005,
	MLX5_REG_QTCT		 = 0x400a,
	MLX5_REG_QPDPM           = 0x4013,
	MLX5_REG_QCAM            = 0x4019,
	MLX5_REG_DCBX_PARAM      = 0x4020,
	MLX5_REG_DCBX_APP        = 0x4021,
	MLX5_REG_FPGA_CAP	 = 0x4022,
	MLX5_REG_FPGA_CTRL	 = 0x4023,
	MLX5_REG_FPGA_ACCESS_REG = 0x4024,
	MLX5_REG_CORE_DUMP	 = 0x402e,
	MLX5_REG_PCAP		 = 0x5001,
	MLX5_REG_PMTU		 = 0x5003,
	MLX5_REG_PTYS		 = 0x5004,
	MLX5_REG_PAOS		 = 0x5006,
	MLX5_REG_PFCC            = 0x5007,
	MLX5_REG_PPCNT		 = 0x5008,
	MLX5_REG_PPTB            = 0x500b,
	MLX5_REG_PBMC            = 0x500c,
	MLX5_REG_PMAOS		 = 0x5012,
	MLX5_REG_PUDE		 = 0x5009,
	MLX5_REG_PMPE		 = 0x5010,
	MLX5_REG_PELC		 = 0x500e,
	MLX5_REG_PVLC		 = 0x500f,
	MLX5_REG_PCMR		 = 0x5041,
	MLX5_REG_PDDR		 = 0x5031,
	MLX5_REG_PMLP		 = 0x5002,
	MLX5_REG_PPLM		 = 0x5023,
	MLX5_REG_PCAM		 = 0x507f,
	MLX5_REG_NODE_DESC	 = 0x6001,
	MLX5_REG_HOST_ENDIANNESS = 0x7004,
	MLX5_REG_MCIA		 = 0x9014,
	MLX5_REG_MFRL		 = 0x9028,
	MLX5_REG_MLCR		 = 0x902b,
	MLX5_REG_MTRC_CAP	 = 0x9040,
	MLX5_REG_MTRC_CONF	 = 0x9041,
	MLX5_REG_MTRC_STDB	 = 0x9042,
	MLX5_REG_MTRC_CTRL	 = 0x9043,
	MLX5_REG_MPEIN		 = 0x9050,
	MLX5_REG_MPCNT		 = 0x9051,
	MLX5_REG_MTPPS		 = 0x9053,
	MLX5_REG_MTPPSE		 = 0x9054,
	MLX5_REG_MTUTC		 = 0x9055,
	MLX5_REG_MPEGC		 = 0x9056,
	MLX5_REG_MCQS		 = 0x9060,
	MLX5_REG_MCQI		 = 0x9061,
	MLX5_REG_MCC		 = 0x9062,
	MLX5_REG_MCDA		 = 0x9063,
	MLX5_REG_MCAM		 = 0x907f,
	MLX5_REG_MIRC		 = 0x9162,
	MLX5_REG_SBCAM		 = 0xB01F,
	MLX5_REG_RESOURCE_DUMP   = 0xC000,
	MLX5_REG_DTOR            = 0xC00E,
};
|
|
|
|
|
2017-07-19 05:08:46 +08:00
|
|
|
/* Trust state values: PCP or DSCP. */
enum mlx5_qpts_trust_state {
	MLX5_QPTS_TRUST_PCP  = 1,
	MLX5_QPTS_TRUST_DSCP = 2,
};
|
|
|
|
|
2016-11-27 23:02:06 +08:00
|
|
|
/* DCBX operation mode values: host or auto. */
enum mlx5_dcbx_oper_mode {
	MLX5E_DCBX_PARAM_VER_OPER_HOST  = 0x0,
	MLX5E_DCBX_PARAM_VER_OPER_AUTO  = 0x3,
};
|
|
|
|
|
2015-12-14 22:34:10 +08:00
|
|
|
/* Atomic operation flags; each constant is a distinct single bit. */
enum {
	MLX5_ATOMIC_OPS_CMP_SWAP	= 1 << 0,
	MLX5_ATOMIC_OPS_FETCH_ADD	= 1 << 1,
	MLX5_ATOMIC_OPS_EXTENDED_CMP_SWAP = 1 << 2,
	MLX5_ATOMIC_OPS_EXTENDED_FETCH_ADD = 1 << 3,
};
|
|
|
|
|
2014-12-11 23:04:19 +08:00
|
|
|
/* Page-fault resume flags; bits 0-2 and bit 7 are defined. */
enum mlx5_page_fault_resume_flags {
	MLX5_PAGE_FAULT_RESUME_REQUESTOR = 1 << 0,
	MLX5_PAGE_FAULT_RESUME_WRITE	 = 1 << 1,
	MLX5_PAGE_FAULT_RESUME_RDMA	 = 1 << 2,
	MLX5_PAGE_FAULT_RESUME_ERROR	 = 1 << 7,
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/* Resource type tag stored in struct mlx5_rsc_debug (QP, EQ or CQ). */
enum dbg_rsc_type {
	MLX5_DBG_RSC_QP,
	MLX5_DBG_RSC_EQ,
	MLX5_DBG_RSC_CQ,
};
|
|
|
|
|
2017-05-30 15:18:24 +08:00
|
|
|
/*
 * Port state policy values. MLX5_POLICY_INVALID is an all-ones 32-bit
 * sentinel distinct from the three real policies.
 */
enum port_state_policy {
	MLX5_POLICY_DOWN	= 0,
	MLX5_POLICY_UP		= 1,
	MLX5_POLICY_FOLLOW	= 2,
	MLX5_POLICY_INVALID	= 0xffffffff
};
|
|
|
|
|
2019-06-29 06:35:58 +08:00
|
|
|
/* Core device type: PF, VF or SF. Values are implicit, starting at 0. */
enum mlx5_coredev_type {
	MLX5_COREDEV_PF,
	MLX5_COREDEV_VF,
	MLX5_COREDEV_SF,
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/* Element type of the fields[] array in struct mlx5_rsc_debug. */
struct mlx5_field_desc {
	int			i;
};
|
|
|
|
|
|
|
|
struct mlx5_rsc_debug {
|
|
|
|
struct mlx5_core_dev *dev;
|
|
|
|
void *object;
|
|
|
|
enum dbg_rsc_type type;
|
|
|
|
struct dentry *root;
|
2020-05-08 02:59:35 +08:00
|
|
|
struct mlx5_field_desc fields[];
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/* Driver-defined device events, numbered above the FW event range. */
enum mlx5_dev_event {
	MLX5_DEV_EVENT_SYS_ERROR = 128, /* 0 - 127 are FW events */
	MLX5_DEV_EVENT_PORT_AFFINITY = 129,
};
|
|
|
|
|
2015-05-29 03:28:43 +08:00
|
|
|
/* Port status values; note that numbering starts at 1, not 0. */
enum mlx5_port_status {
	MLX5_PORT_UP        = 1,
	MLX5_PORT_DOWN      = 2,
};
|
|
|
|
|
2020-03-20 03:43:13 +08:00
|
|
|
/* Command interface state, stored in struct mlx5_cmd::state. */
enum mlx5_cmdif_state {
	MLX5_CMDIF_STATE_UNINITIALIZED,
	MLX5_CMDIF_STATE_UP,
	MLX5_CMDIF_STATE_DOWN,
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_cmd_first {
|
|
|
|
__be32 data[4];
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_msg {
|
|
|
|
struct list_head list;
|
2016-11-17 19:45:55 +08:00
|
|
|
struct cmd_msg_cache *parent;
|
2013-07-07 22:25:49 +08:00
|
|
|
u32 len;
|
|
|
|
struct mlx5_cmd_first first;
|
|
|
|
struct mlx5_cmd_mailbox *next;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_debug {
|
|
|
|
struct dentry *dbg_root;
|
|
|
|
void *in_msg;
|
|
|
|
void *out_msg;
|
|
|
|
u8 status;
|
|
|
|
u16 inlen;
|
|
|
|
u16 outlen;
|
|
|
|
};
|
|
|
|
|
2016-11-17 19:45:55 +08:00
|
|
|
struct cmd_msg_cache {
|
2013-07-07 22:25:49 +08:00
|
|
|
/* protect block chain allocations
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
struct list_head head;
|
2016-11-17 19:45:55 +08:00
|
|
|
unsigned int max_inbox_size;
|
|
|
|
unsigned int num_ent;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
2016-11-17 19:45:55 +08:00
|
|
|
/* Number of entries in the cache[] array of struct mlx5_cmd. */
enum {
	MLX5_NUM_COMMAND_CACHES = 5,
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_stats {
|
|
|
|
u64 sum;
|
|
|
|
u64 n;
|
|
|
|
struct dentry *root;
|
|
|
|
/* protect command average calculations */
|
|
|
|
spinlock_t lock;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd {
|
2018-11-21 06:12:24 +08:00
|
|
|
struct mlx5_nb nb;
|
|
|
|
|
2020-03-20 03:43:13 +08:00
|
|
|
enum mlx5_cmdif_state state;
|
2015-04-02 22:07:25 +08:00
|
|
|
void *cmd_alloc_buf;
|
|
|
|
dma_addr_t alloc_dma;
|
|
|
|
int alloc_size;
|
2013-07-07 22:25:49 +08:00
|
|
|
void *cmd_buf;
|
|
|
|
dma_addr_t dma;
|
|
|
|
u16 cmdif_rev;
|
|
|
|
u8 log_sz;
|
|
|
|
u8 log_stride;
|
|
|
|
int max_reg_cmds;
|
|
|
|
int events;
|
|
|
|
u32 __iomem *vector;
|
|
|
|
|
|
|
|
/* protect command queue allocations
|
|
|
|
*/
|
|
|
|
spinlock_t alloc_lock;
|
|
|
|
|
|
|
|
/* protect token allocations
|
|
|
|
*/
|
|
|
|
spinlock_t token_lock;
|
|
|
|
u8 token;
|
|
|
|
unsigned long bitmask;
|
|
|
|
char wq_name[MLX5_CMD_WQ_MAX_NAME];
|
|
|
|
struct workqueue_struct *wq;
|
|
|
|
struct semaphore sem;
|
|
|
|
struct semaphore pages_sem;
|
|
|
|
int mode;
|
2020-03-19 03:44:32 +08:00
|
|
|
u16 allowed_opcode;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_cmd_work_ent *ent_arr[MLX5_MAX_COMMANDS];
|
2017-08-22 19:46:59 +08:00
|
|
|
struct dma_pool *pool;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_cmd_debug dbg;
|
2016-11-17 19:45:55 +08:00
|
|
|
struct cmd_msg_cache cache[MLX5_NUM_COMMAND_CACHES];
|
2013-07-07 22:25:49 +08:00
|
|
|
int checksum_disabled;
|
2020-05-28 14:16:02 +08:00
|
|
|
struct mlx5_cmd_stats *stats;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_mailbox {
|
|
|
|
void *buf;
|
|
|
|
dma_addr_t dma;
|
|
|
|
struct mlx5_cmd_mailbox *next;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_buf_list {
|
|
|
|
void *buf;
|
|
|
|
dma_addr_t map;
|
|
|
|
};
|
|
|
|
|
2016-11-30 23:59:37 +08:00
|
|
|
struct mlx5_frag_buf {
|
|
|
|
struct mlx5_buf_list *frags;
|
|
|
|
int npages;
|
|
|
|
int size;
|
|
|
|
u8 page_shift;
|
|
|
|
};
|
|
|
|
|
2018-01-02 22:08:06 +08:00
|
|
|
struct mlx5_frag_buf_ctrl {
|
2018-09-12 20:36:41 +08:00
|
|
|
struct mlx5_buf_list *frags;
|
2018-01-02 22:08:06 +08:00
|
|
|
u32 sz_m1;
|
2018-08-21 21:04:41 +08:00
|
|
|
u16 frag_sz_m1;
|
2018-08-21 21:07:58 +08:00
|
|
|
u16 strides_offset;
|
2018-01-02 22:08:06 +08:00
|
|
|
u8 log_sz;
|
|
|
|
u8 log_stride;
|
|
|
|
u8 log_frag_strides;
|
|
|
|
};
|
|
|
|
|
2014-02-23 20:19:06 +08:00
|
|
|
struct mlx5_core_psv {
|
|
|
|
u32 psv_idx;
|
|
|
|
struct psv_layout {
|
|
|
|
u32 pd;
|
|
|
|
u16 syndrome;
|
|
|
|
u16 reserved;
|
|
|
|
u16 bg;
|
|
|
|
u16 app_tag;
|
|
|
|
u32 ref_tag;
|
|
|
|
} psv;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_core_sig_ctx {
|
|
|
|
struct mlx5_core_psv psv_memory;
|
|
|
|
struct mlx5_core_psv psv_wire;
|
2014-02-23 20:19:12 +08:00
|
|
|
struct ib_sig_err err_item;
|
|
|
|
bool sig_status_checked;
|
|
|
|
bool sig_err_exists;
|
|
|
|
u32 sigerr_count;
|
2014-02-23 20:19:06 +08:00
|
|
|
};
|
2013-07-07 22:25:49 +08:00
|
|
|
|
2017-01-02 17:37:48 +08:00
|
|
|
/* Mkey type values; numbering starts at 1 and continues implicitly. */
enum {
	MLX5_MKEY_MR = 1,
	MLX5_MKEY_MW,
	MLX5_MKEY_INDIRECT_DEVX,
};
|
|
|
|
|
2016-03-01 00:05:28 +08:00
|
|
|
struct mlx5_core_mkey {
|
2013-07-07 22:25:49 +08:00
|
|
|
u64 iova;
|
|
|
|
u64 size;
|
|
|
|
u32 key;
|
|
|
|
u32 pd;
|
2017-01-02 17:37:48 +08:00
|
|
|
u32 type;
|
2021-02-02 15:13:09 +08:00
|
|
|
struct wait_queue_head wait;
|
|
|
|
refcount_t usecount;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
2017-01-02 17:37:46 +08:00
|
|
|
#define MLX5_24BIT_MASK ((1 << 24) - 1)
|
|
|
|
|
2014-10-02 17:19:45 +08:00
|
|
|
enum mlx5_res_type {
|
2016-01-15 01:13:00 +08:00
|
|
|
MLX5_RES_QP = MLX5_EVENT_QUEUE_TYPE_QP,
|
|
|
|
MLX5_RES_RQ = MLX5_EVENT_QUEUE_TYPE_RQ,
|
|
|
|
MLX5_RES_SQ = MLX5_EVENT_QUEUE_TYPE_SQ,
|
|
|
|
MLX5_RES_SRQ = 3,
|
|
|
|
MLX5_RES_XSRQ = 4,
|
2017-08-17 20:52:10 +08:00
|
|
|
MLX5_RES_XRQ = 5,
|
2018-01-02 22:19:28 +08:00
|
|
|
MLX5_RES_DCT = MLX5_EVENT_QUEUE_TYPE_DCT,
|
2014-10-02 17:19:45 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_core_rsc_common {
|
|
|
|
enum mlx5_res_type res;
|
2019-08-06 09:59:50 +08:00
|
|
|
refcount_t refcount;
|
2014-10-02 17:19:45 +08:00
|
|
|
struct completion free;
|
|
|
|
};
|
|
|
|
|
2017-01-04 05:55:23 +08:00
|
|
|
struct mlx5_uars_page {
|
2013-07-07 22:25:49 +08:00
|
|
|
void __iomem *map;
|
2017-01-04 05:55:23 +08:00
|
|
|
bool wc;
|
|
|
|
u32 index;
|
|
|
|
struct list_head list;
|
|
|
|
unsigned int bfregs;
|
|
|
|
unsigned long *reg_bitmap; /* for non fast path bf regs */
|
|
|
|
unsigned long *fp_bitmap;
|
|
|
|
unsigned int reg_avail;
|
|
|
|
unsigned int fp_avail;
|
|
|
|
struct kref ref_count;
|
|
|
|
struct mlx5_core_dev *mdev;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
2017-01-04 05:55:23 +08:00
|
|
|
struct mlx5_bfreg_head {
|
|
|
|
/* protect blue flame registers allocations */
|
|
|
|
struct mutex lock;
|
|
|
|
struct list_head list;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_bfreg_data {
|
|
|
|
struct mlx5_bfreg_head reg_head;
|
|
|
|
struct mlx5_bfreg_head wc_head;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_sq_bfreg {
|
|
|
|
void __iomem *map;
|
|
|
|
struct mlx5_uars_page *up;
|
|
|
|
bool wc;
|
|
|
|
u32 index;
|
|
|
|
unsigned int offset;
|
|
|
|
};
|
2013-07-07 22:25:49 +08:00
|
|
|
|
|
|
|
struct mlx5_core_health {
|
|
|
|
struct health_buffer __iomem *health;
|
|
|
|
__be32 __iomem *health_counter;
|
|
|
|
struct timer_list timer;
|
|
|
|
u32 prev;
|
|
|
|
int miss_counter;
|
2018-12-11 22:09:56 +08:00
|
|
|
u8 synd;
|
2018-11-12 21:23:02 +08:00
|
|
|
u32 fatal_error;
|
2018-07-17 16:18:26 +08:00
|
|
|
u32 crdump_size;
|
2016-10-25 23:36:33 +08:00
|
|
|
/* wq spinlock to synchronize draining */
|
|
|
|
spinlock_t wq_lock;
|
2015-10-08 22:14:00 +08:00
|
|
|
struct workqueue_struct *wq;
|
2016-10-25 23:36:33 +08:00
|
|
|
unsigned long flags;
|
2019-01-28 00:38:39 +08:00
|
|
|
struct work_struct fatal_report_work;
|
2018-12-11 22:09:56 +08:00
|
|
|
struct work_struct report_work;
|
2018-12-11 22:09:53 +08:00
|
|
|
struct devlink_health_reporter *fw_reporter;
|
2018-12-11 22:09:57 +08:00
|
|
|
struct devlink_health_reporter *fw_fatal_reporter;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_qp_table {
|
2018-11-27 06:39:06 +08:00
|
|
|
struct notifier_block nb;
|
2018-11-21 06:12:25 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/* protect radix tree
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
struct radix_tree_root tree;
|
|
|
|
};
|
|
|
|
|
2015-12-02 00:03:09 +08:00
|
|
|
struct mlx5_vf_context {
|
|
|
|
int enabled;
|
2017-05-30 15:18:24 +08:00
|
|
|
u64 port_guid;
|
|
|
|
u64 node_guid;
|
IB/mlx5: Return the administrative GUID if exists
A user can change the operational GUID (a.k.a affective GUID) through
link/infiniband. Therefore it is preferred to return the currently set
GUID if it exists instead of the operational.
This way the PF can query which VF GUID will be set in the next bind. In
order to align with MAC address, zero is returned if administrative GUID
is not set.
For example, before setting administrative GUID:
$ ip link show
ib0: <BROADCAST,MULTICAST,UP,LOWER_UP> mtu 4092 qdisc mq state UP mode DEFAULT group default qlen 256
link/infiniband 00:00:00:08:fe:80:00:00:00:00:00:00:52:54:00:c0:fe:12:34:55 brd 00:ff:ff:ff:ff:12:40:1b:ff:ff:00:00:00:00:00:00:ff:ff:ff:ff
vf 0 link/infiniband 00:00:00:08:fe:80:00:00:00:00:00:00:52:54:00:c0:fe:12:34:55 brd 00:ff:ff:ff:ff:12:40:1b:ff:ff:00:00:00:00:00:00:ff:ff:ff:ff,
spoof checking off, NODE_GUID 00:00:00:00:00:00:00:00, PORT_GUID 00:00:00:00:00:00:00:00, link-state auto, trust off, query_rss off
Then:
$ ip link set ib0 vf 0 node_guid 11:00:af:21:cb:05:11:00
$ ip link set ib0 vf 0 port_guid 22:11:af:21:cb:05:11:00
After setting administrative GUID:
$ ip link show
ib0: <BROADCAST,MULTICAST,UP,LOWER_UP> mtu 4092 qdisc mq state UP mode DEFAULT group default qlen 256
link/infiniband 00:00:00:08:fe:80:00:00:00:00:00:00:52:54:00:c0:fe:12:34:55 brd 00:ff:ff:ff:ff:12:40:1b:ff:ff:00:00:00:00:00:00:ff:ff:ff:ff
vf 0 link/infiniband 00:00:00:08:fe:80:00:00:00:00:00:00:52:54:00:c0:fe:12:34:55 brd 00:ff:ff:ff:ff:12:40:1b:ff:ff:00:00:00:00:00:00:ff:ff:ff:ff,
spoof checking off, NODE_GUID 11:00:af:21:cb:05:11:00, PORT_GUID 22:11:af:21:cb:05:11:00, link-state auto, trust off, query_rss off
Fixes: 9c0015ef0928 ("IB/mlx5: Implement callbacks for getting VFs GUID attributes")
Link: https://lore.kernel.org/r/20200116120048.12744-1-leon@kernel.org
Signed-off-by: Danit Goldberg <danitg@mellanox.com>
Signed-off-by: Leon Romanovsky <leonro@mellanox.com>
Signed-off-by: Jason Gunthorpe <jgg@mellanox.com>
2020-01-16 20:00:48 +08:00
|
|
|
/* Valid bits are used to validate administrative guid only.
|
|
|
|
* Enabled after ndo_set_vf_guid
|
|
|
|
*/
|
|
|
|
u8 port_guid_valid:1;
|
|
|
|
u8 node_guid_valid:1;
|
2017-05-30 15:18:24 +08:00
|
|
|
enum port_state_policy policy;
|
2015-12-02 00:03:09 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_core_sriov {
|
|
|
|
struct mlx5_vf_context *vfs_ctx;
|
|
|
|
int num_vfs;
|
2019-06-11 07:38:19 +08:00
|
|
|
u16 max_vfs;
|
2015-12-02 00:03:09 +08:00
|
|
|
};
|
|
|
|
|
net/mlx5: Add flow counter pool
Add a pool of flow counters, based on flow counter bulks, removing the
need to allocate a new counter via a costly FW command during the flow
creation process. The time it takes to acquire/release a flow counter
is cut from ~50 [us] to ~50 [ns].
The pool is part of the mlx5 driver instance, and provides flow
counters for aging flows. mlx5_fc_create() was modified to provide
counters for aging flows from the pool by default, and
mlx5_destroy_fc() was modified to release counters back to the pool
for later reuse. If bulk allocation is not supported or fails, and for
non-aging flows, the fallback behavior is to allocate and free
individual counters.
The pool is comprised of three lists of flow counter bulks, one of
fully used bulks, one of partially used bulks, and one of unused
bulks. Counters are provided from the partially used bulks first, to
help limit bulk fragmentation.
The pool maintains a threshold, and strives to maintain the amount of
available counters below it. The pool is increased in size when a
counter acquisition request is made and there are no available
counters, and it is decreased in size when the last counter in a bulk
is released and there are more available counters than the threshold.
All pool size changes are done in the context of the
acquiring/releasing process.
The value of the threshold is directly correlated to the amount of
used counters the pool is providing, while constrained by a hard
maximum, and is recalculated every time a bulk is allocated/freed.
This ensures that the pool only consumes large amounts of memory for
available counters if the pool is being used heavily. When fully
populated and at the hard maximum, the buffer of available counters
consumes ~40 [MB].
Signed-off-by: Gavi Teitz <gavi@mellanox.com>
Reviewed-by: Vlad Buslov <vladbu@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
2019-06-28 01:53:03 +08:00
|
|
|
struct mlx5_fc_pool {
|
|
|
|
struct mlx5_core_dev *dev;
|
|
|
|
struct mutex pool_lock; /* protects pool lists */
|
|
|
|
struct list_head fully_used;
|
|
|
|
struct list_head partially_used;
|
|
|
|
struct list_head unused;
|
|
|
|
int available_fcs;
|
|
|
|
int used_fcs;
|
|
|
|
int threshold;
|
|
|
|
};
|
|
|
|
|
2016-05-13 20:55:41 +08:00
|
|
|
struct mlx5_fc_stats {
|
2018-07-24 21:37:40 +08:00
|
|
|
spinlock_t counters_idr_lock; /* protects counters_idr */
|
|
|
|
struct idr counters_idr;
|
2018-07-24 14:52:11 +08:00
|
|
|
struct list_head counters;
|
2018-07-23 15:55:39 +08:00
|
|
|
struct llist_head addlist;
|
2018-07-23 16:32:05 +08:00
|
|
|
struct llist_head dellist;
|
2016-05-13 20:55:41 +08:00
|
|
|
|
|
|
|
struct workqueue_struct *wq;
|
|
|
|
struct delayed_work work;
|
|
|
|
unsigned long next_query;
|
2017-02-24 18:16:33 +08:00
|
|
|
unsigned long sampling_interval; /* jiffies */
|
2019-07-30 05:12:52 +08:00
|
|
|
u32 *bulk_query_out;
|
net/mlx5: Add flow counter pool
Add a pool of flow counters, based on flow counter bulks, removing the
need to allocate a new counter via a costly FW command during the flow
creation process. The time it takes to acquire/release a flow counter
is cut from ~50 [us] to ~50 [ns].
The pool is part of the mlx5 driver instance, and provides flow
counters for aging flows. mlx5_fc_create() was modified to provide
counters for aging flows from the pool by default, and
mlx5_destroy_fc() was modified to release counters back to the pool
for later reuse. If bulk allocation is not supported or fails, and for
non-aging flows, the fallback behavior is to allocate and free
individual counters.
The pool is comprised of three lists of flow counter bulks, one of
fully used bulks, one of partially used bulks, and one of unused
bulks. Counters are provided from the partially used bulks first, to
help limit bulk fragmentation.
The pool maintains a threshold, and strives to maintain the amount of
available counters below it. The pool is increased in size when a
counter acquisition request is made and there are no available
counters, and it is decreased in size when the last counter in a bulk
is released and there are more available counters than the threshold.
All pool size changes are done in the context of the
acquiring/releasing process.
The value of the threshold is directly correlated to the amount of
used counters the pool is providing, while constrained by a hard
maximum, and is recalculated every time a bulk is allocated/freed.
This ensures that the pool only consumes large amounts of memory for
available counters if the pool is being used heavily. When fully
populated and at the hard maximum, the buffer of available counters
consumes ~40 [MB].
Signed-off-by: Gavi Teitz <gavi@mellanox.com>
Reviewed-by: Vlad Buslov <vladbu@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
2019-06-28 01:53:03 +08:00
|
|
|
struct mlx5_fc_pool fc_pool;
|
2016-05-13 20:55:41 +08:00
|
|
|
};
|
|
|
|
|
2018-11-21 06:12:27 +08:00
|
|
|
/* Forward declarations of types that this header uses only via pointers. */
struct mlx5_events;
struct mlx5_mpfs;
struct mlx5_eswitch;
struct mlx5_lag;
struct mlx5_devcom;
struct mlx5_fw_reset;
struct mlx5_eq_table;
struct mlx5_irq_table;
struct mlx5_vhca_state_notifier;
struct mlx5_sf_dev_table;
struct mlx5_sf_hw_table;
struct mlx5_sf_table;
|
2015-12-02 00:03:18 +08:00
|
|
|
|
2018-03-19 21:10:29 +08:00
|
|
|
struct mlx5_rate_limit {
|
|
|
|
u32 rate;
|
|
|
|
u32 max_burst_sz;
|
|
|
|
u16 typical_pkt_sz;
|
|
|
|
};
|
|
|
|
|
2016-06-23 22:02:37 +08:00
|
|
|
struct mlx5_rl_entry {
|
2020-02-20 03:05:17 +08:00
|
|
|
u8 rl_raw[MLX5_ST_SZ_BYTES(set_pp_rate_limit_context)];
|
|
|
|
u64 refcount;
|
2021-02-19 14:18:12 +08:00
|
|
|
u16 index;
|
2020-02-20 03:05:17 +08:00
|
|
|
u16 uid;
|
|
|
|
u8 dedicated : 1;
|
2016-06-23 22:02:37 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_rl_table {
|
|
|
|
/* protect rate limit table */
|
|
|
|
struct mutex rl_lock;
|
|
|
|
u16 max_size;
|
|
|
|
u32 max_rate;
|
|
|
|
u32 min_rate;
|
|
|
|
struct mlx5_rl_entry *rl_entry;
|
2021-02-19 18:06:54 +08:00
|
|
|
u64 refcount;
|
2016-06-23 22:02:37 +08:00
|
|
|
};
|
|
|
|
|
2019-04-30 02:14:16 +08:00
|
|
|
/* RoCE steering objects: a flow table, a flow group and an "allow" rule handle. */
struct mlx5_core_roce {
	struct mlx5_flow_table *ft;
	struct mlx5_flow_group *fg;
	struct mlx5_flow_handle *allow_rule;
};
|
|
|
|
|
2020-10-08 21:06:37 +08:00
|
|
|
/* MLX5_PRIV_FLAGS_* bit flags; each constant is a distinct single bit. */
enum {
	MLX5_PRIV_FLAGS_DISABLE_IB_ADEV = 1 << 0,
	MLX5_PRIV_FLAGS_DISABLE_ALL_ADEV = 1 << 1,
	/* Set during device detach to block any further devices
	 * creation/deletion on drivers rescan. Unset during device attach.
	 */
	MLX5_PRIV_FLAGS_DETACH = 1 << 2,
};
|
|
|
|
|
|
|
|
struct mlx5_adev {
|
|
|
|
struct auxiliary_device adev;
|
|
|
|
struct mlx5_core_dev *mdev;
|
|
|
|
int idx;
|
|
|
|
};
|
|
|
|
|
2021-03-08 20:16:02 +08:00
|
|
|
struct mlx5_ft_pool;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_priv {
|
2019-06-11 07:38:27 +08:00
|
|
|
/* IRQ table valid only for real pci devices PF or VF */
|
|
|
|
struct mlx5_irq_table *irq_table;
|
2018-11-20 02:52:38 +08:00
|
|
|
struct mlx5_eq_table *eq_table;
|
2013-07-07 22:25:49 +08:00
|
|
|
|
|
|
|
/* pages stuff */
|
2018-11-21 06:12:23 +08:00
|
|
|
struct mlx5_nb pg_nb;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct workqueue_struct *pg_wq;
|
2020-05-18 16:13:52 +08:00
|
|
|
struct xarray page_root_xa;
|
2013-07-07 22:25:49 +08:00
|
|
|
int fw_pages;
|
2014-12-11 23:04:23 +08:00
|
|
|
atomic_t reg_pages;
|
2013-10-23 14:53:19 +08:00
|
|
|
struct list_head free_list;
|
2015-12-02 00:03:09 +08:00
|
|
|
int vfs_pages;
|
2020-11-21 07:03:37 +08:00
|
|
|
int host_pf_pages;
|
2013-07-07 22:25:49 +08:00
|
|
|
|
|
|
|
struct mlx5_core_health health;
|
2021-01-27 07:24:07 +08:00
|
|
|
struct list_head traps;
|
2013-07-07 22:25:49 +08:00
|
|
|
|
|
|
|
/* start: qp staff */
|
|
|
|
struct dentry *qp_debugfs;
|
|
|
|
struct dentry *eq_debugfs;
|
|
|
|
struct dentry *cq_debugfs;
|
|
|
|
struct dentry *cmdif_debugfs;
|
|
|
|
/* end: qp stuff */
|
|
|
|
|
|
|
|
/* start: alloc stuff */
|
2021-07-30 11:03:00 +08:00
|
|
|
/* protect buffer allocation according to numa node */
|
2015-07-24 04:35:57 +08:00
|
|
|
struct mutex alloc_mutex;
|
|
|
|
int numa_node;
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mutex pgdir_mutex;
|
|
|
|
struct list_head pgdir_list;
|
|
|
|
/* end: alloc stuff */
|
|
|
|
struct dentry *dbg_root;
|
|
|
|
|
2014-07-29 04:30:22 +08:00
|
|
|
struct list_head ctx_list;
|
|
|
|
spinlock_t ctx_lock;
|
2020-10-08 21:06:37 +08:00
|
|
|
struct mlx5_adev **adev;
|
|
|
|
int adev_idx;
|
2018-11-27 06:39:01 +08:00
|
|
|
struct mlx5_events *events;
|
2017-06-07 17:14:24 +08:00
|
|
|
|
2016-07-04 22:23:06 +08:00
|
|
|
struct mlx5_flow_steering *steering;
|
2017-06-05 04:11:55 +08:00
|
|
|
struct mlx5_mpfs *mpfs;
|
2015-12-02 00:03:18 +08:00
|
|
|
struct mlx5_eswitch *eswitch;
|
2015-12-02 00:03:09 +08:00
|
|
|
struct mlx5_core_sriov sriov;
|
net/mlx5: Implement RoCE LAG feature
Available on dual port cards only, this feature keeps
track, using netdev LAG events, of the bonding
and link status of each port's PF netdev.
When both of the card's PF netdevs are enslaved to the
same bond/team master, and only them, LAG state
is active.
During LAG, only one IB device is present for both ports.
In addition to the above, this commit includes FW commands
used for managing the LAG, new facilities for adding and removing
a single device by interface, and port remap functionality according to
bond events.
Please note that this feature is currently used only for mimicking
Ethernet bonding for RoCE - netdevs functionality is not altered,
and their bonding continues to be managed solely by bond/team driver.
Signed-off-by: Aviv Heller <avivh@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
2016-04-17 21:57:32 +08:00
|
|
|
struct mlx5_lag *lag;
|
2020-10-08 21:06:37 +08:00
|
|
|
u32 flags;
|
2018-12-05 03:24:46 +08:00
|
|
|
struct mlx5_devcom *devcom;
|
2020-10-07 14:00:49 +08:00
|
|
|
struct mlx5_fw_reset *fw_reset;
|
2019-04-30 02:14:16 +08:00
|
|
|
struct mlx5_core_roce roce;
|
2016-05-13 20:55:41 +08:00
|
|
|
struct mlx5_fc_stats fc_stats;
|
2016-06-23 22:02:37 +08:00
|
|
|
struct mlx5_rl_table rl_table;
|
2021-03-08 20:16:02 +08:00
|
|
|
struct mlx5_ft_pool *ft_pool;
|
2016-11-17 19:45:57 +08:00
|
|
|
|
2017-01-04 05:55:23 +08:00
|
|
|
struct mlx5_bfreg_data bfregs;
|
2017-01-04 05:55:24 +08:00
|
|
|
struct mlx5_uars_page *uar;
|
2020-12-12 14:12:16 +08:00
|
|
|
#ifdef CONFIG_MLX5_SF
|
|
|
|
struct mlx5_vhca_state_notifier *vhca_state_notifier;
|
2020-12-12 14:12:17 +08:00
|
|
|
struct mlx5_sf_dev_table *sf_dev_table;
|
2020-12-12 14:12:18 +08:00
|
|
|
struct mlx5_core_dev *parent_mdev;
|
2020-12-12 14:12:16 +08:00
|
|
|
#endif
|
net/mlx5: SF, Add port add delete functionality
To handle SF port management outside of the eswitch as independent
software layer, introduce eswitch notifier APIs so that mlx5 upper
layer who wish to support sf port management in switchdev mode can
perform its task whenever eswitch mode is set to switchdev or before
eswitch is disabled.
Initialize sf port table on such eswitch event.
Add SF port add and delete functionality in switchdev mode.
Destroy all SF ports when eswitch is disabled.
Expose SF port add and delete to user via devlink commands.
$ devlink dev eswitch set pci/0000:06:00.0 mode switchdev
$ devlink port show
pci/0000:06:00.0/65535: type eth netdev ens2f0np0 flavour physical port 0 splittable false
$ devlink port add pci/0000:06:00.0 flavour pcisf pfnum 0 sfnum 88
pci/0000:06:00.0/32768: type eth netdev eth6 flavour pcisf controller 0 pfnum 0 sfnum 88 external false splittable false
function:
hw_addr 00:00:00:00:00:00 state inactive opstate detached
$ devlink port show ens2f0npf0sf88
pci/0000:06:00.0/32768: type eth netdev ens2f0npf0sf88 flavour pcisf controller 0 pfnum 0 sfnum 88 external false splittable false
function:
hw_addr 00:00:00:00:00:00 state inactive opstate detached
or by its unique port index:
$ devlink port show pci/0000:06:00.0/32768
pci/0000:06:00.0/32768: type eth netdev ens2f0npf0sf88 flavour pcisf controller 0 pfnum 0 sfnum 88 external false splittable false
function:
hw_addr 00:00:00:00:00:00 state inactive opstate detached
$ devlink port show ens2f0npf0sf88 -jp
{
"port": {
"pci/0000:06:00.0/32768": {
"type": "eth",
"netdev": "ens2f0npf0sf88",
"flavour": "pcisf",
"controller": 0,
"pfnum": 0,
"sfnum": 88,
"external": false,
"splittable": false,
"function": {
"hw_addr": "00:00:00:00:00:00",
"state": "inactive",
"opstate": "detached"
}
}
}
}
Signed-off-by: Parav Pandit <parav@nvidia.com>
Reviewed-by: Vu Pham <vuhuong@nvidia.com>
Signed-off-by: Saeed Mahameed <saeedm@nvidia.com>
2020-12-12 14:12:21 +08:00
|
|
|
#ifdef CONFIG_MLX5_SF_MANAGER
|
|
|
|
struct mlx5_sf_hw_table *sf_hw_table;
|
|
|
|
struct mlx5_sf_table *sf_table;
|
|
|
|
#endif
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
2015-10-14 22:43:46 +08:00
|
|
|
/*
 * Device state kept in mlx5_core_dev.state.
 *
 * MLX5_DEVICE_STATE_UP is explicitly 1, so MLX5_DEVICE_STATE_INTERNAL_ERROR
 * is 2 and a zero-initialised state field equals neither enumerator.
 */
enum mlx5_device_state {
|
2021-08-01 16:37:57 +08:00
|
|
|
MLX5_DEVICE_STATE_UP = 1,
|
2015-10-14 22:43:46 +08:00
|
|
|
MLX5_DEVICE_STATE_INTERNAL_ERROR,
|
|
|
|
};
|
|
|
|
|
|
|
|
enum mlx5_interface_state {
|
2017-08-09 02:17:00 +08:00
|
|
|
MLX5_INTERFACE_STATE_UP = BIT(0),
|
2015-10-14 22:43:46 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
enum mlx5_pci_status {
|
|
|
|
MLX5_PCI_STATUS_DISABLED,
|
|
|
|
MLX5_PCI_STATUS_ENABLED,
|
|
|
|
};
|
|
|
|
|
2017-01-02 17:37:46 +08:00
|
|
|
enum mlx5_pagefault_type_flags {
|
|
|
|
MLX5_PFAULT_REQUESTOR = 1 << 0,
|
|
|
|
MLX5_PFAULT_WRITE = 1 << 1,
|
|
|
|
MLX5_PFAULT_RDMA = 1 << 2,
|
|
|
|
};
|
|
|
|
|
2016-07-01 19:51:04 +08:00
|
|
|
struct mlx5_td {
|
2019-03-11 12:18:24 +08:00
|
|
|
/* protects tirs list changes while tirs refresh */
|
|
|
|
struct mutex list_lock;
|
2016-07-01 19:51:04 +08:00
|
|
|
struct list_head tirs_list;
|
|
|
|
u32 tdn;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5e_resources {
|
2021-01-26 17:51:04 +08:00
|
|
|
struct mlx5e_hw_objs {
|
|
|
|
u32 pdn;
|
|
|
|
struct mlx5_td td;
|
|
|
|
struct mlx5_core_mkey mkey;
|
|
|
|
struct mlx5_sq_bfreg bfreg;
|
|
|
|
} hw_objs;
|
2020-10-28 17:21:26 +08:00
|
|
|
struct devlink_port dl_port;
|
2020-09-16 15:11:33 +08:00
|
|
|
struct net_device *uplink_netdev;
|
2016-07-01 19:51:04 +08:00
|
|
|
};
|
|
|
|
|
2019-08-30 07:42:30 +08:00
|
|
|
enum mlx5_sw_icm_type {
|
|
|
|
MLX5_SW_ICM_TYPE_STEERING,
|
|
|
|
MLX5_SW_ICM_TYPE_HEADER_MODIFY,
|
|
|
|
};
|
|
|
|
|
2017-03-26 22:01:57 +08:00
|
|
|
#define MLX5_MAX_RESERVED_GIDS 8
|
|
|
|
|
|
|
|
struct mlx5_rsvd_gids {
|
|
|
|
unsigned int start;
|
|
|
|
unsigned int count;
|
|
|
|
struct ida ida;
|
|
|
|
};
|
|
|
|
|
2017-08-15 18:46:04 +08:00
|
|
|
#define MAX_PIN_NUM 8
|
|
|
|
struct mlx5_pps {
|
|
|
|
u8 pin_caps[MAX_PIN_NUM];
|
|
|
|
struct work_struct out_work;
|
|
|
|
u64 start[MAX_PIN_NUM];
|
|
|
|
u8 enabled;
|
|
|
|
};
|
|
|
|
|
2021-02-13 06:30:40 +08:00
|
|
|
struct mlx5_timer {
|
2017-08-15 18:46:04 +08:00
|
|
|
struct cyclecounter cycles;
|
|
|
|
struct timecounter tc;
|
|
|
|
u32 nominal_c_mult;
|
|
|
|
unsigned long overflow_period;
|
|
|
|
struct delayed_work overflow_work;
|
2021-02-13 06:30:40 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_clock {
|
|
|
|
struct mlx5_nb pps_nb;
|
|
|
|
seqlock_t lock;
|
|
|
|
struct hwtstamp_config hwtstamp_config;
|
2017-08-15 18:46:04 +08:00
|
|
|
struct ptp_clock *ptp;
|
|
|
|
struct ptp_clock_info ptp_info;
|
|
|
|
struct mlx5_pps pps_info;
|
2021-02-13 06:30:40 +08:00
|
|
|
struct mlx5_timer timer;
|
2017-08-15 18:46:04 +08:00
|
|
|
};
|
|
|
|
|
2019-08-30 07:42:30 +08:00
|
|
|
struct mlx5_dm;
|
2018-07-17 06:22:01 +08:00
|
|
|
struct mlx5_fw_tracer;
|
2018-05-10 04:28:00 +08:00
|
|
|
struct mlx5_vxlan;
|
2019-01-30 23:21:55 +08:00
|
|
|
struct mlx5_geneve;
|
2019-08-22 13:05:51 +08:00
|
|
|
struct mlx5_hv_vhca;
|
2018-07-17 06:22:01 +08:00
|
|
|
|
2019-08-30 07:42:30 +08:00
|
|
|
#define MLX5_LOG_SW_ICM_BLOCK_SIZE(dev) (MLX5_CAP_DEV_MEM(dev, log_sw_icm_alloc_granularity))
|
|
|
|
#define MLX5_SW_ICM_BLOCK_SIZE(dev) (1 << MLX5_LOG_SW_ICM_BLOCK_SIZE(dev))
|
|
|
|
|
2021-05-12 18:52:27 +08:00
|
|
|
enum {
|
|
|
|
MLX5_PROF_MASK_QP_SIZE = (u64)1 << 0,
|
|
|
|
MLX5_PROF_MASK_MR_CACHE = (u64)1 << 1,
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * MR cache entry indices.
 *
 * MR_CACHE_LAST_STD_ENTRY is pinned to 20; the two IMR entries therefore
 * take 21 and 22, and MAX_MR_CACHE_ENTRIES evaluates to 23. The latter is
 * the length of the mr_cache[] array in struct mlx5_profile.
 * NOTE(review): presumably indices 0..20 are the "standard" entries - confirm.
 */
enum {
|
|
|
|
MR_CACHE_LAST_STD_ENTRY = 20,
|
|
|
|
MLX5_IMR_MTT_CACHE_ENTRY,
|
|
|
|
MLX5_IMR_KSM_CACHE_ENTRY,
|
|
|
|
MAX_MR_CACHE_ENTRIES
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_profile {
|
|
|
|
u64 mask;
|
|
|
|
u8 log_max_qp;
|
|
|
|
struct {
|
|
|
|
int size;
|
|
|
|
int limit;
|
|
|
|
} mr_cache[MAX_MR_CACHE_ENTRIES];
|
|
|
|
};
|
|
|
|
|
2021-07-13 17:36:05 +08:00
|
|
|
struct mlx5_hca_cap {
|
|
|
|
u32 cur[MLX5_UN_SZ_DW(hca_cap_union)];
|
|
|
|
u32 max[MLX5_UN_SZ_DW(hca_cap_union)];
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_core_dev {
|
2019-04-30 02:14:02 +08:00
|
|
|
struct device *device;
|
2019-06-29 06:35:58 +08:00
|
|
|
enum mlx5_coredev_type coredev_type;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct pci_dev *pdev;
|
2015-10-14 22:43:46 +08:00
|
|
|
/* sync pci state */
|
|
|
|
struct mutex pci_status_mutex;
|
|
|
|
enum mlx5_pci_status pci_status;
|
2013-07-07 22:25:49 +08:00
|
|
|
u8 rev_id;
|
|
|
|
char board_id[MLX5_BOARD_ID_LEN];
|
|
|
|
struct mlx5_cmd cmd;
|
2016-12-08 22:03:31 +08:00
|
|
|
struct {
|
2021-07-13 19:17:03 +08:00
|
|
|
struct mlx5_hca_cap *hca[MLX5_CAP_NUM];
|
2016-12-08 22:03:31 +08:00
|
|
|
u32 pcam[MLX5_ST_SZ_DW(pcam_reg)];
|
2019-10-07 15:31:42 +08:00
|
|
|
u32 mcam[MLX5_MCAM_REGS_NUM][MLX5_ST_SZ_DW(mcam_reg)];
|
2017-08-24 22:21:44 +08:00
|
|
|
u32 fpga[MLX5_ST_SZ_DW(fpga_cap)];
|
2017-07-19 05:03:17 +08:00
|
|
|
u32 qcam[MLX5_ST_SZ_DW(qcam_reg)];
|
2019-02-13 14:55:35 +08:00
|
|
|
u8 embedded_cpu;
|
2016-12-08 22:03:31 +08:00
|
|
|
} caps;
|
2018-09-05 22:06:37 +08:00
|
|
|
u64 sys_image_guid;
|
2013-07-07 22:25:49 +08:00
|
|
|
phys_addr_t iseg_base;
|
|
|
|
struct mlx5_init_seg __iomem *iseg;
|
2019-03-30 06:38:01 +08:00
|
|
|
phys_addr_t bar_addr;
|
2015-10-14 22:43:46 +08:00
|
|
|
enum mlx5_device_state state;
|
|
|
|
/* sync interface state */
|
|
|
|
struct mutex intf_state_mutex;
|
2016-04-22 05:33:07 +08:00
|
|
|
unsigned long intf_state;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_priv priv;
|
2021-05-12 18:52:27 +08:00
|
|
|
struct mlx5_profile profile;
|
2015-05-29 03:28:48 +08:00
|
|
|
u32 issi;
|
2016-07-01 19:51:04 +08:00
|
|
|
struct mlx5e_resources mlx5e_res;
|
2019-08-30 07:42:30 +08:00
|
|
|
struct mlx5_dm *dm;
|
2018-05-10 04:28:00 +08:00
|
|
|
struct mlx5_vxlan *vxlan;
|
2019-01-30 23:21:55 +08:00
|
|
|
struct mlx5_geneve *geneve;
|
2017-03-26 22:01:57 +08:00
|
|
|
struct {
|
|
|
|
struct mlx5_rsvd_gids reserved_gids;
|
2018-01-04 23:25:31 +08:00
|
|
|
u32 roce_en;
|
2017-03-26 22:01:57 +08:00
|
|
|
} roce;
|
2017-03-14 02:05:45 +08:00
|
|
|
#ifdef CONFIG_MLX5_FPGA
|
|
|
|
struct mlx5_fpga_device *fpga;
|
2019-11-18 20:30:20 +08:00
|
|
|
#endif
|
|
|
|
#ifdef CONFIG_MLX5_ACCEL
|
|
|
|
const struct mlx5_accel_ipsec_ops *ipsec_ops;
|
2016-04-29 06:36:39 +08:00
|
|
|
#endif
|
2017-08-15 18:46:04 +08:00
|
|
|
struct mlx5_clock clock;
|
2018-01-17 02:08:40 +08:00
|
|
|
struct mlx5_ib_clock_info *clock_info;
|
2018-07-17 06:22:01 +08:00
|
|
|
struct mlx5_fw_tracer *tracer;
|
2020-02-12 06:32:43 +08:00
|
|
|
struct mlx5_rsc_dump *rsc_dump;
|
2018-06-28 20:05:58 +08:00
|
|
|
u32 vsc_addr;
|
2019-08-22 13:05:51 +08:00
|
|
|
struct mlx5_hv_vhca *hv_vhca;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_db {
|
|
|
|
__be32 *db;
|
|
|
|
union {
|
|
|
|
struct mlx5_db_pgdir *pgdir;
|
|
|
|
struct mlx5_ib_user_db_page *user_page;
|
|
|
|
} u;
|
|
|
|
dma_addr_t dma;
|
|
|
|
int index;
|
|
|
|
};
|
|
|
|
|
|
|
|
enum {
|
|
|
|
MLX5_COMP_EQ_SIZE = 1024,
|
|
|
|
};
|
|
|
|
|
2015-05-29 03:28:42 +08:00
|
|
|
/*
 * PTYS bit flags. MLX5_PTYS_IB is bit 0 and MLX5_PTYS_EN is bit 2; bit 1
 * is not assigned by this enum.
 * NOTE(review): presumably these select the protocol (InfiniBand vs
 * Ethernet) when accessing the PTYS register - confirm against callers.
 */
enum {
|
|
|
|
MLX5_PTYS_IB = 1 << 0,
|
|
|
|
MLX5_PTYS_EN = 1 << 2,
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
typedef void (*mlx5_cmd_cbk_t)(int status, void *context);
|
|
|
|
|
2017-02-23 17:19:36 +08:00
|
|
|
enum {
|
|
|
|
MLX5_CMD_ENT_STATE_PENDING_COMP,
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_cmd_work_ent {
|
2017-02-23 17:19:36 +08:00
|
|
|
unsigned long state;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_cmd_msg *in;
|
|
|
|
struct mlx5_cmd_msg *out;
|
2013-10-23 14:53:14 +08:00
|
|
|
void *uout;
|
|
|
|
int uout_size;
|
2013-07-07 22:25:49 +08:00
|
|
|
mlx5_cmd_cbk_t callback;
|
2016-06-30 22:34:43 +08:00
|
|
|
struct delayed_work cb_timeout_work;
|
2013-07-07 22:25:49 +08:00
|
|
|
void *context;
|
2013-10-23 14:53:14 +08:00
|
|
|
int idx;
|
2019-12-27 13:01:53 +08:00
|
|
|
struct completion handling;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct completion done;
|
|
|
|
struct mlx5_cmd *cmd;
|
|
|
|
struct work_struct work;
|
|
|
|
struct mlx5_cmd_layout *lay;
|
|
|
|
int ret;
|
|
|
|
int page_queue;
|
|
|
|
u8 status;
|
|
|
|
u8 token;
|
2014-07-17 05:04:44 +08:00
|
|
|
u64 ts1;
|
|
|
|
u64 ts2;
|
2013-10-23 14:53:14 +08:00
|
|
|
u16 op;
|
2017-02-09 19:20:46 +08:00
|
|
|
bool polling;
|
net/mlx5: Avoid possible free of command entry while timeout comp handler
Upon command completion timeout, driver simulates a forced command
completion. In a rare case where real interrupt for that command arrives
simultaneously, it might release the command entry while the forced
handler might still access it.
Fix that by adding an entry refcount, to track current amount of allowed
handlers. Command entry to be released only when this refcount is
decremented to zero.
Command refcount is always initialized to one. For callback commands,
command completion handler is the symmetric flow to decrement it. For
non-callback commands, it is wait_func().
Before ringing the doorbell, increment the refcount for the real completion
handler. Once the real completion handler is called, it will decrement it.
For callback commands, once the delayed work is scheduled, increment the
refcount. Upon callback command completion handler, we will try to cancel
the timeout callback. In case of success, we need to decrement the callback
refcount as it will never run.
In addition, gather the entry index free and the entry free into a one
flow for all command types release.
Fixes: e126ba97dba9 ("mlx5: Add driver for Mellanox Connect-IB adapters")
Signed-off-by: Eran Ben Elisha <eranbe@mellanox.com>
Reviewed-by: Moshe Shemesh <moshe@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@nvidia.com>
2020-08-04 15:40:21 +08:00
|
|
|
/* Track the max comp handlers */
|
|
|
|
refcount_t refcnt;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_pas {
|
|
|
|
u64 pa;
|
|
|
|
u8 log_sz;
|
|
|
|
};
|
|
|
|
|
2015-06-05 00:30:41 +08:00
|
|
|
enum phy_port_state {
|
|
|
|
MLX5_AAA_111
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_hca_vport_context {
|
|
|
|
u32 field_select;
|
|
|
|
bool sm_virt_aware;
|
|
|
|
bool has_smi;
|
|
|
|
bool has_raw;
|
|
|
|
enum port_state_policy policy;
|
|
|
|
enum phy_port_state phys_state;
|
|
|
|
enum ib_port_state vport_state;
|
|
|
|
u8 port_physical_state;
|
|
|
|
u64 sys_image_guid;
|
|
|
|
u64 port_guid;
|
|
|
|
u64 node_guid;
|
|
|
|
u32 cap_mask1;
|
|
|
|
u32 cap_mask1_perm;
|
2018-12-09 17:49:51 +08:00
|
|
|
u16 cap_mask2;
|
|
|
|
u16 cap_mask2_perm;
|
2015-06-05 00:30:41 +08:00
|
|
|
u16 lid;
|
|
|
|
u8 init_type_reply; /* bitmask: see ib spec 14.2.5.6 InitTypeReply */
|
|
|
|
u8 lmc;
|
|
|
|
u8 subnet_timeout;
|
|
|
|
u16 sm_lid;
|
|
|
|
u8 sm_sl;
|
|
|
|
u16 qkey_violation_counter;
|
|
|
|
u16 pkey_violation_counter;
|
|
|
|
bool grh_required;
|
|
|
|
};
|
|
|
|
|
2018-01-02 22:08:06 +08:00
|
|
|
static inline void *mlx5_buf_offset(struct mlx5_frag_buf *buf, int offset)
|
2013-07-07 22:25:49 +08:00
|
|
|
{
|
2018-01-02 22:08:06 +08:00
|
|
|
return buf->frags->buf + offset;
|
2013-07-07 22:25:49 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Expand to two designated initialisers describing @field of
 * struct ib_unpacked_<header>: its byte offset within the struct and its
 * size in bytes. Intended for use inside a brace-enclosed initialiser of a
 * type that has .struct_offset_bytes and .struct_size_bytes members.
 */
#define STRUCT_FIELD(header, field)					      \
	.struct_offset_bytes = offsetof(struct ib_unpacked_ ## header, field), \
	.struct_size_bytes   = sizeof(((struct ib_unpacked_ ## header *)0)->field)
|
|
|
|
|
|
|
|
/* Fetch the mlx5 core device kept as @pdev's PCI driver data. */
static inline struct mlx5_core_dev *pci2mlx5_core_dev(struct pci_dev *pdev)
{
	struct mlx5_core_dev *mdev = pci_get_drvdata(pdev);

	return mdev;
}
|
|
|
|
|
|
|
|
extern struct dentry *mlx5_debugfs_root;
|
|
|
|
|
|
|
|
static inline u16 fw_rev_maj(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->fw_rev) & 0xffff;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u16 fw_rev_min(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->fw_rev) >> 16;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u16 fw_rev_sub(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->cmdif_rev_fw_sub) & 0xffff;
|
|
|
|
}
|
|
|
|
|
2014-02-23 20:19:10 +08:00
|
|
|
/* Return @key with its low 8 bits cleared. */
static inline u32 mlx5_base_mkey(const u32 key)
{
	const u32 low_byte = 0xff;

	return key & ~low_byte;
}
|
|
|
|
|
2021-03-11 15:09:15 +08:00
|
|
|
/*
 * Return 2^@log_sz shifted left by @log_stride, computed in 32 bits.
 * The two shifts are kept separate, exactly as written originally.
 */
static inline u32 wq_get_byte_sz(u8 log_sz, u8 log_stride)
{
	u32 nr_strides = (u32)1 << log_sz;

	return nr_strides << log_stride;
}
|
|
|
|
|
2018-09-12 20:36:41 +08:00
|
|
|
static inline void mlx5_init_fbc_offset(struct mlx5_buf_list *frags,
|
|
|
|
u8 log_stride, u8 log_sz,
|
2018-08-21 21:07:58 +08:00
|
|
|
u16 strides_offset,
|
2018-07-08 17:14:59 +08:00
|
|
|
struct mlx5_frag_buf_ctrl *fbc)
|
2018-01-02 22:08:06 +08:00
|
|
|
{
|
2018-09-12 20:36:41 +08:00
|
|
|
fbc->frags = frags;
|
2018-04-04 17:54:23 +08:00
|
|
|
fbc->log_stride = log_stride;
|
|
|
|
fbc->log_sz = log_sz;
|
2018-01-02 22:08:06 +08:00
|
|
|
fbc->sz_m1 = (1 << fbc->log_sz) - 1;
|
|
|
|
fbc->log_frag_strides = PAGE_SHIFT - fbc->log_stride;
|
|
|
|
fbc->frag_sz_m1 = (1 << fbc->log_frag_strides) - 1;
|
2018-07-08 17:14:59 +08:00
|
|
|
fbc->strides_offset = strides_offset;
|
|
|
|
}
|
|
|
|
|
2018-09-12 20:36:41 +08:00
|
|
|
/*
 * Initialise @fbc for @frags with a strides offset of zero; thin wrapper
 * around mlx5_init_fbc_offset().
 */
static inline void mlx5_init_fbc(struct mlx5_buf_list *frags,
				 u8 log_stride, u8 log_sz,
				 struct mlx5_frag_buf_ctrl *fbc)
{
	const u16 no_strides_offset = 0;

	mlx5_init_fbc_offset(frags, log_stride, log_sz, no_strides_offset, fbc);
}
|
|
|
|
|
2018-01-02 22:08:06 +08:00
|
|
|
static inline void *mlx5_frag_buf_get_wqe(struct mlx5_frag_buf_ctrl *fbc,
|
|
|
|
u32 ix)
|
|
|
|
{
|
2018-07-08 17:14:59 +08:00
|
|
|
unsigned int frag;
|
|
|
|
|
|
|
|
ix += fbc->strides_offset;
|
|
|
|
frag = ix >> fbc->log_frag_strides;
|
2018-01-02 22:08:06 +08:00
|
|
|
|
2018-09-12 20:36:41 +08:00
|
|
|
return fbc->frags[frag].buf + ((fbc->frag_sz_m1 & ix) << fbc->log_stride);
|
2018-01-02 22:08:06 +08:00
|
|
|
}
|
|
|
|
|
net/mlx5: WQ, fixes for fragmented WQ buffers API
mlx5e netdevice used to calculate fragment edges by a call to
mlx5_wq_cyc_get_frag_size(). This calculation did not give the correct
indication for queues smaller than a PAGE_SIZE, (broken by default on
PowerPC, where PAGE_SIZE == 64KB). Here it is replaced by the correct new
calls/API.
Since (TX/RX) Work Queues buffers are fragmented, here we introduce
changes to the API in core driver, so that it gets a stride index and
returns the index of last stride on same fragment, and an additional
wrapping function that returns the number of physically contiguous
strides that can be written contiguously to the work queue.
This obsoletes the following API functions, and their buggy
usage in EN driver:
* mlx5_wq_cyc_get_frag_size()
* mlx5_wq_cyc_ctr2fragix()
The new API improves modularity and hides the details of such
calculation for mlx5e netdevice and mlx5_ib rdma drivers.
New calculation is also more efficient, and improves performance
as follows:
Packet rate test: pktgen, UDP / IPv4, 64byte, single ring, 8K ring size.
Before: 16,477,619 pps
After: 17,085,793 pps
3.7% improvement
Fixes: 3a2f70331226 ("net/mlx5: Use order-0 allocations for all WQ types")
Signed-off-by: Tariq Toukan <tariqt@mellanox.com>
Reviewed-by: Eran Ben Elisha <eranbe@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
2018-08-21 19:41:41 +08:00
|
|
|
static inline u32
|
|
|
|
mlx5_frag_buf_get_idx_last_contig_stride(struct mlx5_frag_buf_ctrl *fbc, u32 ix)
|
|
|
|
{
|
|
|
|
u32 last_frag_stride_idx = (ix + fbc->strides_offset) | fbc->frag_sz_m1;
|
|
|
|
|
|
|
|
return min_t(u32, last_frag_stride_idx - fbc->strides_offset, fbc->sz_m1);
|
|
|
|
}
|
|
|
|
|
2020-03-19 03:44:32 +08:00
|
|
|
enum {
|
|
|
|
CMD_ALLOWED_OPCODE_ALL,
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_cmd_use_events(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cmd_use_polling(struct mlx5_core_dev *dev);
|
2020-03-19 03:44:32 +08:00
|
|
|
void mlx5_cmd_allowed_opcode(struct mlx5_core_dev *dev, u16 opcode);
|
2016-07-20 01:17:12 +08:00
|
|
|
|
2019-01-19 08:33:10 +08:00
|
|
|
struct mlx5_async_ctx {
|
|
|
|
struct mlx5_core_dev *dev;
|
|
|
|
atomic_t num_inflight;
|
|
|
|
struct wait_queue_head wait;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_async_work;
|
|
|
|
|
|
|
|
typedef void (*mlx5_async_cbk_t)(int status, struct mlx5_async_work *context);
|
|
|
|
|
|
|
|
struct mlx5_async_work {
|
|
|
|
struct mlx5_async_ctx *ctx;
|
|
|
|
mlx5_async_cbk_t user_callback;
|
|
|
|
};
|
|
|
|
|
|
|
|
void mlx5_cmd_init_async_ctx(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_async_ctx *ctx);
|
|
|
|
void mlx5_cmd_cleanup_async_ctx(struct mlx5_async_ctx *ctx);
|
|
|
|
int mlx5_cmd_exec_cb(struct mlx5_async_ctx *ctx, void *in, int in_size,
|
|
|
|
void *out, int out_size, mlx5_async_cbk_t callback,
|
|
|
|
struct mlx5_async_work *work);
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_cmd_exec(struct mlx5_core_dev *dev, void *in, int in_size, void *out,
|
|
|
|
int out_size);
|
2020-04-06 01:57:00 +08:00
|
|
|
|
|
|
|
#define mlx5_cmd_exec_inout(dev, ifc_cmd, in, out) \
|
|
|
|
({ \
|
|
|
|
mlx5_cmd_exec(dev, in, MLX5_ST_SZ_BYTES(ifc_cmd##_in), out, \
|
|
|
|
MLX5_ST_SZ_BYTES(ifc_cmd##_out)); \
|
|
|
|
})
|
|
|
|
|
|
|
|
#define mlx5_cmd_exec_in(dev, ifc_cmd, in) \
|
|
|
|
({ \
|
|
|
|
u32 _out[MLX5_ST_SZ_DW(ifc_cmd##_out)] = {}; \
|
|
|
|
mlx5_cmd_exec_inout(dev, ifc_cmd, in, _out); \
|
|
|
|
})
|
|
|
|
|
2017-02-09 19:20:46 +08:00
|
|
|
int mlx5_cmd_exec_polling(struct mlx5_core_dev *dev, void *in, int in_size,
|
|
|
|
void *out, int out_size);
|
2016-07-20 01:17:12 +08:00
|
|
|
void mlx5_cmd_mbox_status(void *out, u8 *status, u32 *syndrome);
|
2020-09-12 02:48:55 +08:00
|
|
|
bool mlx5_cmd_is_down(struct mlx5_core_dev *dev);
|
2016-07-20 01:17:12 +08:00
|
|
|
|
|
|
|
int mlx5_core_get_caps(struct mlx5_core_dev *dev, enum mlx5_cap_type cap_type);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_cmd_alloc_uar(struct mlx5_core_dev *dev, u32 *uarn);
|
|
|
|
int mlx5_cmd_free_uar(struct mlx5_core_dev *dev, u32 uarn);
|
2019-03-30 06:37:55 +08:00
|
|
|
void mlx5_health_flush(struct mlx5_core_dev *dev);
|
2015-10-08 22:14:00 +08:00
|
|
|
void mlx5_health_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_health_init(struct mlx5_core_dev *dev);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_start_health_poll(struct mlx5_core_dev *dev);
|
2018-08-05 14:19:33 +08:00
|
|
|
void mlx5_stop_health_poll(struct mlx5_core_dev *dev, bool disable_health);
|
2016-10-25 23:36:33 +08:00
|
|
|
void mlx5_drain_health_wq(struct mlx5_core_dev *dev);
|
2017-05-07 18:48:31 +08:00
|
|
|
void mlx5_trigger_health_work(struct mlx5_core_dev *dev);
|
2018-01-02 22:08:06 +08:00
|
|
|
int mlx5_buf_alloc(struct mlx5_core_dev *dev,
|
|
|
|
int size, struct mlx5_frag_buf *buf);
|
|
|
|
void mlx5_buf_free(struct mlx5_core_dev *dev, struct mlx5_frag_buf *buf);
|
2016-11-30 23:59:37 +08:00
|
|
|
int mlx5_frag_buf_alloc_node(struct mlx5_core_dev *dev, int size,
|
|
|
|
struct mlx5_frag_buf *buf, int node);
|
|
|
|
void mlx5_frag_buf_free(struct mlx5_core_dev *dev, struct mlx5_frag_buf *buf);
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_cmd_mailbox *mlx5_alloc_cmd_mailbox_chain(struct mlx5_core_dev *dev,
|
|
|
|
gfp_t flags, int npages);
|
|
|
|
void mlx5_free_cmd_mailbox_chain(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_cmd_mailbox *head);
|
2016-03-01 00:05:28 +08:00
|
|
|
int mlx5_core_create_mkey(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_core_mkey *mkey,
|
2016-07-16 11:28:36 +08:00
|
|
|
u32 *in, int inlen);
|
2016-03-01 00:05:28 +08:00
|
|
|
int mlx5_core_destroy_mkey(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_core_mkey *mkey);
|
|
|
|
int mlx5_core_query_mkey(struct mlx5_core_dev *dev, struct mlx5_core_mkey *mkey,
|
2016-07-16 11:28:36 +08:00
|
|
|
u32 *out, int outlen);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_core_alloc_pd(struct mlx5_core_dev *dev, u32 *pdn);
|
|
|
|
int mlx5_core_dealloc_pd(struct mlx5_core_dev *dev, u32 pdn);
|
2018-11-21 06:12:23 +08:00
|
|
|
int mlx5_pagealloc_init(struct mlx5_core_dev *dev);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_pagealloc_cleanup(struct mlx5_core_dev *dev);
|
2018-11-21 06:12:23 +08:00
|
|
|
void mlx5_pagealloc_start(struct mlx5_core_dev *dev);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_pagealloc_stop(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_core_req_pages_handler(struct mlx5_core_dev *dev, u16 func_id,
|
2019-02-13 14:55:35 +08:00
|
|
|
s32 npages, bool ec_function);
|
2013-07-18 20:31:08 +08:00
|
|
|
int mlx5_satisfy_startup_pages(struct mlx5_core_dev *dev, int boot);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_reclaim_startup_pages(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_register_debugfs(void);
|
|
|
|
void mlx5_unregister_debugfs(void);
|
2018-01-02 22:08:06 +08:00
|
|
|
|
|
|
|
void mlx5_fill_page_array(struct mlx5_frag_buf *buf, __be64 *pas);
|
2020-07-15 12:28:32 +08:00
|
|
|
void mlx5_fill_page_frag_array_perm(struct mlx5_frag_buf *buf, __be64 *pas, u8 perm);
|
2016-11-30 23:59:37 +08:00
|
|
|
void mlx5_fill_page_frag_array(struct mlx5_frag_buf *frag_buf, __be64 *pas);
|
2021-04-11 20:32:55 +08:00
|
|
|
int mlx5_vector2eqn(struct mlx5_core_dev *dev, int vector, int *eqn);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_core_attach_mcg(struct mlx5_core_dev *dev, union ib_gid *mgid, u32 qpn);
|
|
|
|
int mlx5_core_detach_mcg(struct mlx5_core_dev *dev, union ib_gid *mgid, u32 qpn);
|
|
|
|
|
2019-08-10 18:17:18 +08:00
|
|
|
void mlx5_qp_debugfs_init(struct mlx5_core_dev *dev);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_qp_debugfs_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_core_access_reg(struct mlx5_core_dev *dev, void *data_in,
|
|
|
|
int size_in, void *data_out, int size_out,
|
|
|
|
u16 reg_num, int arg, int write);
|
2015-05-29 03:28:42 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_db_alloc(struct mlx5_core_dev *dev, struct mlx5_db *db);
|
2015-07-24 04:35:57 +08:00
|
|
|
int mlx5_db_alloc_node(struct mlx5_core_dev *dev, struct mlx5_db *db,
|
|
|
|
int node);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_db_free(struct mlx5_core_dev *dev, struct mlx5_db *db);
|
|
|
|
|
|
|
|
const char *mlx5_command_str(int command);
|
2019-08-10 18:17:18 +08:00
|
|
|
void mlx5_cmdif_debugfs_init(struct mlx5_core_dev *dev);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_cmdif_debugfs_cleanup(struct mlx5_core_dev *dev);
|
2014-02-23 20:19:06 +08:00
|
|
|
int mlx5_core_create_psv(struct mlx5_core_dev *dev, u32 pdn,
|
|
|
|
int npsvs, u32 *sig_index);
|
|
|
|
int mlx5_core_destroy_psv(struct mlx5_core_dev *dev, int psv_num);
|
2014-10-02 17:19:45 +08:00
|
|
|
void mlx5_core_put_rsc(struct mlx5_core_rsc_common *common);
|
2014-12-11 23:04:19 +08:00
|
|
|
int mlx5_query_odp_caps(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_odp_caps *odp_caps);
|
2016-02-19 00:15:00 +08:00
|
|
|
int mlx5_core_query_ib_ppcnt(struct mlx5_core_dev *dev,
|
|
|
|
u8 port_num, void *out, size_t sz);
|
2013-07-07 22:25:49 +08:00
|
|
|
|
2016-06-23 22:02:37 +08:00
|
|
|
int mlx5_init_rl_table(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cleanup_rl_table(struct mlx5_core_dev *dev);
|
2018-03-19 21:10:29 +08:00
|
|
|
int mlx5_rl_add_rate(struct mlx5_core_dev *dev, u16 *index,
|
|
|
|
struct mlx5_rate_limit *rl);
|
|
|
|
void mlx5_rl_remove_rate(struct mlx5_core_dev *dev, struct mlx5_rate_limit *rl);
|
2016-06-23 22:02:37 +08:00
|
|
|
bool mlx5_rl_is_in_range(struct mlx5_core_dev *dev, u32 rate);
|
2020-02-20 03:05:17 +08:00
|
|
|
int mlx5_rl_add_rate_raw(struct mlx5_core_dev *dev, void *rl_in, u16 uid,
|
|
|
|
bool dedicated_entry, u16 *index);
|
|
|
|
void mlx5_rl_remove_rate_raw(struct mlx5_core_dev *dev, u16 index);
|
2018-03-19 21:10:29 +08:00
|
|
|
bool mlx5_rl_are_equal(struct mlx5_rate_limit *rl_0,
|
|
|
|
struct mlx5_rate_limit *rl_1);
|
2017-01-04 05:55:23 +08:00
|
|
|
int mlx5_alloc_bfreg(struct mlx5_core_dev *mdev, struct mlx5_sq_bfreg *bfreg,
|
|
|
|
bool map_wc, bool fast_path);
|
|
|
|
void mlx5_free_bfreg(struct mlx5_core_dev *mdev, struct mlx5_sq_bfreg *bfreg);
|
2016-06-23 22:02:37 +08:00
|
|
|
|
2018-11-20 02:52:38 +08:00
|
|
|
unsigned int mlx5_comp_vectors_count(struct mlx5_core_dev *dev);
|
|
|
|
struct cpumask *
|
|
|
|
mlx5_comp_irq_get_affinity_mask(struct mlx5_core_dev *dev, int vector);
|
2017-03-26 22:01:57 +08:00
|
|
|
unsigned int mlx5_core_reserved_gids_count(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_core_roce_gid_set(struct mlx5_core_dev *dev, unsigned int index,
|
|
|
|
u8 roce_version, u8 roce_l3_type, const u8 *gid,
|
2018-01-04 23:25:41 +08:00
|
|
|
const u8 *mac, bool vlan, u16 vlan_id, u8 port_num);
|
2017-03-26 22:01:57 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/* Return @mkey shifted right by 8, i.e. without its low byte. */
static inline u32 mlx5_mkey_to_idx(u32 mkey)
{
	u32 idx = mkey >> 8;

	return idx;
}
|
|
|
|
|
|
|
|
/* Return @mkey_idx shifted left by 8; the low byte of the result is zero. */
static inline u32 mlx5_idx_to_mkey(u32 mkey_idx)
{
	u32 mkey = mkey_idx << 8;

	return mkey;
}
|
|
|
|
|
2013-10-23 14:53:14 +08:00
|
|
|
/* Return the low 8 bits of @mkey. */
static inline u8 mlx5_mkey_variant(u32 mkey)
{
	/* Narrowing to u8 keeps exactly the bits that "& 0xff" would. */
	return (u8)mkey;
}
|
|
|
|
|
2021-01-27 07:24:11 +08:00
|
|
|
/* Async-atomic event notifier used by mlx5 core to forward FW
|
2021-07-30 11:03:00 +08:00
|
|
|
* events received from the event queue to mlx5 consumers.
|
2021-01-27 07:24:11 +08:00
|
|
|
* Optimise event queue dispatching.
|
|
|
|
*/
|
2018-11-27 06:38:56 +08:00
|
|
|
int mlx5_notifier_register(struct mlx5_core_dev *dev, struct notifier_block *nb);
|
|
|
|
int mlx5_notifier_unregister(struct mlx5_core_dev *dev, struct notifier_block *nb);
|
2021-01-27 07:24:11 +08:00
|
|
|
|
|
|
|
/* Async-atomic event notifier used for forwarding
|
|
|
|
* events from the event queue to the mlx5 events dispatcher,
|
|
|
|
* eswitch, clock and others.
|
|
|
|
*/
|
2019-07-01 00:23:24 +08:00
|
|
|
int mlx5_eq_notifier_register(struct mlx5_core_dev *dev, struct mlx5_nb *nb);
|
|
|
|
int mlx5_eq_notifier_unregister(struct mlx5_core_dev *dev, struct mlx5_nb *nb);
|
2018-11-27 06:38:56 +08:00
|
|
|
|
2021-01-27 07:24:11 +08:00
|
|
|
/* Blocking event notifier used to forward SW events, used for slow path */
|
|
|
|
int mlx5_blocking_notifier_register(struct mlx5_core_dev *dev, struct notifier_block *nb);
|
|
|
|
int mlx5_blocking_notifier_unregister(struct mlx5_core_dev *dev, struct notifier_block *nb);
|
|
|
|
int mlx5_blocking_notifier_call_chain(struct mlx5_core_dev *dev, unsigned int event,
|
|
|
|
void *data);
|
|
|
|
|
2015-06-05 00:30:42 +08:00
|
|
|
int mlx5_core_query_vendor_id(struct mlx5_core_dev *mdev, u32 *vendor_id);
|
2014-07-29 04:30:22 +08:00
|
|
|
|
2016-05-09 18:38:42 +08:00
|
|
|
int mlx5_cmd_create_vport_lag(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_cmd_destroy_vport_lag(struct mlx5_core_dev *dev);
|
2018-08-23 18:47:53 +08:00
|
|
|
bool mlx5_lag_is_roce(struct mlx5_core_dev *dev);
|
|
|
|
bool mlx5_lag_is_sriov(struct mlx5_core_dev *dev);
|
2019-02-22 00:24:48 +08:00
|
|
|
bool mlx5_lag_is_multipath(struct mlx5_core_dev *dev);
|
net/mlx5: Implement RoCE LAG feature
Available on dual port cards only, this feature keeps
track, using netdev LAG events, of the bonding
and link status of each port's PF netdev.
When both of the card's PF netdevs are enslaved to the
same bond/team master, and only them, LAG state
is active.
During LAG, only one IB device is present for both ports.
In addition to the above, this commit includes FW commands
used for managing the LAG, new facilities for adding and removing
a single device by interface, and port remap functionality according to
bond events.
Please note that this feature is currently used only for mimicking
Ethernet bonding for RoCE - netdevs functionality is not altered,
and their bonding continues to be managed solely by bond/team driver.
Signed-off-by: Aviv Heller <avivh@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
2016-04-17 21:57:32 +08:00
|
|
|
bool mlx5_lag_is_active(struct mlx5_core_dev *dev);
|
2021-08-04 07:19:47 +08:00
|
|
|
bool mlx5_lag_is_master(struct mlx5_core_dev *dev);
|
|
|
|
bool mlx5_lag_is_shared_fdb(struct mlx5_core_dev *dev);
|
2016-05-09 19:06:44 +08:00
|
|
|
struct net_device *mlx5_lag_get_roce_netdev(struct mlx5_core_dev *dev);
|
2020-05-01 03:21:41 +08:00
|
|
|
u8 mlx5_lag_get_slave_port(struct mlx5_core_dev *dev,
|
|
|
|
struct net_device *slave);
|
2017-12-21 23:38:26 +08:00
|
|
|
int mlx5_lag_query_cong_counters(struct mlx5_core_dev *dev,
|
|
|
|
u64 *values,
|
|
|
|
int num_counters,
|
|
|
|
size_t *offsets);
|
2021-08-04 07:19:47 +08:00
|
|
|
struct mlx5_core_dev *mlx5_lag_get_peer_mdev(struct mlx5_core_dev *dev);
|
2017-01-04 05:55:24 +08:00
|
|
|
struct mlx5_uars_page *mlx5_get_uars_page(struct mlx5_core_dev *mdev);
|
|
|
|
void mlx5_put_uars_page(struct mlx5_core_dev *mdev, struct mlx5_uars_page *up);
|
2019-08-30 07:42:30 +08:00
|
|
|
int mlx5_dm_sw_icm_alloc(struct mlx5_core_dev *dev, enum mlx5_sw_icm_type type,
|
2020-04-25 03:45:04 +08:00
|
|
|
u64 length, u32 log_alignment, u16 uid,
|
|
|
|
phys_addr_t *addr, u32 *obj_id);
|
2019-08-30 07:42:30 +08:00
|
|
|
int mlx5_dm_sw_icm_dealloc(struct mlx5_core_dev *dev, enum mlx5_sw_icm_type type,
|
|
|
|
u64 length, u16 uid, phys_addr_t addr, u32 obj_id);
|
net/mlx5: Implement RoCE LAG feature
Available on dual port cards only, this feature keeps
track, using netdev LAG events, of the bonding
and link status of each port's PF netdev.
When both of the card's PF netdevs are enslaved to the
same bond/team master, and only them, LAG state
is active.
During LAG, only one IB device is present for both ports.
In addition to the above, this commit includes FW commands
used for managing the LAG, new facilities for adding and removing
a single device by interface, and port remap functionality according to
bond events.
Please note that this feature is currently used only for mimicking
Ethernet bonding for RoCE - netdevs functionality is not altered,
and their bonding continues to be managed solely by bond/team driver.
Signed-off-by: Aviv Heller <avivh@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
2016-04-17 21:57:32 +08:00
|
|
|
|
2018-08-14 19:08:51 +08:00
|
|
|
#ifdef CONFIG_MLX5_CORE_IPOIB
|
2017-04-27 22:01:34 +08:00
|
|
|
struct net_device *mlx5_rdma_netdev_alloc(struct mlx5_core_dev *mdev,
|
|
|
|
struct ib_device *ibdev,
|
|
|
|
const char *name,
|
|
|
|
void (*setup)(struct net_device *));
|
|
|
|
#endif /* CONFIG_MLX5_CORE_IPOIB */
|
2018-08-14 19:08:51 +08:00
|
|
|
int mlx5_rdma_rn_get_params(struct mlx5_core_dev *mdev,
|
|
|
|
struct ib_device *device,
|
|
|
|
struct rdma_netdev_alloc_params *params);
|
2013-07-07 22:25:49 +08:00
|
|
|
|
2015-12-02 00:03:09 +08:00
|
|
|
/* PCI device flag bits; MLX5_PCI_DEV_IS_VF occupies bit 0. */
enum {
	MLX5_PCI_DEV_IS_VF = 1 << 0,
};
|
|
|
|
|
2019-05-15 13:04:27 +08:00
|
|
|
static inline bool mlx5_core_is_pf(const struct mlx5_core_dev *dev)
|
2015-12-02 00:03:09 +08:00
|
|
|
{
|
2019-06-29 06:35:58 +08:00
|
|
|
return dev->coredev_type == MLX5_COREDEV_PF;
|
2015-12-02 00:03:09 +08:00
|
|
|
}
|
|
|
|
|
2019-10-29 07:35:30 +08:00
|
|
|
static inline bool mlx5_core_is_vf(const struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return dev->coredev_type == MLX5_COREDEV_VF;
|
|
|
|
}
|
|
|
|
|
2020-11-21 07:03:36 +08:00
|
|
|
static inline bool mlx5_core_is_ecpf(const struct mlx5_core_dev *dev)
|
2019-02-13 14:55:35 +08:00
|
|
|
{
|
|
|
|
return dev->caps.embedded_cpu;
|
|
|
|
}
|
|
|
|
|
2019-05-15 13:04:27 +08:00
|
|
|
static inline bool
|
|
|
|
mlx5_core_is_ecpf_esw_manager(const struct mlx5_core_dev *dev)
|
2019-02-13 14:55:38 +08:00
|
|
|
{
|
|
|
|
return dev->caps.embedded_cpu && MLX5_CAP_GEN(dev, eswitch_manager);
|
|
|
|
}
|
|
|
|
|
2019-05-15 13:04:27 +08:00
|
|
|
static inline bool mlx5_ecpf_vport_exists(const struct mlx5_core_dev *dev)
|
2018-12-11 01:59:33 +08:00
|
|
|
{
|
|
|
|
return mlx5_core_is_pf(dev) && MLX5_CAP_ESW(dev, ecpf_vport_exists);
|
|
|
|
}
|
|
|
|
|
2019-05-15 13:04:27 +08:00
|
|
|
static inline u16 mlx5_core_max_vfs(const struct mlx5_core_dev *dev)
|
2019-02-13 14:55:39 +08:00
|
|
|
{
|
2019-06-11 07:38:19 +08:00
|
|
|
return dev->priv.sriov.max_vfs;
|
2019-02-13 14:55:39 +08:00
|
|
|
}
|
|
|
|
|
2015-06-05 00:30:41 +08:00
|
|
|
/*
 * Translate an encoded GID table size into a number of entries.
 *
 * @param: encoded size; values 0..4 are accepted.
 *
 * Return: 8 * 2^@param for @param in 0..4 (8, 16, 32, 64 or 128); for
 * any larger @param a warning is logged and 0 is returned.
 */
static inline int mlx5_get_gid_table_len(u16 param)
{
	if (param <= 4)
		return 8 * (1 << param);

	pr_warn("gid table length is zero\n");
	return 0;
}
|
|
|
|
|
2016-06-23 22:02:37 +08:00
|
|
|
static inline bool mlx5_rl_is_supported(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return !!(dev->priv.rl_table.max_size);
|
|
|
|
}
|
|
|
|
|
{net, IB}/mlx5: Manage port association for multiport RoCE
When mlx5_ib_add is called determine if the mlx5 core device being
added is capable of dual port RoCE operation. If it is, determine
whether it is a master device or a slave device using the
num_vhca_ports and affiliate_nic_vport_criteria capabilities.
If the device is a slave, attempt to find a master device to affiliate it
with. Devices that can be affiliated will share a system image guid. If
none are found place it on a list of unaffiliated ports. If a master is
found bind the port to it by configuring the port affiliation in the NIC
vport context.
Similarly when mlx5_ib_remove is called determine the port type. If it's
a slave port, unaffiliate it from the master device, otherwise just
remove it from the unaffiliated port list.
The IB device is registered as a multiport device, even if a 2nd port is
not available for affiliation. When the 2nd port is affiliated later the
GID cache must be refreshed in order to get the default GIDs for the 2nd
port in the cache. Export roce_rescan_device to provide a mechanism to
refresh the cache after a new port is bound.
In a multiport configuration all IB object (QP, MR, PD, etc) related
commands should flow through the master mlx5_core_dev, other commands
must be sent to the slave port mlx5_core_mdev, an interface is provide
to get the correct mdev for non IB object commands.
Signed-off-by: Daniel Jurgens <danielj@mellanox.com>
Reviewed-by: Parav Pandit <parav@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
Signed-off-by: Jason Gunthorpe <jgg@mellanox.com>
2018-01-04 23:25:36 +08:00
|
|
|
static inline int mlx5_core_is_mp_slave(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return MLX5_CAP_GEN(dev, affiliate_nic_vport_criteria) &&
|
|
|
|
MLX5_CAP_GEN(dev, num_vhca_ports) <= 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int mlx5_core_is_mp_master(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return MLX5_CAP_GEN(dev, num_vhca_ports) > 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Tell whether @dev takes part in a multiport configuration, either as
 * a slave or as a master.
 *
 * Return: 1 when mlx5_core_is_mp_slave() or mlx5_core_is_mp_master()
 * reports non-zero for @dev, otherwise 0.
 */
static inline int mlx5_core_mp_enabled(struct mlx5_core_dev *dev)
{
	/* The master check is only evaluated when @dev is not a slave. */
	if (mlx5_core_is_mp_slave(dev))
		return 1;

	return mlx5_core_is_mp_master(dev) != 0;
}
|
|
|
|
|
2018-01-04 23:25:35 +08:00
|
|
|
static inline int mlx5_core_native_port_num(struct mlx5_core_dev *dev)
|
|
|
|
{
|
{net, IB}/mlx5: Manage port association for multiport RoCE
When mlx5_ib_add is called determine if the mlx5 core device being
added is capable of dual port RoCE operation. If it is, determine
whether it is a master device or a slave device using the
num_vhca_ports and affiliate_nic_vport_criteria capabilities.
If the device is a slave, attempt to find a master device to affiliate it
with. Devices that can be affiliated will share a system image guid. If
none are found place it on a list of unaffiliated ports. If a master is
found bind the port to it by configuring the port affiliation in the NIC
vport context.
Similarly when mlx5_ib_remove is called determine the port type. If it's
a slave port, unaffiliate it from the master device, otherwise just
remove it from the unaffiliated port list.
The IB device is registered as a multiport device, even if a 2nd port is
not available for affiliation. When the 2nd port is affiliated later the
GID cache must be refreshed in order to get the default GIDs for the 2nd
port in the cache. Export roce_rescan_device to provide a mechanism to
refresh the cache after a new port is bound.
In a multiport configuration all IB object (QP, MR, PD, etc) related
commands should flow through the master mlx5_core_dev, other commands
must be sent to the slave port mlx5_core_mdev, an interface is provide
to get the correct mdev for non IB object commands.
Signed-off-by: Daniel Jurgens <danielj@mellanox.com>
Reviewed-by: Parav Pandit <parav@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
Signed-off-by: Jason Gunthorpe <jgg@mellanox.com>
2018-01-04 23:25:36 +08:00
|
|
|
if (!mlx5_core_mp_enabled(dev))
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
return MLX5_CAP_GEN(dev, native_port_num);
|
2018-01-04 23:25:35 +08:00
|
|
|
}
|
|
|
|
|
2015-10-08 22:13:58 +08:00
|
|
|
enum {
|
|
|
|
MLX5_TRIGGERED_CMD_COMP = (u64)1 << 32,
|
|
|
|
};
|
|
|
|
|
2021-03-04 20:45:15 +08:00
|
|
|
static inline bool mlx5_is_roce_init_enabled(struct mlx5_core_dev *dev)
|
2019-11-09 07:45:24 +08:00
|
|
|
{
|
|
|
|
struct devlink *devlink = priv_to_devlink(dev);
|
|
|
|
union devlink_param_value val;
|
|
|
|
|
|
|
|
devlink_param_driverinit_value_get(devlink,
|
|
|
|
DEVLINK_PARAM_GENERIC_ID_ENABLE_ROCE,
|
|
|
|
&val);
|
|
|
|
return val.vbool;
|
|
|
|
}
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
#endif /* MLX5_DRIVER_H */
|