2013-07-07 22:25:49 +08:00
|
|
|
/*
 * Copyright (c) 2013-2015, Mellanox Technologies. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
|
|
|
|
|
|
|
|
#ifndef MLX5_DRIVER_H
|
|
|
|
#define MLX5_DRIVER_H
|
|
|
|
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/completion.h>
|
|
|
|
#include <linux/pci.h>
|
|
|
|
#include <linux/spinlock_types.h>
|
|
|
|
#include <linux/semaphore.h>
|
2014-02-14 12:45:17 +08:00
|
|
|
#include <linux/slab.h>
|
2013-07-07 22:25:49 +08:00
|
|
|
#include <linux/vmalloc.h>
|
|
|
|
#include <linux/radix-tree.h>
|
2016-05-13 20:55:41 +08:00
|
|
|
#include <linux/workqueue.h>
|
net/mlx5_core: Use tasklet for user-space CQ completion events
Previously, we've fired all our completion callbacks straight from
our ISR.
Some of those callbacks were lightweight (for example, mlx5 Ethernet
napi callbacks), but some of them did more work (for example,
the user-space RDMA stack uverbs' completion handler). Besides that,
doing more than the minimal work in ISR is generally considered wrong,
it could even lead to a hard lockup of the system. Since when a lot
of completion events are generated by the hardware, the loop over
those events could be so long, that we'll get into a hard lockup by
the system watchdog.
In order to avoid that, add a new way of invoking completion events
callbacks. In the interrupt itself, we add the CQs which receive
completion event to a per-EQ list and schedule a tasklet. In the
tasklet context we loop over all the CQs in the list and invoke the
user callback.
Signed-off-by: Matan Barak <matanb@mellanox.com>
Signed-off-by: Doug Ledford <dledford@redhat.com>
2016-04-17 22:08:40 +08:00
|
|
|
#include <linux/interrupt.h>
|
2014-02-14 12:45:17 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
#include <linux/mlx5/device.h>
|
|
|
|
#include <linux/mlx5/doorbell.h>
|
2016-06-17 20:33:32 +08:00
|
|
|
#include <linux/mlx5/srq.h>
|
2013-07-07 22:25:49 +08:00
|
|
|
|
|
|
|
/* Sizes of the fixed character buffers used for board id and device name. */
enum {
	MLX5_BOARD_ID_LEN = 64,
	MLX5_MAX_NAME_LEN = 16,
};
|
|
|
|
|
|
|
|
/* Command interface limits: timeout in milliseconds and workqueue name size. */
enum {
	/* one minute for the sake of bringup. Generally, commands must always
	 * complete and we may need to increase this timeout value
	 */
	MLX5_CMD_TIMEOUT_MSEC	= 60 * 1000,
	MLX5_CMD_WQ_MAX_NAME	= 32,
};
|
|
|
|
|
|
|
|
/*
 * Command ownership values (software vs. hardware) and the success status
 * code. Note that CMD_OWNER_SW and CMD_STATUS_SUCCESS share the value 0.
 */
enum {
	CMD_OWNER_SW		= 0x0,
	CMD_OWNER_HW		= 0x1,
	CMD_STATUS_SUCCESS	= 0,
};
|
|
|
|
|
|
|
|
/* Special QP kinds, numbered consecutively from 0. */
enum mlx5_sqp_t {
	MLX5_SQP_SMI		= 0,
	MLX5_SQP_GSI		= 1,
	MLX5_SQP_IEEE_1588	= 2,
	MLX5_SQP_SNIFFER	= 3,
	MLX5_SQP_SYNC_UMR	= 4,
};
|
|
|
|
|
|
|
|
/* Upper bound on ports per device; sizes the per-port capability array. */
enum {
	MLX5_MAX_PORTS	= 2,
};
|
|
|
|
|
|
|
|
/*
 * EQ vector indices. The first three are fixed; MLX5_EQ_VEC_COMP_BASE
 * implicitly takes the next value (3).
 */
enum {
	MLX5_EQ_VEC_PAGES	 = 0,
	MLX5_EQ_VEC_CMD		 = 1,
	MLX5_EQ_VEC_ASYNC	 = 2,
	MLX5_EQ_VEC_COMP_BASE,
};
|
|
|
|
|
|
|
|
/* Size of the character buffer holding an IRQ name. */
enum {
	MLX5_MAX_IRQ_NAME	= 32
};
|
|
|
|
|
|
|
|
/* Atomic mode selectors: mode numbers 1..8 placed at bit offset 16. */
enum {
	MLX5_ATOMIC_MODE_IB_COMP	= 1 << 16,
	MLX5_ATOMIC_MODE_CX		= 2 << 16,
	MLX5_ATOMIC_MODE_8B		= 3 << 16,
	MLX5_ATOMIC_MODE_16B		= 4 << 16,
	MLX5_ATOMIC_MODE_32B		= 5 << 16,
	MLX5_ATOMIC_MODE_64B		= 6 << 16,
	MLX5_ATOMIC_MODE_128B		= 7 << 16,
	MLX5_ATOMIC_MODE_256B		= 8 << 16,
};
|
|
|
|
|
|
|
|
/*
 * Numeric identifiers of the MLX5_REG_* registers.
 * The entries are intentionally kept in their original order, which is not
 * sorted by value.
 */
enum {
	MLX5_REG_QETCR		 = 0x4005,
	MLX5_REG_QTCT		 = 0x400a,
	MLX5_REG_PCAP		 = 0x5001,
	MLX5_REG_PMTU		 = 0x5003,
	MLX5_REG_PTYS		 = 0x5004,
	MLX5_REG_PAOS		 = 0x5006,
	MLX5_REG_PFCC		 = 0x5007,
	MLX5_REG_PPCNT		 = 0x5008,
	MLX5_REG_PMAOS		 = 0x5012,
	MLX5_REG_PUDE		 = 0x5009,
	MLX5_REG_PMPE		 = 0x5010,
	MLX5_REG_PELC		 = 0x500e,
	MLX5_REG_PVLC		 = 0x500f,
	MLX5_REG_PCMR		 = 0x5041,
	MLX5_REG_PMLP		 = 0x5002,
	MLX5_REG_NODE_DESC	 = 0x6001,
	MLX5_REG_HOST_ENDIANNESS = 0x7004,
	MLX5_REG_MCIA		 = 0x9014,
	MLX5_REG_MLCR		 = 0x902b,
};
|
|
|
|
|
2015-12-14 22:34:10 +08:00
|
|
|
/* Bit flags naming the atomic operations (compare-and-swap, fetch-and-add). */
enum {
	MLX5_ATOMIC_OPS_CMP_SWAP	= 1 << 0,
	MLX5_ATOMIC_OPS_FETCH_ADD	= 1 << 1,
};
|
|
|
|
|
2014-12-11 23:04:19 +08:00
|
|
|
/* Bit flags for page-fault resume; bits 0-2 plus an error flag at bit 7. */
enum mlx5_page_fault_resume_flags {
	MLX5_PAGE_FAULT_RESUME_REQUESTOR = 1 << 0,
	MLX5_PAGE_FAULT_RESUME_WRITE	 = 1 << 1,
	MLX5_PAGE_FAULT_RESUME_RDMA	 = 1 << 2,
	MLX5_PAGE_FAULT_RESUME_ERROR	 = 1 << 7,
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/* Kind of resource a struct mlx5_rsc_debug entry describes (QP, EQ or CQ). */
enum dbg_rsc_type {
	MLX5_DBG_RSC_QP,
	MLX5_DBG_RSC_EQ,
	MLX5_DBG_RSC_CQ,
};
|
|
|
|
|
|
|
|
/*
 * One entry of the trailing fields array in struct mlx5_rsc_debug:
 * a dentry pointer paired with an integer.
 * NOTE(review): 'i' is presumably the field's index - confirm against users.
 */
struct mlx5_field_desc {
	struct dentry	       *dent;
	int			i;
};
|
|
|
|
|
|
|
|
struct mlx5_rsc_debug {
|
|
|
|
struct mlx5_core_dev *dev;
|
|
|
|
void *object;
|
|
|
|
enum dbg_rsc_type type;
|
|
|
|
struct dentry *root;
|
|
|
|
struct mlx5_field_desc fields[0];
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Device event codes, numbered implicitly from 0. Passed as the 'event'
 * argument of the event callback in struct mlx5_core_dev.
 */
enum mlx5_dev_event {
	MLX5_DEV_EVENT_SYS_ERROR,
	MLX5_DEV_EVENT_PORT_UP,
	MLX5_DEV_EVENT_PORT_DOWN,
	MLX5_DEV_EVENT_PORT_INITIALIZED,
	MLX5_DEV_EVENT_LID_CHANGE,
	MLX5_DEV_EVENT_PKEY_CHANGE,
	MLX5_DEV_EVENT_GUID_CHANGE,
	MLX5_DEV_EVENT_CLIENT_REREG,
};
|
|
|
|
|
2015-05-29 03:28:43 +08:00
|
|
|
/* Port status values; numbering starts at 1, 0 is not assigned. */
enum mlx5_port_status {
	MLX5_PORT_UP        = 1,
	MLX5_PORT_DOWN      = 2,
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_uuar_info {
|
|
|
|
struct mlx5_uar *uars;
|
|
|
|
int num_uars;
|
|
|
|
int num_low_latency_uuars;
|
|
|
|
unsigned long *bitmap;
|
|
|
|
unsigned int *count;
|
|
|
|
struct mlx5_bf *bfs;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* protect uuar allocation data structs
|
|
|
|
*/
|
|
|
|
struct mutex lock;
|
2014-01-30 19:49:48 +08:00
|
|
|
u32 ver;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_bf {
|
|
|
|
void __iomem *reg;
|
|
|
|
void __iomem *regreg;
|
|
|
|
int buf_size;
|
|
|
|
struct mlx5_uar *uar;
|
|
|
|
unsigned long offset;
|
|
|
|
int need_lock;
|
|
|
|
/* protect blue flame buffer selection when needed
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
|
|
|
|
/* serialize 64 bit writes when done as two 32 bit accesses
|
|
|
|
*/
|
|
|
|
spinlock_t lock32;
|
|
|
|
int uuarn;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_first {
|
|
|
|
__be32 data[4];
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_msg {
|
|
|
|
struct list_head list;
|
|
|
|
struct cache_ent *cache;
|
|
|
|
u32 len;
|
|
|
|
struct mlx5_cmd_first first;
|
|
|
|
struct mlx5_cmd_mailbox *next;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_debug {
|
|
|
|
struct dentry *dbg_root;
|
|
|
|
struct dentry *dbg_in;
|
|
|
|
struct dentry *dbg_out;
|
|
|
|
struct dentry *dbg_outlen;
|
|
|
|
struct dentry *dbg_status;
|
|
|
|
struct dentry *dbg_run;
|
|
|
|
void *in_msg;
|
|
|
|
void *out_msg;
|
|
|
|
u8 status;
|
|
|
|
u16 inlen;
|
|
|
|
u16 outlen;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct cache_ent {
|
|
|
|
/* protect block chain allocations
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
struct list_head head;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct cmd_msg_cache {
|
|
|
|
struct cache_ent large;
|
|
|
|
struct cache_ent med;
|
|
|
|
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_stats {
|
|
|
|
u64 sum;
|
|
|
|
u64 n;
|
|
|
|
struct dentry *root;
|
|
|
|
struct dentry *avg;
|
|
|
|
struct dentry *count;
|
|
|
|
/* protect command average calculations */
|
|
|
|
spinlock_t lock;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd {
|
2015-04-02 22:07:25 +08:00
|
|
|
void *cmd_alloc_buf;
|
|
|
|
dma_addr_t alloc_dma;
|
|
|
|
int alloc_size;
|
2013-07-07 22:25:49 +08:00
|
|
|
void *cmd_buf;
|
|
|
|
dma_addr_t dma;
|
|
|
|
u16 cmdif_rev;
|
|
|
|
u8 log_sz;
|
|
|
|
u8 log_stride;
|
|
|
|
int max_reg_cmds;
|
|
|
|
int events;
|
|
|
|
u32 __iomem *vector;
|
|
|
|
|
|
|
|
/* protect command queue allocations
|
|
|
|
*/
|
|
|
|
spinlock_t alloc_lock;
|
|
|
|
|
|
|
|
/* protect token allocations
|
|
|
|
*/
|
|
|
|
spinlock_t token_lock;
|
|
|
|
u8 token;
|
|
|
|
unsigned long bitmask;
|
|
|
|
char wq_name[MLX5_CMD_WQ_MAX_NAME];
|
|
|
|
struct workqueue_struct *wq;
|
|
|
|
struct semaphore sem;
|
|
|
|
struct semaphore pages_sem;
|
|
|
|
int mode;
|
|
|
|
struct mlx5_cmd_work_ent *ent_arr[MLX5_MAX_COMMANDS];
|
|
|
|
struct pci_pool *pool;
|
|
|
|
struct mlx5_cmd_debug dbg;
|
|
|
|
struct cmd_msg_cache cache;
|
|
|
|
int checksum_disabled;
|
|
|
|
struct mlx5_cmd_stats stats[MLX5_CMD_OP_MAX];
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_port_caps {
|
|
|
|
int gid_table_len;
|
|
|
|
int pkey_table_len;
|
2015-05-29 03:28:41 +08:00
|
|
|
u8 ext_port_cap;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cmd_mailbox {
|
|
|
|
void *buf;
|
|
|
|
dma_addr_t dma;
|
|
|
|
struct mlx5_cmd_mailbox *next;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_buf_list {
|
|
|
|
void *buf;
|
|
|
|
dma_addr_t map;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_buf {
|
|
|
|
struct mlx5_buf_list direct;
|
|
|
|
int npages;
|
|
|
|
int size;
|
2014-07-29 04:30:23 +08:00
|
|
|
u8 page_shift;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
net/mlx5_core: Use tasklet for user-space CQ completion events
Previously, we've fired all our completion callbacks straight from
our ISR.
Some of those callbacks were lightweight (for example, mlx5 Ethernet
napi callbacks), but some of them did more work (for example,
the user-space RDMA stack uverbs' completion handler). Besides that,
doing more than the minimal work in ISR is generally considered wrong,
it could even lead to a hard lockup of the system. Since when a lot
of completion events are generated by the hardware, the loop over
those events could be so long, that we'll get into a hard lockup by
the system watchdog.
In order to avoid that, add a new way of invoking completion events
callbacks. In the interrupt itself, we add the CQs which receive
completion event to a per-EQ list and schedule a tasklet. In the
tasklet context we loop over all the CQs in the list and invoke the
user callback.
Signed-off-by: Matan Barak <matanb@mellanox.com>
Signed-off-by: Doug Ledford <dledford@redhat.com>
2016-04-17 22:08:40 +08:00
|
|
|
struct mlx5_eq_tasklet {
|
|
|
|
struct list_head list;
|
|
|
|
struct list_head process_list;
|
|
|
|
struct tasklet_struct task;
|
|
|
|
/* lock on completion tasklet list */
|
|
|
|
spinlock_t lock;
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_eq {
|
|
|
|
struct mlx5_core_dev *dev;
|
|
|
|
__be32 __iomem *doorbell;
|
|
|
|
u32 cons_index;
|
|
|
|
struct mlx5_buf buf;
|
|
|
|
int size;
|
2016-01-17 17:25:47 +08:00
|
|
|
unsigned int irqn;
|
2013-07-07 22:25:49 +08:00
|
|
|
u8 eqn;
|
|
|
|
int nent;
|
|
|
|
u64 mask;
|
|
|
|
struct list_head list;
|
|
|
|
int index;
|
|
|
|
struct mlx5_rsc_debug *dbg;
|
net/mlx5_core: Use tasklet for user-space CQ completion events
Previously, we've fired all our completion callbacks straight from
our ISR.
Some of those callbacks were lightweight (for example, mlx5 Ethernet
napi callbacks), but some of them did more work (for example,
the user-space RDMA stack uverbs' completion handler). Besides that,
doing more than the minimal work in ISR is generally considered wrong,
it could even lead to a hard lockup of the system. Since when a lot
of completion events are generated by the hardware, the loop over
those events could be so long, that we'll get into a hard lockup by
the system watchdog.
In order to avoid that, add a new way of invoking completion events
callbacks. In the interrupt itself, we add the CQs which receive
completion event to a per-EQ list and schedule a tasklet. In the
tasklet context we loop over all the CQs in the list and invoke the
user callback.
Signed-off-by: Matan Barak <matanb@mellanox.com>
Signed-off-by: Doug Ledford <dledford@redhat.com>
2016-04-17 22:08:40 +08:00
|
|
|
struct mlx5_eq_tasklet tasklet_ctx;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
2014-02-23 20:19:06 +08:00
|
|
|
struct mlx5_core_psv {
|
|
|
|
u32 psv_idx;
|
|
|
|
struct psv_layout {
|
|
|
|
u32 pd;
|
|
|
|
u16 syndrome;
|
|
|
|
u16 reserved;
|
|
|
|
u16 bg;
|
|
|
|
u16 app_tag;
|
|
|
|
u32 ref_tag;
|
|
|
|
} psv;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_core_sig_ctx {
|
|
|
|
struct mlx5_core_psv psv_memory;
|
|
|
|
struct mlx5_core_psv psv_wire;
|
2014-02-23 20:19:12 +08:00
|
|
|
struct ib_sig_err err_item;
|
|
|
|
bool sig_status_checked;
|
|
|
|
bool sig_err_exists;
|
|
|
|
u32 sigerr_count;
|
2014-02-23 20:19:06 +08:00
|
|
|
};
|
2013-07-07 22:25:49 +08:00
|
|
|
|
2016-03-01 00:05:28 +08:00
|
|
|
struct mlx5_core_mkey {
|
2013-07-07 22:25:49 +08:00
|
|
|
u64 iova;
|
|
|
|
u64 size;
|
|
|
|
u32 key;
|
|
|
|
u32 pd;
|
|
|
|
};
|
|
|
|
|
2014-10-02 17:19:45 +08:00
|
|
|
enum mlx5_res_type {
|
2016-01-15 01:13:00 +08:00
|
|
|
MLX5_RES_QP = MLX5_EVENT_QUEUE_TYPE_QP,
|
|
|
|
MLX5_RES_RQ = MLX5_EVENT_QUEUE_TYPE_RQ,
|
|
|
|
MLX5_RES_SQ = MLX5_EVENT_QUEUE_TYPE_SQ,
|
|
|
|
MLX5_RES_SRQ = 3,
|
|
|
|
MLX5_RES_XSRQ = 4,
|
2014-10-02 17:19:45 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_core_rsc_common {
|
|
|
|
enum mlx5_res_type res;
|
|
|
|
atomic_t refcount;
|
|
|
|
struct completion free;
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_core_srq {
|
2015-06-05 00:30:38 +08:00
|
|
|
struct mlx5_core_rsc_common common; /* must be first */
|
2013-07-07 22:25:49 +08:00
|
|
|
u32 srqn;
|
|
|
|
int max;
|
|
|
|
int max_gs;
|
|
|
|
int max_avail_gather;
|
|
|
|
int wqe_shift;
|
|
|
|
void (*event) (struct mlx5_core_srq *, enum mlx5_event);
|
|
|
|
|
|
|
|
atomic_t refcount;
|
|
|
|
struct completion free;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_eq_table {
|
|
|
|
void __iomem *update_ci;
|
|
|
|
void __iomem *update_arm_ci;
|
2015-04-02 22:07:32 +08:00
|
|
|
struct list_head comp_eqs_list;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_eq pages_eq;
|
|
|
|
struct mlx5_eq async_eq;
|
|
|
|
struct mlx5_eq cmd_eq;
|
|
|
|
int num_comp_vectors;
|
|
|
|
/* protect EQs list
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_uar {
|
|
|
|
u32 index;
|
|
|
|
struct list_head bf_list;
|
|
|
|
unsigned free_bf_bmap;
|
net/mlx5e: TX latency optimization to save DMA reads
A regular TX WQE execution involves two or more DMA reads -
one to fetch the WQE, and another one per WQE gather entry.
These DMA reads obviously increase the TX latency.
There are two mlx5 mechanisms to bypass these DMA reads:
1) Inline WQE
2) Blue Flame (BF)
An inline WQE contains a whole packet, thus saves the DMA read/s
of the regular WQE gather entry/s. Inline WQE support was already
added in the previous commit.
A BF WQE is written directly to the device I/O mapped memory, thus
enables saving the DMA read that fetches the WQE.
The BF WQE I/O write must be in cache line granularity, thus uses
the CPU write combining mechanism.
A BF WQE I/O write acts also as a TX doorbell for notifying the
device of new TX WQEs.
A BF WQE is written to the same I/O mapped address as the regular TX
doorbell, thus this address is being mapped twice - once by ioremap()
and once by io_mapping_map_wc().
While both mechanisms reduce the TX latency, they both consume more CPU
cycles than a regular WQE:
- A BF WQE must still be written to host memory, in addition to being
written directly to the device I/O mapped memory.
- An inline WQE involves copying the SKB data into it.
To handle this tradeoff, we introduce here a heuristic algorithm that
strives to avoid using these two mechanisms in case the TX queue is
being back-pressured by the device, and limit their usage rate otherwise.
An inline WQE will always be "Blue Flamed" (written directly to the
device I/O mapped memory) while a BF WQE may not be inlined (may contain
gather entries).
Preliminary testing using netperf UDP_RR shows that the latency goes down
from 17.5us to 16.9us, while the message rate (tested with pktgen) stays
the same.
Signed-off-by: Achiad Shochat <achiad@mellanox.com>
Signed-off-by: Amir Vadai <amirv@mellanox.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-07-24 04:35:59 +08:00
|
|
|
void __iomem *bf_map;
|
2013-07-07 22:25:49 +08:00
|
|
|
void __iomem *map;
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
struct mlx5_core_health {
|
|
|
|
struct health_buffer __iomem *health;
|
|
|
|
__be32 __iomem *health_counter;
|
|
|
|
struct timer_list timer;
|
|
|
|
u32 prev;
|
|
|
|
int miss_counter;
|
2015-10-14 22:43:45 +08:00
|
|
|
bool sick;
|
2015-10-08 22:14:00 +08:00
|
|
|
struct workqueue_struct *wq;
|
|
|
|
struct work_struct work;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_cq_table {
|
|
|
|
/* protect radix tree
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
struct radix_tree_root tree;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_qp_table {
|
|
|
|
/* protect radix tree
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
struct radix_tree_root tree;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_srq_table {
|
|
|
|
/* protect radix tree
|
|
|
|
*/
|
|
|
|
spinlock_t lock;
|
|
|
|
struct radix_tree_root tree;
|
|
|
|
};
|
|
|
|
|
2016-03-01 00:05:28 +08:00
|
|
|
struct mlx5_mkey_table {
|
2014-02-23 20:19:10 +08:00
|
|
|
/* protect radix tree
|
|
|
|
*/
|
|
|
|
rwlock_t lock;
|
|
|
|
struct radix_tree_root tree;
|
|
|
|
};
|
|
|
|
|
2015-12-02 00:03:09 +08:00
|
|
|
/* Per-VF state; currently only an 'enabled' flag. */
struct mlx5_vf_context {
	int	enabled;
};
|
|
|
|
|
|
|
|
/*
 * SR-IOV state: pointer to the per-VF contexts, the VF count and the
 * number of VFs currently enabled.
 */
struct mlx5_core_sriov {
	struct mlx5_vf_context	*vfs_ctx;
	int			num_vfs;
	int			enabled_vfs;
};
|
|
|
|
|
2015-05-29 03:28:39 +08:00
|
|
|
struct mlx5_irq_info {
|
|
|
|
cpumask_var_t mask;
|
|
|
|
char name[MLX5_MAX_IRQ_NAME];
|
|
|
|
};
|
|
|
|
|
2016-05-13 20:55:41 +08:00
|
|
|
struct mlx5_fc_stats {
|
2016-07-14 15:32:37 +08:00
|
|
|
struct rb_root counters;
|
2016-05-13 20:55:41 +08:00
|
|
|
struct list_head addlist;
|
|
|
|
/* protect addlist add/splice operations */
|
|
|
|
spinlock_t addlist_lock;
|
|
|
|
|
|
|
|
struct workqueue_struct *wq;
|
|
|
|
struct delayed_work work;
|
|
|
|
unsigned long next_query;
|
|
|
|
};
|
|
|
|
|
2015-12-02 00:03:18 +08:00
|
|
|
struct mlx5_eswitch;
|
net/mlx5: Implement RoCE LAG feature
Available on dual port cards only, this feature keeps
track, using netdev LAG events, of the bonding
and link status of each port's PF netdev.
When both of the card's PF netdevs are enslaved to the
same bond/team master, and only them, LAG state
is active.
During LAG, only one IB device is present for both ports.
In addition to the above, this commit includes FW commands
used for managing the LAG, new facilities for adding and removing
a single device by interface, and port remap functionality according to
bond events.
Please note that this feature is currently used only for mimicking
Ethernet bonding for RoCE - netdevs functionality is not altered,
and their bonding continues to be managed solely by bond/team driver.
Signed-off-by: Aviv Heller <avivh@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
2016-04-17 21:57:32 +08:00
|
|
|
struct mlx5_lag;
|
2015-12-02 00:03:18 +08:00
|
|
|
|
2016-06-23 22:02:37 +08:00
|
|
|
struct mlx5_rl_entry {
|
|
|
|
u32 rate;
|
|
|
|
u16 index;
|
|
|
|
u16 refcount;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_rl_table {
|
|
|
|
/* protect rate limit table */
|
|
|
|
struct mutex rl_lock;
|
|
|
|
u16 max_size;
|
|
|
|
u32 max_rate;
|
|
|
|
u32 min_rate;
|
|
|
|
struct mlx5_rl_entry *rl_entry;
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_priv {
|
|
|
|
char name[MLX5_MAX_NAME_LEN];
|
|
|
|
struct mlx5_eq_table eq_table;
|
2015-05-29 03:28:39 +08:00
|
|
|
struct msix_entry *msix_arr;
|
|
|
|
struct mlx5_irq_info *irq_info;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_uuar_info uuari;
|
|
|
|
MLX5_DECLARE_DOORBELL_LOCK(cq_uar_lock);
|
|
|
|
|
|
|
|
/* pages stuff */
|
|
|
|
struct workqueue_struct *pg_wq;
|
|
|
|
struct rb_root page_root;
|
|
|
|
int fw_pages;
|
2014-12-11 23:04:23 +08:00
|
|
|
atomic_t reg_pages;
|
2013-10-23 14:53:19 +08:00
|
|
|
struct list_head free_list;
|
2015-12-02 00:03:09 +08:00
|
|
|
int vfs_pages;
|
2013-07-07 22:25:49 +08:00
|
|
|
|
|
|
|
struct mlx5_core_health health;
|
|
|
|
|
|
|
|
struct mlx5_srq_table srq_table;
|
|
|
|
|
|
|
|
/* start: qp staff */
|
|
|
|
struct mlx5_qp_table qp_table;
|
|
|
|
struct dentry *qp_debugfs;
|
|
|
|
struct dentry *eq_debugfs;
|
|
|
|
struct dentry *cq_debugfs;
|
|
|
|
struct dentry *cmdif_debugfs;
|
|
|
|
/* end: qp staff */
|
|
|
|
|
|
|
|
/* start: cq staff */
|
|
|
|
struct mlx5_cq_table cq_table;
|
|
|
|
/* end: cq staff */
|
|
|
|
|
2016-03-01 00:05:28 +08:00
|
|
|
/* start: mkey staff */
|
|
|
|
struct mlx5_mkey_table mkey_table;
|
|
|
|
/* end: mkey staff */
|
2014-02-23 20:19:10 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/* start: alloc staff */
|
2015-07-24 04:35:57 +08:00
|
|
|
/* protect buffer alocation according to numa node */
|
|
|
|
struct mutex alloc_mutex;
|
|
|
|
int numa_node;
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mutex pgdir_mutex;
|
|
|
|
struct list_head pgdir_list;
|
|
|
|
/* end: alloc staff */
|
|
|
|
struct dentry *dbg_root;
|
|
|
|
|
|
|
|
/* protect mkey key part */
|
|
|
|
spinlock_t mkey_lock;
|
|
|
|
u8 mkey_key;
|
2014-07-29 04:30:22 +08:00
|
|
|
|
|
|
|
struct list_head dev_list;
|
|
|
|
struct list_head ctx_list;
|
|
|
|
spinlock_t ctx_lock;
|
2015-12-02 00:03:18 +08:00
|
|
|
|
2016-07-04 22:23:06 +08:00
|
|
|
struct mlx5_flow_steering *steering;
|
2015-12-02 00:03:18 +08:00
|
|
|
struct mlx5_eswitch *eswitch;
|
2015-12-02 00:03:09 +08:00
|
|
|
struct mlx5_core_sriov sriov;
|
net/mlx5: Implement RoCE LAG feature
Available on dual port cards only, this feature keeps
track, using netdev LAG events, of the bonding
and link status of each port's PF netdev.
When both of the card's PF netdevs are enslaved to the
same bond/team master, and only them, LAG state
is active.
During LAG, only one IB device is present for both ports.
In addition to the above, this commit includes FW commands
used for managing the LAG, new facilities for adding and removing
a single device by interface, and port remap functionality according to
bond events.
Please note that this feature is currently used only for mimicking
Ethernet bonding for RoCE - netdevs functionality is not altered,
and their bonding continues to be managed solely by bond/team driver.
Signed-off-by: Aviv Heller <avivh@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
2016-04-17 21:57:32 +08:00
|
|
|
struct mlx5_lag *lag;
|
2015-12-02 00:03:09 +08:00
|
|
|
unsigned long pci_dev_data;
|
2016-05-13 20:55:41 +08:00
|
|
|
struct mlx5_fc_stats fc_stats;
|
2016-06-23 22:02:37 +08:00
|
|
|
struct mlx5_rl_table rl_table;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
2015-10-14 22:43:46 +08:00
|
|
|
/* Overall device state: up (0) or internal error (1). */
enum mlx5_device_state {
	MLX5_DEVICE_STATE_UP,
	MLX5_DEVICE_STATE_INTERNAL_ERROR,
};
|
|
|
|
|
|
|
|
enum mlx5_interface_state {
|
2016-04-22 05:33:07 +08:00
|
|
|
MLX5_INTERFACE_STATE_DOWN = BIT(0),
|
|
|
|
MLX5_INTERFACE_STATE_UP = BIT(1),
|
|
|
|
MLX5_INTERFACE_STATE_SHUTDOWN = BIT(2),
|
2015-10-14 22:43:46 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/* PCI status of the device: disabled (0) or enabled (1). */
enum mlx5_pci_status {
	MLX5_PCI_STATUS_DISABLED,
	MLX5_PCI_STATUS_ENABLED,
};
|
|
|
|
|
2016-07-01 19:51:04 +08:00
|
|
|
struct mlx5_td {
|
|
|
|
struct list_head tirs_list;
|
|
|
|
u32 tdn;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5e_resources {
|
|
|
|
struct mlx5_uar cq_uar;
|
|
|
|
u32 pdn;
|
|
|
|
struct mlx5_td td;
|
|
|
|
struct mlx5_core_mkey mkey;
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_core_dev {
|
|
|
|
struct pci_dev *pdev;
|
2015-10-14 22:43:46 +08:00
|
|
|
/* sync pci state */
|
|
|
|
struct mutex pci_status_mutex;
|
|
|
|
enum mlx5_pci_status pci_status;
|
2013-07-07 22:25:49 +08:00
|
|
|
u8 rev_id;
|
|
|
|
char board_id[MLX5_BOARD_ID_LEN];
|
|
|
|
struct mlx5_cmd cmd;
|
2015-05-29 03:28:41 +08:00
|
|
|
struct mlx5_port_caps port_caps[MLX5_MAX_PORTS];
|
|
|
|
u32 hca_caps_cur[MLX5_CAP_NUM][MLX5_UN_SZ_DW(hca_cap_union)];
|
|
|
|
u32 hca_caps_max[MLX5_CAP_NUM][MLX5_UN_SZ_DW(hca_cap_union)];
|
2013-07-07 22:25:49 +08:00
|
|
|
phys_addr_t iseg_base;
|
|
|
|
struct mlx5_init_seg __iomem *iseg;
|
2015-10-14 22:43:46 +08:00
|
|
|
enum mlx5_device_state state;
|
|
|
|
/* sync interface state */
|
|
|
|
struct mutex intf_state_mutex;
|
2016-04-22 05:33:07 +08:00
|
|
|
unsigned long intf_state;
|
2013-07-07 22:25:49 +08:00
|
|
|
void (*event) (struct mlx5_core_dev *dev,
|
|
|
|
enum mlx5_dev_event event,
|
2014-07-29 04:30:24 +08:00
|
|
|
unsigned long param);
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_priv priv;
|
|
|
|
struct mlx5_profile *profile;
|
|
|
|
atomic_t num_qps;
|
2015-05-29 03:28:48 +08:00
|
|
|
u32 issi;
|
2016-07-01 19:51:04 +08:00
|
|
|
struct mlx5e_resources mlx5e_res;
|
2016-04-29 06:36:39 +08:00
|
|
|
#ifdef CONFIG_RFS_ACCEL
|
|
|
|
struct cpu_rmap *rmap;
|
|
|
|
#endif
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_db {
|
|
|
|
__be32 *db;
|
|
|
|
union {
|
|
|
|
struct mlx5_db_pgdir *pgdir;
|
|
|
|
struct mlx5_ib_user_db_page *user_page;
|
|
|
|
} u;
|
|
|
|
dma_addr_t dma;
|
|
|
|
int index;
|
|
|
|
};
|
|
|
|
|
|
|
|
enum {
|
|
|
|
MLX5_DB_PER_PAGE = PAGE_SIZE / L1_CACHE_BYTES,
|
|
|
|
};
|
|
|
|
|
|
|
|
/* Size constant for completion EQs. */
enum {
	MLX5_COMP_EQ_SIZE = 1024,
};
|
|
|
|
|
2015-05-29 03:28:42 +08:00
|
|
|
/* PTYS flags: IB is bit 0, EN is bit 2 (bit 1 is not assigned here). */
enum {
	MLX5_PTYS_IB = 1 << 0,
	MLX5_PTYS_EN = 1 << 2,
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_db_pgdir {
|
|
|
|
struct list_head list;
|
|
|
|
DECLARE_BITMAP(bitmap, MLX5_DB_PER_PAGE);
|
|
|
|
__be32 *db_page;
|
|
|
|
dma_addr_t db_dma;
|
|
|
|
};
|
|
|
|
|
|
|
|
typedef void (*mlx5_cmd_cbk_t)(int status, void *context);
|
|
|
|
|
|
|
|
struct mlx5_cmd_work_ent {
|
|
|
|
struct mlx5_cmd_msg *in;
|
|
|
|
struct mlx5_cmd_msg *out;
|
2013-10-23 14:53:14 +08:00
|
|
|
void *uout;
|
|
|
|
int uout_size;
|
2013-07-07 22:25:49 +08:00
|
|
|
mlx5_cmd_cbk_t callback;
|
2016-06-30 22:34:43 +08:00
|
|
|
struct delayed_work cb_timeout_work;
|
2013-07-07 22:25:49 +08:00
|
|
|
void *context;
|
2013-10-23 14:53:14 +08:00
|
|
|
int idx;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct completion done;
|
|
|
|
struct mlx5_cmd *cmd;
|
|
|
|
struct work_struct work;
|
|
|
|
struct mlx5_cmd_layout *lay;
|
|
|
|
int ret;
|
|
|
|
int page_queue;
|
|
|
|
u8 status;
|
|
|
|
u8 token;
|
2014-07-17 05:04:44 +08:00
|
|
|
u64 ts1;
|
|
|
|
u64 ts2;
|
2013-10-23 14:53:14 +08:00
|
|
|
u16 op;
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct mlx5_pas {
|
|
|
|
u64 pa;
|
|
|
|
u8 log_sz;
|
|
|
|
};
|
|
|
|
|
2015-06-05 00:30:41 +08:00
|
|
|
/*
 * Port state policy.
 *
 * MLX5_POLICY_INVALID is 0xffffffff, which does not fit in a signed 32-bit
 * int; before C23 this relies on the compiler accepting enumerator values
 * outside the range of int as an extension. The value is kept as is so the
 * enum's representation does not change.
 */
enum port_state_policy {
	MLX5_POLICY_DOWN	= 0,
	MLX5_POLICY_UP		= 1,
	MLX5_POLICY_FOLLOW	= 2,
	MLX5_POLICY_INVALID	= 0xffffffff
};
|
|
|
|
|
|
|
|
/*
 * Physical port state.
 * NOTE(review): the only enumerator, MLX5_AAA_111, looks like a
 * placeholder; the real state values are not defined here. It is left
 * untouched because code elsewhere may reference it.
 */
enum phy_port_state {
	MLX5_AAA_111
};
|
|
|
|
|
|
|
|
struct mlx5_hca_vport_context {
|
|
|
|
u32 field_select;
|
|
|
|
bool sm_virt_aware;
|
|
|
|
bool has_smi;
|
|
|
|
bool has_raw;
|
|
|
|
enum port_state_policy policy;
|
|
|
|
enum phy_port_state phys_state;
|
|
|
|
enum ib_port_state vport_state;
|
|
|
|
u8 port_physical_state;
|
|
|
|
u64 sys_image_guid;
|
|
|
|
u64 port_guid;
|
|
|
|
u64 node_guid;
|
|
|
|
u32 cap_mask1;
|
|
|
|
u32 cap_mask1_perm;
|
|
|
|
u32 cap_mask2;
|
|
|
|
u32 cap_mask2_perm;
|
|
|
|
u16 lid;
|
|
|
|
u8 init_type_reply; /* bitmask: see ib spec 14.2.5.6 InitTypeReply */
|
|
|
|
u8 lmc;
|
|
|
|
u8 subnet_timeout;
|
|
|
|
u16 sm_lid;
|
|
|
|
u8 sm_sl;
|
|
|
|
u16 qkey_violation_counter;
|
|
|
|
u16 pkey_violation_counter;
|
|
|
|
bool grh_required;
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
static inline void *mlx5_buf_offset(struct mlx5_buf *buf, int offset)
|
|
|
|
{
|
|
|
|
return buf->direct.buf + offset;
|
|
|
|
}
|
|
|
|
|
|
|
|
extern struct workqueue_struct *mlx5_core_wq;
|
|
|
|
|
|
|
|
/*
 * Expands to two designated initializers describing 'field' of
 * struct ib_unpacked_<header>: its byte offset and its size in bytes.
 * Intended for use inside a brace-enclosed initializer, hence the
 * expansion is deliberately not parenthesized.
 */
#define STRUCT_FIELD(header, field) \
	.struct_offset_bytes = offsetof(struct ib_unpacked_ ## header, field),      \
	.struct_size_bytes   = sizeof((struct ib_unpacked_ ## header *)0)->field
|
|
|
|
|
|
|
|
/*
 * Return the driver data stored on 'pdev', typed as the mlx5 core device.
 * NOTE(review): assumes the driver data was set to a struct mlx5_core_dev.
 */
static inline struct mlx5_core_dev *pci2mlx5_core_dev(struct pci_dev *pdev)
{
	return pci_get_drvdata(pdev);
}
|
|
|
|
|
|
|
|
extern struct dentry *mlx5_debugfs_root;
|
|
|
|
|
|
|
|
static inline u16 fw_rev_maj(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->fw_rev) & 0xffff;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u16 fw_rev_min(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->fw_rev) >> 16;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u16 fw_rev_sub(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->cmdif_rev_fw_sub) & 0xffff;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u16 cmdif_rev(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->cmdif_rev_fw_sub) >> 16;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void *mlx5_vzalloc(unsigned long size)
|
|
|
|
{
|
|
|
|
void *rtn;
|
|
|
|
|
|
|
|
rtn = kzalloc(size, GFP_KERNEL | __GFP_NOWARN);
|
|
|
|
if (!rtn)
|
|
|
|
rtn = vzalloc(size);
|
|
|
|
return rtn;
|
|
|
|
}
|
|
|
|
|
2014-02-23 20:19:10 +08:00
|
|
|
/* Return 'key' with its low 8 bits cleared (upper 24 bits kept). */
static inline u32 mlx5_base_mkey(const u32 key)
{
	return key & 0xffffff00u;
}
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_cmd_init(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cmd_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cmd_use_events(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cmd_use_polling(struct mlx5_core_dev *dev);
|
2016-07-20 01:17:12 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/*
 * Takes an input buffer 'in' of 'in_size' and an output buffer 'out' of
 * 'out_size'.
 * NOTE(review): return convention (presumably 0 / negative errno) is not
 * visible in this header.
 */
int mlx5_cmd_exec(struct mlx5_core_dev *dev, void *in, int in_size, void *out,
		  int out_size);
|
2013-10-23 14:53:14 +08:00
|
|
|
/*
 * Variant of mlx5_cmd_exec() that additionally takes a callback of type
 * mlx5_cmd_cbk_t (int status, void *context) and the 'context' to hand it.
 * NOTE(review): when the callback runs is not visible in this header.
 */
int mlx5_cmd_exec_cb(struct mlx5_core_dev *dev, void *in, int in_size,
		     void *out, int out_size, mlx5_cmd_cbk_t callback,
		     void *context);
|
2016-07-20 01:17:12 +08:00
|
|
|
void mlx5_cmd_mbox_status(void *out, u8 *status, u32 *syndrome);
|
|
|
|
|
|
|
|
int mlx5_core_get_caps(struct mlx5_core_dev *dev, enum mlx5_cap_type cap_type);
|
2013-07-07 22:25:49 +08:00
|
|
|
/* UAR / UUAR allocation and mapping declarations. */
int mlx5_cmd_alloc_uar(struct mlx5_core_dev *dev, u32 *uarn);
int mlx5_cmd_free_uar(struct mlx5_core_dev *dev, u32 uarn);
int mlx5_alloc_uuars(struct mlx5_core_dev *dev,
		     struct mlx5_uuar_info *uuari);
int mlx5_free_uuars(struct mlx5_core_dev *dev,
		    struct mlx5_uuar_info *uuari);
int mlx5_alloc_map_uar(struct mlx5_core_dev *mdev,
		       struct mlx5_uar *uar, bool map_wc);
void mlx5_unmap_free_uar(struct mlx5_core_dev *mdev,
			 struct mlx5_uar *uar);
|
2015-10-08 22:14:00 +08:00
|
|
|
/* Health-monitoring declarations: init/cleanup and poll start/stop. */
void mlx5_health_cleanup(struct mlx5_core_dev *dev);
int mlx5_health_init(struct mlx5_core_dev *dev);
void mlx5_start_health_poll(struct mlx5_core_dev *dev);
void mlx5_stop_health_poll(struct mlx5_core_dev *dev);
|
2015-07-24 04:35:57 +08:00
|
|
|
int mlx5_buf_alloc_node(struct mlx5_core_dev *dev, int size,
|
|
|
|
struct mlx5_buf *buf, int node);
|
2015-05-29 03:28:38 +08:00
|
|
|
int mlx5_buf_alloc(struct mlx5_core_dev *dev, int size, struct mlx5_buf *buf);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_buf_free(struct mlx5_core_dev *dev, struct mlx5_buf *buf);
|
|
|
|
struct mlx5_cmd_mailbox *mlx5_alloc_cmd_mailbox_chain(struct mlx5_core_dev *dev,
|
|
|
|
gfp_t flags, int npages);
|
|
|
|
void mlx5_free_cmd_mailbox_chain(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_cmd_mailbox *head);
|
|
|
|
int mlx5_core_create_srq(struct mlx5_core_dev *dev, struct mlx5_core_srq *srq,
|
2016-06-17 20:33:32 +08:00
|
|
|
struct mlx5_srq_attr *in);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_core_destroy_srq(struct mlx5_core_dev *dev, struct mlx5_core_srq *srq);
|
|
|
|
int mlx5_core_query_srq(struct mlx5_core_dev *dev, struct mlx5_core_srq *srq,
|
2016-06-17 20:33:32 +08:00
|
|
|
struct mlx5_srq_attr *out);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_core_arm_srq(struct mlx5_core_dev *dev, struct mlx5_core_srq *srq,
|
|
|
|
u16 lwm, int is_srq);
|
2016-03-01 00:05:28 +08:00
|
|
|
void mlx5_init_mkey_table(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cleanup_mkey_table(struct mlx5_core_dev *dev);
|
2016-07-16 11:28:36 +08:00
|
|
|
int mlx5_core_create_mkey_cb(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_core_mkey *mkey,
|
|
|
|
u32 *in, int inlen,
|
|
|
|
u32 *out, int outlen,
|
|
|
|
mlx5_cmd_cbk_t callback, void *context);
|
2016-03-01 00:05:28 +08:00
|
|
|
int mlx5_core_create_mkey(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_core_mkey *mkey,
|
2016-07-16 11:28:36 +08:00
|
|
|
u32 *in, int inlen);
|
2016-03-01 00:05:28 +08:00
|
|
|
int mlx5_core_destroy_mkey(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_core_mkey *mkey);
|
|
|
|
int mlx5_core_query_mkey(struct mlx5_core_dev *dev, struct mlx5_core_mkey *mkey,
|
2016-07-16 11:28:36 +08:00
|
|
|
u32 *out, int outlen);
|
2016-03-01 00:05:28 +08:00
|
|
|
int mlx5_core_dump_fill_mkey(struct mlx5_core_dev *dev, struct mlx5_core_mkey *_mkey,
|
2013-07-07 22:25:49 +08:00
|
|
|
u32 *mkey);
|
|
|
|
int mlx5_core_alloc_pd(struct mlx5_core_dev *dev, u32 *pdn);
|
|
|
|
int mlx5_core_dealloc_pd(struct mlx5_core_dev *dev, u32 pdn);
|
2015-06-01 05:15:30 +08:00
|
|
|
int mlx5_core_mad_ifc(struct mlx5_core_dev *dev, const void *inb, void *outb,
|
2014-07-29 04:30:23 +08:00
|
|
|
u16 opmod, u8 port);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_pagealloc_init(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_pagealloc_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_pagealloc_start(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_pagealloc_stop(struct mlx5_core_dev *dev);
|
2015-12-02 00:03:09 +08:00
|
|
|
int mlx5_sriov_init(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_sriov_cleanup(struct mlx5_core_dev *dev);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_core_req_pages_handler(struct mlx5_core_dev *dev, u16 func_id,
|
2013-08-14 22:46:48 +08:00
|
|
|
s32 npages);
|
2013-07-18 20:31:08 +08:00
|
|
|
int mlx5_satisfy_startup_pages(struct mlx5_core_dev *dev, int boot);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_reclaim_startup_pages(struct mlx5_core_dev *dev);
|
|
|
|
/* Driver-wide debugfs registration; neither function takes a device argument. */
void mlx5_register_debugfs(void);
void mlx5_unregister_debugfs(void);
|
|
|
|
int mlx5_eq_init(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_eq_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_fill_page_array(struct mlx5_buf *buf, __be64 *pas);
|
|
|
|
void mlx5_cq_completion(struct mlx5_core_dev *dev, u32 cqn);
|
2014-10-02 17:19:45 +08:00
|
|
|
void mlx5_rsc_event(struct mlx5_core_dev *dev, u32 rsn, int event_type);
|
2014-12-11 23:04:19 +08:00
|
|
|
#ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
|
|
|
|
void mlx5_eq_pagefault(struct mlx5_core_dev *dev, struct mlx5_eqe *eqe);
|
|
|
|
#endif
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_srq_event(struct mlx5_core_dev *dev, u32 srqn, int event_type);
|
|
|
|
struct mlx5_core_srq *mlx5_core_get_srq(struct mlx5_core_dev *dev, u32 srqn);
|
2015-10-08 22:13:58 +08:00
|
|
|
void mlx5_cmd_comp_handler(struct mlx5_core_dev *dev, u64 vec);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_cq_event(struct mlx5_core_dev *dev, u32 cqn, int event_type);
|
|
|
|
int mlx5_create_map_eq(struct mlx5_core_dev *dev, struct mlx5_eq *eq, u8 vecidx,
|
|
|
|
int nent, u64 mask, const char *name, struct mlx5_uar *uar);
|
|
|
|
int mlx5_destroy_unmap_eq(struct mlx5_core_dev *dev, struct mlx5_eq *eq);
|
|
|
|
int mlx5_start_eqs(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_stop_eqs(struct mlx5_core_dev *dev);
|
2016-01-17 17:25:47 +08:00
|
|
|
int mlx5_vector2eqn(struct mlx5_core_dev *dev, int vector, int *eqn,
|
|
|
|
unsigned int *irqn);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_core_attach_mcg(struct mlx5_core_dev *dev, union ib_gid *mgid, u32 qpn);
|
|
|
|
int mlx5_core_detach_mcg(struct mlx5_core_dev *dev, union ib_gid *mgid, u32 qpn);
|
|
|
|
|
|
|
|
int mlx5_qp_debugfs_init(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_qp_debugfs_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_core_access_reg(struct mlx5_core_dev *dev, void *data_in,
|
|
|
|
int size_in, void *data_out, int size_out,
|
|
|
|
u16 reg_num, int arg, int write);
|
2015-05-29 03:28:42 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_debug_eq_add(struct mlx5_core_dev *dev, struct mlx5_eq *eq);
|
|
|
|
void mlx5_debug_eq_remove(struct mlx5_core_dev *dev, struct mlx5_eq *eq);
|
|
|
|
int mlx5_core_eq_query(struct mlx5_core_dev *dev, struct mlx5_eq *eq,
|
2016-07-16 08:26:15 +08:00
|
|
|
u32 *out, int outlen);
|
2013-07-07 22:25:49 +08:00
|
|
|
int mlx5_eq_debugfs_init(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_eq_debugfs_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_cq_debugfs_init(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cq_debugfs_cleanup(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_db_alloc(struct mlx5_core_dev *dev, struct mlx5_db *db);
|
2015-07-24 04:35:57 +08:00
|
|
|
int mlx5_db_alloc_node(struct mlx5_core_dev *dev, struct mlx5_db *db,
|
|
|
|
int node);
|
2013-07-07 22:25:49 +08:00
|
|
|
void mlx5_db_free(struct mlx5_core_dev *dev, struct mlx5_db *db);
|
|
|
|
|
|
|
|
const char *mlx5_command_str(int command);
|
|
|
|
int mlx5_cmdif_debugfs_init(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cmdif_debugfs_cleanup(struct mlx5_core_dev *dev);
|
2014-02-23 20:19:06 +08:00
|
|
|
int mlx5_core_create_psv(struct mlx5_core_dev *dev, u32 pdn,
|
|
|
|
int npsvs, u32 *sig_index);
|
|
|
|
int mlx5_core_destroy_psv(struct mlx5_core_dev *dev, int psv_num);
|
2014-10-02 17:19:45 +08:00
|
|
|
void mlx5_core_put_rsc(struct mlx5_core_rsc_common *common);
|
2014-12-11 23:04:19 +08:00
|
|
|
int mlx5_query_odp_caps(struct mlx5_core_dev *dev,
|
|
|
|
struct mlx5_odp_caps *odp_caps);
|
2016-02-19 00:15:00 +08:00
|
|
|
int mlx5_core_query_ib_ppcnt(struct mlx5_core_dev *dev,
|
|
|
|
u8 port_num, void *out, size_t sz);
|
2013-07-07 22:25:49 +08:00
|
|
|
|
2016-06-23 22:02:37 +08:00
|
|
|
int mlx5_init_rl_table(struct mlx5_core_dev *dev);
|
|
|
|
void mlx5_cleanup_rl_table(struct mlx5_core_dev *dev);
|
|
|
|
int mlx5_rl_add_rate(struct mlx5_core_dev *dev, u32 rate, u16 *index);
|
|
|
|
void mlx5_rl_remove_rate(struct mlx5_core_dev *dev, u32 rate);
|
|
|
|
bool mlx5_rl_is_in_range(struct mlx5_core_dev *dev, u32 rate);
|
|
|
|
|
2015-10-14 22:43:47 +08:00
|
|
|
static inline int fw_initializing(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return ioread32be(&dev->iseg->initializing) >> 31;
|
|
|
|
}
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
/*
 * mlx5_mkey_to_idx - drop the low 8 bits of an mkey.
 * @mkey: 32-bit key.
 *
 * Returns @mkey shifted right by 8, i.e. the upper 24 bits.
 */
static inline u32 mlx5_mkey_to_idx(u32 mkey)
{
	u32 idx = mkey >> 8;

	return idx;
}
|
|
|
|
|
|
|
|
/*
 * mlx5_idx_to_mkey - place an index above the low 8 bits of an mkey.
 * @mkey_idx: index value.
 *
 * Returns @mkey_idx shifted left by 8; the low 8 bits of the result are 0.
 */
static inline u32 mlx5_idx_to_mkey(u32 mkey_idx)
{
	u32 mkey = mkey_idx << 8;

	return mkey;
}
|
|
|
|
|
2013-10-23 14:53:14 +08:00
|
|
|
/*
 * mlx5_mkey_variant - low 8 bits of an mkey.
 * @mkey: 32-bit key.
 */
static inline u8 mlx5_mkey_variant(u32 mkey)
{
	u32 low_byte = mkey & 0xff;

	return low_byte;
}
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
enum {
|
|
|
|
MLX5_PROF_MASK_QP_SIZE = (u64)1 << 0,
|
2013-09-11 21:35:25 +08:00
|
|
|
MLX5_PROF_MASK_MR_CACHE = (u64)1 << 1,
|
2013-07-07 22:25:49 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/* Number of elements in the mr_cache[] array of struct mlx5_profile. */
enum {
	MAX_MR_CACHE_ENTRIES	= 16,
};
|
|
|
|
|
2015-04-02 22:07:34 +08:00
|
|
|
/*
 * Protocol identifiers.
 * NOTE(review): presumably the values stored in mlx5_interface.protocol --
 * confirm.
 */
enum {
	MLX5_INTERFACE_PROTOCOL_IB	= 0,
	MLX5_INTERFACE_PROTOCOL_ETH	= 1,
};
|
|
|
|
|
2014-07-29 04:30:22 +08:00
|
|
|
struct mlx5_interface {
|
|
|
|
void * (*add)(struct mlx5_core_dev *dev);
|
|
|
|
void (*remove)(struct mlx5_core_dev *dev, void *context);
|
|
|
|
void (*event)(struct mlx5_core_dev *dev, void *context,
|
2014-07-29 04:30:24 +08:00
|
|
|
enum mlx5_dev_event event, unsigned long param);
|
2015-04-02 22:07:34 +08:00
|
|
|
void * (*get_dev)(void *context);
|
|
|
|
int protocol;
|
2014-07-29 04:30:22 +08:00
|
|
|
struct list_head list;
|
|
|
|
};
|
|
|
|
|
2015-04-02 22:07:34 +08:00
|
|
|
void *mlx5_get_protocol_dev(struct mlx5_core_dev *mdev, int protocol);
|
2014-07-29 04:30:22 +08:00
|
|
|
int mlx5_register_interface(struct mlx5_interface *intf);
|
|
|
|
void mlx5_unregister_interface(struct mlx5_interface *intf);
|
2015-06-05 00:30:42 +08:00
|
|
|
int mlx5_core_query_vendor_id(struct mlx5_core_dev *mdev, u32 *vendor_id);
|
2014-07-29 04:30:22 +08:00
|
|
|
|
net/mlx5: Implement RoCE LAG feature
Available on dual port cards only, this feature keeps
track, using netdev LAG events, of the bonding
and link status of each port's PF netdev.
When both of the card's PF netdevs are enslaved to the
same bond/team master, and only them, LAG state
is active.
During LAG, only one IB device is present for both ports.
In addition to the above, this commit includes FW commands
used for managing the LAG, new facilities for adding and removing
a single device by interface, and port remap functionality according to
bond events.
Please note that this feature is currently used only for mimicking
Ethernet bonding for RoCE - netdevs functionality is not altered,
and their bonding continues to be managed solely by bond/team driver.
Signed-off-by: Aviv Heller <avivh@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
2016-04-17 21:57:32 +08:00
|
|
|
/* LAG query declarations: active state and the associated RoCE net_device. */
bool mlx5_lag_is_active(struct mlx5_core_dev *dev);
struct net_device *
mlx5_lag_get_roce_netdev(struct mlx5_core_dev *dev);
|
net/mlx5: Implement RoCE LAG feature
Available on dual port cards only, this feature keeps
track, using netdev LAG events, of the bonding
and link status of each port's PF netdev.
When both of the card's PF netdevs are enslaved to the
same bond/team master, and only them, LAG state
is active.
During LAG, only one IB device is present for both ports.
In addition to the above, this commit includes FW commands
used for managing the LAG, new facilities for adding and removing
a single device by interface, and port remap functionality according to
bond events.
Please note that this feature is currently used only for mimicking
Ethernet bonding for RoCE - netdevs functionality is not altered,
and their bonding continues to be managed solely by bond/team driver.
Signed-off-by: Aviv Heller <avivh@mellanox.com>
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
Signed-off-by: Leon Romanovsky <leon@kernel.org>
2016-04-17 21:57:32 +08:00
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
struct mlx5_profile {
|
|
|
|
u64 mask;
|
2014-07-29 04:30:23 +08:00
|
|
|
u8 log_max_qp;
|
2013-07-07 22:25:49 +08:00
|
|
|
struct {
|
|
|
|
int size;
|
|
|
|
int limit;
|
|
|
|
} mr_cache[MAX_MR_CACHE_ENTRIES];
|
|
|
|
};
|
|
|
|
|
2015-12-02 00:03:09 +08:00
|
|
|
/* Flag bit tested against dev->priv.pci_dev_data by mlx5_core_is_pf(). */
enum {
	MLX5_PCI_DEV_IS_VF	= 1 << 0,
};
|
|
|
|
|
|
|
|
static inline int mlx5_core_is_pf(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return !(dev->priv.pci_dev_data & MLX5_PCI_DEV_IS_VF);
|
|
|
|
}
|
|
|
|
|
2015-06-05 00:30:41 +08:00
|
|
|
/*
 * mlx5_get_gid_table_len - decode a GID table length parameter.
 * @param: encoded length; values 0..4 are accepted.
 *
 * For @param in 0..4 returns 8 * 2^@param (8, 16, 32, 64 or 128). For any
 * larger value a warning is logged and 0 is returned.
 */
static inline int mlx5_get_gid_table_len(u16 param)
{
	if (param <= 4)
		return 8 << param;

	pr_warn("gid table length is zero\n");
	return 0;
}
|
|
|
|
|
2016-06-23 22:02:37 +08:00
|
|
|
static inline bool mlx5_rl_is_supported(struct mlx5_core_dev *dev)
|
|
|
|
{
|
|
|
|
return !!(dev->priv.rl_table.max_size);
|
|
|
|
}
|
|
|
|
|
2015-10-08 22:13:58 +08:00
|
|
|
enum {
|
|
|
|
MLX5_TRIGGERED_CMD_COMP = (u64)1 << 32,
|
|
|
|
};
|
|
|
|
|
2013-07-07 22:25:49 +08:00
|
|
|
#endif /* MLX5_DRIVER_H */
|