skd: Reduce memory usage

Every single coherent DMA memory buffer occupies at least one page.
Reduce memory usage by switching from coherent buffers to streaming
DMA for I/O requests (struct skd_fitmsg_context) and S/G-lists
(struct fit_sg_descriptor[]).

Signed-off-by: Bart Van Assche <bart.vanassche@wdc.com>
Cc: Christoph Hellwig <hch@lst.de>
Cc: Hannes Reinecke <hare@suse.de>
Cc: Johannes Thumshirn <jthumshirn@suse.de>
Signed-off-by: Jens Axboe <axboe@kernel.dk>
This commit is contained in:
Bart Van Assche 2017-08-17 13:13:35 -07:00 committed by Jens Axboe
parent d4d0f5fc3a
commit a3db102def
1 changed files with 108 additions and 37 deletions

View File

@ -32,6 +32,7 @@
#include <linux/aer.h> #include <linux/aer.h>
#include <linux/wait.h> #include <linux/wait.h>
#include <linux/stringify.h> #include <linux/stringify.h>
#include <linux/slab_def.h>
#include <scsi/scsi.h> #include <scsi/scsi.h>
#include <scsi/sg.h> #include <scsi/sg.h>
#include <linux/io.h> #include <linux/io.h>
@ -256,6 +257,9 @@ struct skd_device {
u8 skcomp_cycle; u8 skcomp_cycle;
u32 skcomp_ix; u32 skcomp_ix;
struct kmem_cache *msgbuf_cache;
struct kmem_cache *sglist_cache;
struct kmem_cache *databuf_cache;
struct fit_completion_entry_v1 *skcomp_table; struct fit_completion_entry_v1 *skcomp_table;
struct fit_comp_error_info *skerr_table; struct fit_comp_error_info *skerr_table;
dma_addr_t cq_dma_address; dma_addr_t cq_dma_address;
@ -538,6 +542,11 @@ static void skd_process_request(struct request *req, bool last)
return; return;
} }
dma_sync_single_for_device(&skdev->pdev->dev, skreq->sksg_dma_address,
skreq->n_sg *
sizeof(struct fit_sg_descriptor),
DMA_TO_DEVICE);
spin_lock_irqsave(&skdev->lock, flags); spin_lock_irqsave(&skdev->lock, flags);
/* Either a FIT msg is in progress or we have to start one. */ /* Either a FIT msg is in progress or we have to start one. */
skmsg = skdev->skmsg; skmsg = skdev->skmsg;
@ -1078,6 +1087,11 @@ static void skd_complete_internal(struct skd_device *skdev,
dev_dbg(&skdev->pdev->dev, "complete internal %x\n", scsi->cdb[0]); dev_dbg(&skdev->pdev->dev, "complete internal %x\n", scsi->cdb[0]);
dma_sync_single_for_cpu(&skdev->pdev->dev,
skspcl->db_dma_address,
skspcl->req.sksg_list[0].byte_count,
DMA_BIDIRECTIONAL);
skspcl->req.completion = *skcomp; skspcl->req.completion = *skcomp;
skspcl->req.state = SKD_REQ_STATE_IDLE; skspcl->req.state = SKD_REQ_STATE_IDLE;
skspcl->req.id += SKD_ID_INCR; skspcl->req.id += SKD_ID_INCR;
@ -1263,6 +1277,9 @@ static void skd_send_fitmsg(struct skd_device *skdev,
*/ */
qcmd |= FIT_QCMD_MSGSIZE_64; qcmd |= FIT_QCMD_MSGSIZE_64;
dma_sync_single_for_device(&skdev->pdev->dev, skmsg->mb_dma_address,
skmsg->length, DMA_TO_DEVICE);
/* Make sure skd_msg_buf is written before the doorbell is triggered. */ /* Make sure skd_msg_buf is written before the doorbell is triggered. */
smp_wmb(); smp_wmb();
@ -1274,6 +1291,8 @@ static void skd_send_special_fitmsg(struct skd_device *skdev,
{ {
u64 qcmd; u64 qcmd;
WARN_ON_ONCE(skspcl->req.n_sg != 1);
if (unlikely(skdev->dbg_level > 1)) { if (unlikely(skdev->dbg_level > 1)) {
u8 *bp = (u8 *)skspcl->msg_buf; u8 *bp = (u8 *)skspcl->msg_buf;
int i; int i;
@ -1307,6 +1326,17 @@ static void skd_send_special_fitmsg(struct skd_device *skdev,
qcmd = skspcl->mb_dma_address; qcmd = skspcl->mb_dma_address;
qcmd |= FIT_QCMD_QID_NORMAL + FIT_QCMD_MSGSIZE_128; qcmd |= FIT_QCMD_QID_NORMAL + FIT_QCMD_MSGSIZE_128;
dma_sync_single_for_device(&skdev->pdev->dev, skspcl->mb_dma_address,
SKD_N_SPECIAL_FITMSG_BYTES, DMA_TO_DEVICE);
dma_sync_single_for_device(&skdev->pdev->dev,
skspcl->req.sksg_dma_address,
1 * sizeof(struct fit_sg_descriptor),
DMA_TO_DEVICE);
dma_sync_single_for_device(&skdev->pdev->dev,
skspcl->db_dma_address,
skspcl->req.sksg_list[0].byte_count,
DMA_BIDIRECTIONAL);
/* Make sure skd_msg_buf is written before the doorbell is triggered. */ /* Make sure skd_msg_buf is written before the doorbell is triggered. */
smp_wmb(); smp_wmb();
@ -2619,6 +2649,35 @@ static void skd_release_irq(struct skd_device *skdev)
***************************************************************************** *****************************************************************************
*/ */
static void *skd_alloc_dma(struct skd_device *skdev, struct kmem_cache *s,
dma_addr_t *dma_handle, gfp_t gfp,
enum dma_data_direction dir)
{
struct device *dev = &skdev->pdev->dev;
void *buf;
buf = kmem_cache_alloc(s, gfp);
if (!buf)
return NULL;
*dma_handle = dma_map_single(dev, buf, s->size, dir);
if (dma_mapping_error(dev, *dma_handle)) {
kfree(buf);
buf = NULL;
}
return buf;
}
static void skd_free_dma(struct skd_device *skdev, struct kmem_cache *s,
void *vaddr, dma_addr_t dma_handle,
enum dma_data_direction dir)
{
if (!vaddr)
return;
dma_unmap_single(&skdev->pdev->dev, dma_handle, s->size, dir);
kmem_cache_free(s, vaddr);
}
static int skd_cons_skcomp(struct skd_device *skdev) static int skd_cons_skcomp(struct skd_device *skdev)
{ {
int rc = 0; int rc = 0;
@ -2695,18 +2754,14 @@ static struct fit_sg_descriptor *skd_cons_sg_list(struct skd_device *skdev,
dma_addr_t *ret_dma_addr) dma_addr_t *ret_dma_addr)
{ {
struct fit_sg_descriptor *sg_list; struct fit_sg_descriptor *sg_list;
u32 nbytes;
nbytes = sizeof(*sg_list) * n_sg; sg_list = skd_alloc_dma(skdev, skdev->sglist_cache, ret_dma_addr,
GFP_DMA | __GFP_ZERO, DMA_TO_DEVICE);
sg_list = pci_alloc_consistent(skdev->pdev, nbytes, ret_dma_addr);
if (sg_list != NULL) { if (sg_list != NULL) {
uint64_t dma_address = *ret_dma_addr; uint64_t dma_address = *ret_dma_addr;
u32 i; u32 i;
memset(sg_list, 0, nbytes);
for (i = 0; i < n_sg - 1; i++) { for (i = 0; i < n_sg - 1; i++) {
uint64_t ndp_off; uint64_t ndp_off;
ndp_off = (i + 1) * sizeof(struct fit_sg_descriptor); ndp_off = (i + 1) * sizeof(struct fit_sg_descriptor);
@ -2720,15 +2775,14 @@ static struct fit_sg_descriptor *skd_cons_sg_list(struct skd_device *skdev,
} }
static void skd_free_sg_list(struct skd_device *skdev, static void skd_free_sg_list(struct skd_device *skdev,
struct fit_sg_descriptor *sg_list, u32 n_sg, struct fit_sg_descriptor *sg_list,
dma_addr_t dma_addr) dma_addr_t dma_addr)
{ {
u32 nbytes = sizeof(*sg_list) * n_sg;
if (WARN_ON_ONCE(!sg_list)) if (WARN_ON_ONCE(!sg_list))
return; return;
pci_free_consistent(skdev->pdev, nbytes, sg_list, dma_addr); skd_free_dma(skdev, skdev->sglist_cache, sg_list, dma_addr,
DMA_TO_DEVICE);
} }
static int skd_init_request(struct blk_mq_tag_set *set, struct request *rq, static int skd_init_request(struct blk_mq_tag_set *set, struct request *rq,
@ -2752,34 +2806,31 @@ static void skd_exit_request(struct blk_mq_tag_set *set, struct request *rq,
struct skd_device *skdev = set->driver_data; struct skd_device *skdev = set->driver_data;
struct skd_request_context *skreq = blk_mq_rq_to_pdu(rq); struct skd_request_context *skreq = blk_mq_rq_to_pdu(rq);
skd_free_sg_list(skdev, skreq->sksg_list, skd_free_sg_list(skdev, skreq->sksg_list, skreq->sksg_dma_address);
skdev->sgs_per_request,
skreq->sksg_dma_address);
} }
static int skd_cons_sksb(struct skd_device *skdev) static int skd_cons_sksb(struct skd_device *skdev)
{ {
int rc = 0; int rc = 0;
struct skd_special_context *skspcl; struct skd_special_context *skspcl;
u32 nbytes;
skspcl = &skdev->internal_skspcl; skspcl = &skdev->internal_skspcl;
skspcl->req.id = 0 + SKD_ID_INTERNAL; skspcl->req.id = 0 + SKD_ID_INTERNAL;
skspcl->req.state = SKD_REQ_STATE_IDLE; skspcl->req.state = SKD_REQ_STATE_IDLE;
nbytes = SKD_N_INTERNAL_BYTES; skspcl->data_buf = skd_alloc_dma(skdev, skdev->databuf_cache,
&skspcl->db_dma_address,
skspcl->data_buf = pci_zalloc_consistent(skdev->pdev, nbytes, GFP_DMA | __GFP_ZERO,
&skspcl->db_dma_address); DMA_BIDIRECTIONAL);
if (skspcl->data_buf == NULL) { if (skspcl->data_buf == NULL) {
rc = -ENOMEM; rc = -ENOMEM;
goto err_out; goto err_out;
} }
nbytes = SKD_N_SPECIAL_FITMSG_BYTES; skspcl->msg_buf = skd_alloc_dma(skdev, skdev->msgbuf_cache,
skspcl->msg_buf = pci_zalloc_consistent(skdev->pdev, nbytes, &skspcl->mb_dma_address,
&skspcl->mb_dma_address); GFP_DMA | __GFP_ZERO, DMA_TO_DEVICE);
if (skspcl->msg_buf == NULL) { if (skspcl->msg_buf == NULL) {
rc = -ENOMEM; rc = -ENOMEM;
goto err_out; goto err_out;
@ -2886,6 +2937,7 @@ static struct skd_device *skd_construct(struct pci_dev *pdev)
{ {
struct skd_device *skdev; struct skd_device *skdev;
int blk_major = skd_major; int blk_major = skd_major;
size_t size;
int rc; int rc;
skdev = kzalloc(sizeof(*skdev), GFP_KERNEL); skdev = kzalloc(sizeof(*skdev), GFP_KERNEL);
@ -2914,6 +2966,31 @@ static struct skd_device *skd_construct(struct pci_dev *pdev)
INIT_WORK(&skdev->start_queue, skd_start_queue); INIT_WORK(&skdev->start_queue, skd_start_queue);
INIT_WORK(&skdev->completion_worker, skd_completion_worker); INIT_WORK(&skdev->completion_worker, skd_completion_worker);
size = max(SKD_N_FITMSG_BYTES, SKD_N_SPECIAL_FITMSG_BYTES);
skdev->msgbuf_cache = kmem_cache_create("skd-msgbuf", size, 0,
SLAB_HWCACHE_ALIGN, NULL);
if (!skdev->msgbuf_cache)
goto err_out;
WARN_ONCE(kmem_cache_size(skdev->msgbuf_cache) < size,
"skd-msgbuf: %d < %zd\n",
kmem_cache_size(skdev->msgbuf_cache), size);
size = skd_sgs_per_request * sizeof(struct fit_sg_descriptor);
skdev->sglist_cache = kmem_cache_create("skd-sglist", size, 0,
SLAB_HWCACHE_ALIGN, NULL);
if (!skdev->sglist_cache)
goto err_out;
WARN_ONCE(kmem_cache_size(skdev->sglist_cache) < size,
"skd-sglist: %d < %zd\n",
kmem_cache_size(skdev->sglist_cache), size);
size = SKD_N_INTERNAL_BYTES;
skdev->databuf_cache = kmem_cache_create("skd-databuf", size, 0,
SLAB_HWCACHE_ALIGN, NULL);
if (!skdev->databuf_cache)
goto err_out;
WARN_ONCE(kmem_cache_size(skdev->databuf_cache) < size,
"skd-databuf: %d < %zd\n",
kmem_cache_size(skdev->databuf_cache), size);
dev_dbg(&skdev->pdev->dev, "skcomp\n"); dev_dbg(&skdev->pdev->dev, "skcomp\n");
rc = skd_cons_skcomp(skdev); rc = skd_cons_skcomp(skdev);
if (rc < 0) if (rc < 0)
@ -2986,31 +3063,21 @@ static void skd_free_skmsg(struct skd_device *skdev)
static void skd_free_sksb(struct skd_device *skdev) static void skd_free_sksb(struct skd_device *skdev)
{ {
struct skd_special_context *skspcl; struct skd_special_context *skspcl = &skdev->internal_skspcl;
u32 nbytes;
skspcl = &skdev->internal_skspcl; skd_free_dma(skdev, skdev->databuf_cache, skspcl->data_buf,
skspcl->db_dma_address, DMA_BIDIRECTIONAL);
if (skspcl->data_buf != NULL) {
nbytes = SKD_N_INTERNAL_BYTES;
pci_free_consistent(skdev->pdev, nbytes,
skspcl->data_buf, skspcl->db_dma_address);
}
skspcl->data_buf = NULL; skspcl->data_buf = NULL;
skspcl->db_dma_address = 0; skspcl->db_dma_address = 0;
if (skspcl->msg_buf != NULL) { skd_free_dma(skdev, skdev->msgbuf_cache, skspcl->msg_buf,
nbytes = SKD_N_SPECIAL_FITMSG_BYTES; skspcl->mb_dma_address, DMA_TO_DEVICE);
pci_free_consistent(skdev->pdev, nbytes,
skspcl->msg_buf, skspcl->mb_dma_address);
}
skspcl->msg_buf = NULL; skspcl->msg_buf = NULL;
skspcl->mb_dma_address = 0; skspcl->mb_dma_address = 0;
skd_free_sg_list(skdev, skspcl->req.sksg_list, 1, skd_free_sg_list(skdev, skspcl->req.sksg_list,
skspcl->req.sksg_dma_address); skspcl->req.sksg_dma_address);
skspcl->req.sksg_list = NULL; skspcl->req.sksg_list = NULL;
@ -3056,6 +3123,10 @@ static void skd_destruct(struct skd_device *skdev)
dev_dbg(&skdev->pdev->dev, "skcomp\n"); dev_dbg(&skdev->pdev->dev, "skcomp\n");
skd_free_skcomp(skdev); skd_free_skcomp(skdev);
kmem_cache_destroy(skdev->databuf_cache);
kmem_cache_destroy(skdev->sglist_cache);
kmem_cache_destroy(skdev->msgbuf_cache);
dev_dbg(&skdev->pdev->dev, "skdev\n"); dev_dbg(&skdev->pdev->dev, "skdev\n");
kfree(skdev); kfree(skdev);
} }