Commit ea85a20c authored by James Smart's avatar James Smart Committed by Martin K. Petersen

scsi: lpfc: Remove lock contention target write path

Lower IOps performance with write operations. Perf tool shows lock
contention in dma_pool_alloc and dma_pool_free related to the
txrdy_payload_pool.

The allocations are for dma buffers for XFER_RDY's, which actually are not
needed for the FCP_TRECEIVE command as the command contents are used by the
adapter to generate the IU.

Remove the allocations and the associated buffer pool.  Rather than leaving
NULLs in buffer pointer locations, set command and sgl to indicate skipped
SGLE indexes.

Link: https://lore.kernel.org/r/20191018211832.7917-10-jsmart2021@gmail.comSigned-off-by: default avatarDick Kennedy <dick.kennedy@broadcom.com>
Signed-off-by: default avatarJames Smart <jsmart2021@gmail.com>
Signed-off-by: default avatarMartin K. Petersen <martin.petersen@oracle.com>
parent 22770cba
...@@ -989,7 +989,6 @@ struct lpfc_hba { ...@@ -989,7 +989,6 @@ struct lpfc_hba {
struct dma_pool *lpfc_drb_pool; /* data receive buffer pool */ struct dma_pool *lpfc_drb_pool; /* data receive buffer pool */
struct dma_pool *lpfc_nvmet_drb_pool; /* data receive buffer pool */ struct dma_pool *lpfc_nvmet_drb_pool; /* data receive buffer pool */
struct dma_pool *lpfc_hbq_pool; /* SLI3 hbq buffer pool */ struct dma_pool *lpfc_hbq_pool; /* SLI3 hbq buffer pool */
struct dma_pool *txrdy_payload_pool;
struct dma_pool *lpfc_cmd_rsp_buf_pool; struct dma_pool *lpfc_cmd_rsp_buf_pool;
struct lpfc_dma_pool lpfc_mbuf_safety_pool; struct lpfc_dma_pool lpfc_mbuf_safety_pool;
......
...@@ -7556,19 +7556,11 @@ lpfc_create_shost(struct lpfc_hba *phba) ...@@ -7556,19 +7556,11 @@ lpfc_create_shost(struct lpfc_hba *phba)
if (phba->nvmet_support) { if (phba->nvmet_support) {
/* Only 1 vport (pport) will support NVME target */ /* Only 1 vport (pport) will support NVME target */
if (phba->txrdy_payload_pool == NULL) {
phba->txrdy_payload_pool = dma_pool_create(
"txrdy_pool", &phba->pcidev->dev,
TXRDY_PAYLOAD_LEN, 16, 0);
if (phba->txrdy_payload_pool) {
phba->targetport = NULL; phba->targetport = NULL;
phba->cfg_enable_fc4_type = LPFC_ENABLE_NVME; phba->cfg_enable_fc4_type = LPFC_ENABLE_NVME;
lpfc_printf_log(phba, KERN_INFO, lpfc_printf_log(phba, KERN_INFO, LOG_INIT | LOG_NVME_DISC,
LOG_INIT | LOG_NVME_DISC,
"6076 NVME Target Found\n"); "6076 NVME Target Found\n");
} }
}
}
lpfc_debugfs_initialize(vport); lpfc_debugfs_initialize(vport);
/* Put reference to SCSI host to driver's device private data */ /* Put reference to SCSI host to driver's device private data */
......
...@@ -230,9 +230,6 @@ lpfc_mem_free(struct lpfc_hba *phba) ...@@ -230,9 +230,6 @@ lpfc_mem_free(struct lpfc_hba *phba)
dma_pool_destroy(phba->lpfc_hrb_pool); dma_pool_destroy(phba->lpfc_hrb_pool);
phba->lpfc_hrb_pool = NULL; phba->lpfc_hrb_pool = NULL;
dma_pool_destroy(phba->txrdy_payload_pool);
phba->txrdy_payload_pool = NULL;
dma_pool_destroy(phba->lpfc_hbq_pool); dma_pool_destroy(phba->lpfc_hbq_pool);
phba->lpfc_hbq_pool = NULL; phba->lpfc_hbq_pool = NULL;
......
...@@ -378,13 +378,6 @@ lpfc_nvmet_ctxbuf_post(struct lpfc_hba *phba, struct lpfc_nvmet_ctxbuf *ctx_buf) ...@@ -378,13 +378,6 @@ lpfc_nvmet_ctxbuf_post(struct lpfc_hba *phba, struct lpfc_nvmet_ctxbuf *ctx_buf)
int cpu; int cpu;
unsigned long iflag; unsigned long iflag;
if (ctxp->txrdy) {
dma_pool_free(phba->txrdy_payload_pool, ctxp->txrdy,
ctxp->txrdy_phys);
ctxp->txrdy = NULL;
ctxp->txrdy_phys = 0;
}
if (ctxp->state == LPFC_NVMET_STE_FREE) { if (ctxp->state == LPFC_NVMET_STE_FREE) {
lpfc_printf_log(phba, KERN_ERR, LOG_NVME_IOERR, lpfc_printf_log(phba, KERN_ERR, LOG_NVME_IOERR,
"6411 NVMET free, already free IO x%x: %d %d\n", "6411 NVMET free, already free IO x%x: %d %d\n",
...@@ -430,7 +423,6 @@ lpfc_nvmet_ctxbuf_post(struct lpfc_hba *phba, struct lpfc_nvmet_ctxbuf *ctx_buf) ...@@ -430,7 +423,6 @@ lpfc_nvmet_ctxbuf_post(struct lpfc_hba *phba, struct lpfc_nvmet_ctxbuf *ctx_buf)
ctxp = (struct lpfc_nvmet_rcv_ctx *)ctx_buf->context; ctxp = (struct lpfc_nvmet_rcv_ctx *)ctx_buf->context;
ctxp->wqeq = NULL; ctxp->wqeq = NULL;
ctxp->txrdy = NULL;
ctxp->offset = 0; ctxp->offset = 0;
ctxp->phba = phba; ctxp->phba = phba;
ctxp->size = size; ctxp->size = size;
...@@ -2327,7 +2319,6 @@ lpfc_nvmet_unsol_fcp_buffer(struct lpfc_hba *phba, ...@@ -2327,7 +2319,6 @@ lpfc_nvmet_unsol_fcp_buffer(struct lpfc_hba *phba,
ctxp->state, ctxp->entry_cnt, ctxp->oxid); ctxp->state, ctxp->entry_cnt, ctxp->oxid);
} }
ctxp->wqeq = NULL; ctxp->wqeq = NULL;
ctxp->txrdy = NULL;
ctxp->offset = 0; ctxp->offset = 0;
ctxp->phba = phba; ctxp->phba = phba;
ctxp->size = size; ctxp->size = size;
...@@ -2606,7 +2597,6 @@ lpfc_nvmet_prep_fcp_wqe(struct lpfc_hba *phba, ...@@ -2606,7 +2597,6 @@ lpfc_nvmet_prep_fcp_wqe(struct lpfc_hba *phba,
struct scatterlist *sgel; struct scatterlist *sgel;
union lpfc_wqe128 *wqe; union lpfc_wqe128 *wqe;
struct ulp_bde64 *bde; struct ulp_bde64 *bde;
uint32_t *txrdy;
dma_addr_t physaddr; dma_addr_t physaddr;
int i, cnt; int i, cnt;
int do_pbde; int do_pbde;
...@@ -2768,23 +2758,11 @@ lpfc_nvmet_prep_fcp_wqe(struct lpfc_hba *phba, ...@@ -2768,23 +2758,11 @@ lpfc_nvmet_prep_fcp_wqe(struct lpfc_hba *phba,
&lpfc_treceive_cmd_template.words[3], &lpfc_treceive_cmd_template.words[3],
sizeof(uint32_t) * 9); sizeof(uint32_t) * 9);
/* Words 0 - 2 : The first sg segment */ /* Words 0 - 2 : First SGE is skipped, set invalid BDE type */
txrdy = dma_pool_alloc(phba->txrdy_payload_pool, wqe->fcp_treceive.bde.tus.f.bdeFlags = LPFC_SGE_TYPE_SKIP;
GFP_KERNEL, &physaddr); wqe->fcp_treceive.bde.tus.f.bdeSize = 0;
if (!txrdy) { wqe->fcp_treceive.bde.addrLow = 0;
lpfc_printf_log(phba, KERN_ERR, LOG_NVME_IOERR, wqe->fcp_treceive.bde.addrHigh = 0;
"6041 Bad txrdy buffer: oxid x%x\n",
ctxp->oxid);
return NULL;
}
ctxp->txrdy = txrdy;
ctxp->txrdy_phys = physaddr;
wqe->fcp_treceive.bde.tus.f.bdeFlags = BUFF_TYPE_BDE_64;
wqe->fcp_treceive.bde.tus.f.bdeSize = TXRDY_PAYLOAD_LEN;
wqe->fcp_treceive.bde.addrLow =
cpu_to_le32(putPaddrLow(physaddr));
wqe->fcp_treceive.bde.addrHigh =
cpu_to_le32(putPaddrHigh(physaddr));
/* Word 4 */ /* Word 4 */
wqe->fcp_treceive.relative_offset = ctxp->offset; wqe->fcp_treceive.relative_offset = ctxp->offset;
...@@ -2819,17 +2797,13 @@ lpfc_nvmet_prep_fcp_wqe(struct lpfc_hba *phba, ...@@ -2819,17 +2797,13 @@ lpfc_nvmet_prep_fcp_wqe(struct lpfc_hba *phba,
/* Word 12 */ /* Word 12 */
wqe->fcp_tsend.fcp_data_len = rsp->transfer_length; wqe->fcp_tsend.fcp_data_len = rsp->transfer_length;
/* Setup 1 TXRDY and 1 SKIP SGE */ /* Setup 2 SKIP SGEs */
txrdy[0] = 0; sgl->addr_hi = 0;
txrdy[1] = cpu_to_be32(rsp->transfer_length); sgl->addr_lo = 0;
txrdy[2] = 0;
sgl->addr_hi = putPaddrHigh(physaddr);
sgl->addr_lo = putPaddrLow(physaddr);
sgl->word2 = 0; sgl->word2 = 0;
bf_set(lpfc_sli4_sge_type, sgl, LPFC_SGE_TYPE_DATA); bf_set(lpfc_sli4_sge_type, sgl, LPFC_SGE_TYPE_SKIP);
sgl->word2 = cpu_to_le32(sgl->word2); sgl->word2 = cpu_to_le32(sgl->word2);
sgl->sge_len = cpu_to_le32(TXRDY_PAYLOAD_LEN); sgl->sge_len = 0;
sgl++; sgl++;
sgl->addr_hi = 0; sgl->addr_hi = 0;
sgl->addr_lo = 0; sgl->addr_lo = 0;
......
...@@ -112,9 +112,7 @@ struct lpfc_nvmet_rcv_ctx { ...@@ -112,9 +112,7 @@ struct lpfc_nvmet_rcv_ctx {
struct lpfc_hba *phba; struct lpfc_hba *phba;
struct lpfc_iocbq *wqeq; struct lpfc_iocbq *wqeq;
struct lpfc_iocbq *abort_wqeq; struct lpfc_iocbq *abort_wqeq;
dma_addr_t txrdy_phys;
spinlock_t ctxlock; /* protect flag access */ spinlock_t ctxlock; /* protect flag access */
uint32_t *txrdy;
uint32_t sid; uint32_t sid;
uint32_t offset; uint32_t offset;
uint16_t oxid; uint16_t oxid;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment