scsi: elx: efct: Hardware queues processing

Add driver definitions for:

 - Routines for EQ, CQ, WQ and RQ processing.

 - Routines for I/O object pool allocation and deallocation.

Link: https://lore.kernel.org/r/20210601235512.20104-23-jsmart2021@gmail.com
Reviewed-by: Hannes Reinecke <hare@suse.de>
Reviewed-by: Daniel Wagner <dwagner@suse.de>
Co-developed-by: Ram Vegesna <ram.vegesna@broadcom.com>
Signed-off-by: Ram Vegesna <ram.vegesna@broadcom.com>
Signed-off-by: James Smart <jsmart2021@gmail.com>
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
This commit is contained in:
James Smart 2021-06-01 16:55:03 -07:00 committed by Martin K. Petersen
parent 63de51327a
commit e2cf422ba8
4 changed files with 764 additions and 0 deletions

View File

@ -2131,3 +2131,363 @@ efct_hw_reqtag_get_instance(struct efct_hw *hw, u32 instance_index)
return wqcb;
}
int
efct_hw_queue_hash_find(struct efct_queue_hash *hash, u16 id)
{
int index = -1;
int i = id & (EFCT_HW_Q_HASH_SIZE - 1);
/*
* Since the hash is always bigger than the maximum number of Qs, then
* we never have to worry about an infinite loop. We will always find
* an unused entry.
*/
do {
if (hash[i].in_use && hash[i].id == id)
index = hash[i].index;
else
i = (i + 1) & (EFCT_HW_Q_HASH_SIZE - 1);
} while (index == -1 && hash[i].in_use);
return index;
}
int
efct_hw_process(struct efct_hw *hw, u32 vector,
u32 max_isr_time_msec)
{
struct hw_eq *eq;
/*
* The caller should disable interrupts if they wish to prevent us
* from processing during a shutdown. The following states are defined:
* EFCT_HW_STATE_UNINITIALIZED - No queues allocated
* EFCT_HW_STATE_QUEUES_ALLOCATED - The state after a chip reset,
* queues are cleared.
* EFCT_HW_STATE_ACTIVE - Chip and queues are operational
* EFCT_HW_STATE_RESET_IN_PROGRESS - reset, we still want completions
* EFCT_HW_STATE_TEARDOWN_IN_PROGRESS - We still want mailbox
* completions.
*/
if (hw->state == EFCT_HW_STATE_UNINITIALIZED)
return 0;
/* Get pointer to struct hw_eq */
eq = hw->hw_eq[vector];
if (!eq)
return 0;
eq->use_count++;
return efct_hw_eq_process(hw, eq, max_isr_time_msec);
}
int
efct_hw_eq_process(struct efct_hw *hw, struct hw_eq *eq,
u32 max_isr_time_msec)
{
u8 eqe[sizeof(struct sli4_eqe)] = { 0 };
u32 tcheck_count;
u64 tstart;
u64 telapsed;
bool done = false;
tcheck_count = EFCT_HW_TIMECHECK_ITERATIONS;
tstart = jiffies_to_msecs(jiffies);
while (!done && !sli_eq_read(&hw->sli, eq->queue, eqe)) {
u16 cq_id = 0;
int rc;
rc = sli_eq_parse(&hw->sli, eqe, &cq_id);
if (unlikely(rc)) {
if (rc == SLI4_EQE_STATUS_EQ_FULL) {
u32 i;
/*
* Received a sentinel EQE indicating the
* EQ is full. Process all CQs
*/
for (i = 0; i < hw->cq_count; i++)
efct_hw_cq_process(hw, hw->hw_cq[i]);
continue;
} else {
return rc;
}
} else {
int index;
index = efct_hw_queue_hash_find(hw->cq_hash, cq_id);
if (likely(index >= 0))
efct_hw_cq_process(hw, hw->hw_cq[index]);
else
efc_log_err(hw->os, "bad CQ_ID %#06x\n", cq_id);
}
if (eq->queue->n_posted > eq->queue->posted_limit)
sli_queue_arm(&hw->sli, eq->queue, false);
if (tcheck_count && (--tcheck_count == 0)) {
tcheck_count = EFCT_HW_TIMECHECK_ITERATIONS;
telapsed = jiffies_to_msecs(jiffies) - tstart;
if (telapsed >= max_isr_time_msec)
done = true;
}
}
sli_queue_eq_arm(&hw->sli, eq->queue, true);
return 0;
}
static int
_efct_hw_wq_write(struct hw_wq *wq, struct efct_hw_wqe *wqe)
{
int queue_rc;
/* Every so often, set the wqec bit to generate comsummed completions */
if (wq->wqec_count)
wq->wqec_count--;
if (wq->wqec_count == 0) {
struct sli4_generic_wqe *genwqe = (void *)wqe->wqebuf;
genwqe->cmdtype_wqec_byte |= SLI4_GEN_WQE_WQEC;
wq->wqec_count = wq->wqec_set_count;
}
/* Decrement WQ free count */
wq->free_count--;
queue_rc = sli_wq_write(&wq->hw->sli, wq->queue, wqe->wqebuf);
return (queue_rc < 0) ? -EIO : 0;
}
static void
hw_wq_submit_pending(struct hw_wq *wq, u32 update_free_count)
{
struct efct_hw_wqe *wqe;
unsigned long flags = 0;
spin_lock_irqsave(&wq->queue->lock, flags);
/* Update free count with value passed in */
wq->free_count += update_free_count;
while ((wq->free_count > 0) && (!list_empty(&wq->pending_list))) {
wqe = list_first_entry(&wq->pending_list,
struct efct_hw_wqe, list_entry);
list_del_init(&wqe->list_entry);
_efct_hw_wq_write(wq, wqe);
if (wqe->abort_wqe_submit_needed) {
wqe->abort_wqe_submit_needed = false;
efct_hw_fill_abort_wqe(wq->hw, wqe);
INIT_LIST_HEAD(&wqe->list_entry);
list_add_tail(&wqe->list_entry, &wq->pending_list);
wq->wq_pending_count++;
}
}
spin_unlock_irqrestore(&wq->queue->lock, flags);
}
void
efct_hw_cq_process(struct efct_hw *hw, struct hw_cq *cq)
{
u8 cqe[sizeof(struct sli4_mcqe)];
u16 rid = U16_MAX;
/* completion type */
enum sli4_qentry ctype;
u32 n_processed = 0;
u32 tstart, telapsed;
tstart = jiffies_to_msecs(jiffies);
while (!sli_cq_read(&hw->sli, cq->queue, cqe)) {
int status;
status = sli_cq_parse(&hw->sli, cq->queue, cqe, &ctype, &rid);
/*
* The sign of status is significant. If status is:
* == 0 : call completed correctly and
* the CQE indicated success
* > 0 : call completed correctly and
* the CQE indicated an error
* < 0 : call failed and no information is available about the
* CQE
*/
if (status < 0) {
if (status == SLI4_MCQE_STATUS_NOT_COMPLETED)
/*
* Notification that an entry was consumed,
* but not completed
*/
continue;
break;
}
switch (ctype) {
case SLI4_QENTRY_ASYNC:
sli_cqe_async(&hw->sli, cqe);
break;
case SLI4_QENTRY_MQ:
/*
* Process MQ entry. Note there is no way to determine
* the MQ_ID from the completion entry.
*/
efct_hw_mq_process(hw, status, hw->mq);
break;
case SLI4_QENTRY_WQ:
efct_hw_wq_process(hw, cq, cqe, status, rid);
break;
case SLI4_QENTRY_WQ_RELEASE: {
u32 wq_id = rid;
int index;
struct hw_wq *wq = NULL;
index = efct_hw_queue_hash_find(hw->wq_hash, wq_id);
if (likely(index >= 0)) {
wq = hw->hw_wq[index];
} else {
efc_log_err(hw->os, "bad WQ_ID %#06x\n", wq_id);
break;
}
/* Submit any HW IOs that are on the WQ pending list */
hw_wq_submit_pending(wq, wq->wqec_set_count);
break;
}
case SLI4_QENTRY_RQ:
efct_hw_rqpair_process_rq(hw, cq, cqe);
break;
case SLI4_QENTRY_XABT: {
efct_hw_xabt_process(hw, cq, cqe, rid);
break;
}
default:
efc_log_debug(hw->os, "unhandled ctype=%#x rid=%#x\n",
ctype, rid);
break;
}
n_processed++;
if (n_processed == cq->queue->proc_limit)
break;
if (cq->queue->n_posted >= cq->queue->posted_limit)
sli_queue_arm(&hw->sli, cq->queue, false);
}
sli_queue_arm(&hw->sli, cq->queue, true);
if (n_processed > cq->queue->max_num_processed)
cq->queue->max_num_processed = n_processed;
telapsed = jiffies_to_msecs(jiffies) - tstart;
if (telapsed > cq->queue->max_process_time)
cq->queue->max_process_time = telapsed;
}
void
efct_hw_wq_process(struct efct_hw *hw, struct hw_cq *cq,
u8 *cqe, int status, u16 rid)
{
struct hw_wq_callback *wqcb;
if (rid == EFCT_HW_REQUE_XRI_REGTAG) {
if (status)
efc_log_err(hw->os, "reque xri failed, status = %d\n",
status);
return;
}
wqcb = efct_hw_reqtag_get_instance(hw, rid);
if (!wqcb) {
efc_log_err(hw->os, "invalid request tag: x%x\n", rid);
return;
}
if (!wqcb->callback) {
efc_log_err(hw->os, "wqcb callback is NULL\n");
return;
}
(*wqcb->callback)(wqcb->arg, cqe, status);
}
void
efct_hw_xabt_process(struct efct_hw *hw, struct hw_cq *cq,
u8 *cqe, u16 rid)
{
/* search IOs wait free list */
struct efct_hw_io *io = NULL;
unsigned long flags = 0;
io = efct_hw_io_lookup(hw, rid);
if (!io) {
/* IO lookup failure should never happen */
efc_log_err(hw->os, "xabt io lookup failed rid=%#x\n", rid);
return;
}
if (!io->xbusy)
efc_log_debug(hw->os, "xabt io not busy rid=%#x\n", rid);
else
/* mark IO as no longer busy */
io->xbusy = false;
/*
* For IOs that were aborted internally, we need to issue any pending
* callback here.
*/
if (io->done) {
efct_hw_done_t done = io->done;
void *arg = io->arg;
/*
* Use latched status as this is always saved for an internal
* abort
*/
int status = io->saved_status;
u32 len = io->saved_len;
u32 ext = io->saved_ext;
io->done = NULL;
io->status_saved = false;
done(io, len, status, ext, arg);
}
spin_lock_irqsave(&hw->io_lock, flags);
if (io->state == EFCT_HW_IO_STATE_INUSE ||
io->state == EFCT_HW_IO_STATE_WAIT_FREE) {
/* if on wait_free list, caller has already freed IO;
* remove from wait_free list and add to free list.
* if on in-use list, already marked as no longer busy;
* just leave there and wait for caller to free.
*/
if (io->state == EFCT_HW_IO_STATE_WAIT_FREE) {
io->state = EFCT_HW_IO_STATE_FREE;
list_del_init(&io->list_entry);
efct_hw_io_free_move_correct_list(hw, io);
}
}
spin_unlock_irqrestore(&hw->io_lock, flags);
}
static int
efct_hw_flush(struct efct_hw *hw)
{
u32 i = 0;
/* Process any remaining completions */
for (i = 0; i < hw->eq_count; i++)
efct_hw_process(hw, i, ~0);
return 0;
}

View File

@ -652,4 +652,43 @@ efct_hw_reqtag_free(struct efct_hw *hw, struct hw_wq_callback *wqcb);
struct hw_wq_callback
*efct_hw_reqtag_get_instance(struct efct_hw *hw, u32 instance_index);
/* RQ completion handlers for RQ pair mode */
int
efct_hw_rqpair_process_rq(struct efct_hw *hw,
struct hw_cq *cq, u8 *cqe);
int
efct_hw_rqpair_sequence_free(struct efct_hw *hw, struct efc_hw_sequence *seq);
static inline void
efct_hw_sequence_copy(struct efc_hw_sequence *dst,
struct efc_hw_sequence *src)
{
/* Copy src to dst, then zero out the linked list link */
*dst = *src;
}
int
efct_efc_hw_sequence_free(struct efc *efc, struct efc_hw_sequence *seq);
static inline int
efct_hw_sequence_free(struct efct_hw *hw, struct efc_hw_sequence *seq)
{
/* Only RQ pair mode is supported */
return efct_hw_rqpair_sequence_free(hw, seq);
}
int
efct_hw_eq_process(struct efct_hw *hw, struct hw_eq *eq,
u32 max_isr_time_msec);
void efct_hw_cq_process(struct efct_hw *hw, struct hw_cq *cq);
void
efct_hw_wq_process(struct efct_hw *hw, struct hw_cq *cq,
u8 *cqe, int status, u16 rid);
void
efct_hw_xabt_process(struct efct_hw *hw, struct hw_cq *cq,
u8 *cqe, u16 rid);
int
efct_hw_process(struct efct_hw *hw, u32 vector, u32 max_isr_time_msec);
int
efct_hw_queue_hash_find(struct efct_queue_hash *hash, u16 id);
#endif /* __EFCT_H__ */

View File

@ -0,0 +1,191 @@
// SPDX-License-Identifier: GPL-2.0
/*
* Copyright (C) 2021 Broadcom. All Rights Reserved. The term
* Broadcom refers to Broadcom Inc. and/or its subsidiaries.
*/
#include "efct_driver.h"
#include "efct_hw.h"
#include "efct_io.h"
struct efct_io_pool {
struct efct *efct;
spinlock_t lock; /* IO pool lock */
u32 io_num_ios; /* Total IOs allocated */
struct efct_io *ios[EFCT_NUM_SCSI_IOS];
struct list_head freelist;
};
struct efct_io_pool *
efct_io_pool_create(struct efct *efct, u32 num_sgl)
{
u32 i = 0;
struct efct_io_pool *io_pool;
struct efct_io *io;
/* Allocate the IO pool */
io_pool = kzalloc(sizeof(*io_pool), GFP_KERNEL);
if (!io_pool)
return NULL;
io_pool->efct = efct;
INIT_LIST_HEAD(&io_pool->freelist);
/* initialize IO pool lock */
spin_lock_init(&io_pool->lock);
for (i = 0; i < EFCT_NUM_SCSI_IOS; i++) {
io = kzalloc(sizeof(*io), GFP_KERNEL);
if (!io)
break;
io_pool->io_num_ios++;
io_pool->ios[i] = io;
io->tag = i;
io->instance_index = i;
/* Allocate a response buffer */
io->rspbuf.size = SCSI_RSP_BUF_LENGTH;
io->rspbuf.virt = dma_alloc_coherent(&efct->pci->dev,
io->rspbuf.size,
&io->rspbuf.phys, GFP_DMA);
if (!io->rspbuf.virt) {
efc_log_err(efct, "dma_alloc rspbuf failed\n");
efct_io_pool_free(io_pool);
return NULL;
}
/* Allocate SGL */
io->sgl = kzalloc(sizeof(*io->sgl) * num_sgl, GFP_KERNEL);
if (!io->sgl) {
efct_io_pool_free(io_pool);
return NULL;
}
memset(io->sgl, 0, sizeof(*io->sgl) * num_sgl);
io->sgl_allocated = num_sgl;
io->sgl_count = 0;
INIT_LIST_HEAD(&io->list_entry);
list_add_tail(&io->list_entry, &io_pool->freelist);
}
return io_pool;
}
int
efct_io_pool_free(struct efct_io_pool *io_pool)
{
struct efct *efct;
u32 i;
struct efct_io *io;
if (io_pool) {
efct = io_pool->efct;
for (i = 0; i < io_pool->io_num_ios; i++) {
io = io_pool->ios[i];
if (!io)
continue;
kfree(io->sgl);
dma_free_coherent(&efct->pci->dev,
io->rspbuf.size, io->rspbuf.virt,
io->rspbuf.phys);
memset(&io->rspbuf, 0, sizeof(struct efc_dma));
}
kfree(io_pool);
efct->xport->io_pool = NULL;
}
return 0;
}
struct efct_io *
efct_io_pool_io_alloc(struct efct_io_pool *io_pool)
{
struct efct_io *io = NULL;
struct efct *efct;
unsigned long flags = 0;
efct = io_pool->efct;
spin_lock_irqsave(&io_pool->lock, flags);
if (!list_empty(&io_pool->freelist)) {
io = list_first_entry(&io_pool->freelist, struct efct_io,
list_entry);
list_del_init(&io->list_entry);
}
spin_unlock_irqrestore(&io_pool->lock, flags);
if (!io)
return NULL;
io->io_type = EFCT_IO_TYPE_MAX;
io->hio_type = EFCT_HW_IO_MAX;
io->hio = NULL;
io->transferred = 0;
io->efct = efct;
io->timeout = 0;
io->sgl_count = 0;
io->tgt_task_tag = 0;
io->init_task_tag = 0;
io->hw_tag = 0;
io->display_name = "pending";
io->seq_init = 0;
io->io_free = 0;
io->release = NULL;
atomic_add_return(1, &efct->xport->io_active_count);
atomic_add_return(1, &efct->xport->io_total_alloc);
return io;
}
/* Free an object used to track an IO */
void
efct_io_pool_io_free(struct efct_io_pool *io_pool, struct efct_io *io)
{
struct efct *efct;
struct efct_hw_io *hio = NULL;
unsigned long flags = 0;
efct = io_pool->efct;
spin_lock_irqsave(&io_pool->lock, flags);
hio = io->hio;
io->hio = NULL;
io->io_free = 1;
INIT_LIST_HEAD(&io->list_entry);
list_add(&io->list_entry, &io_pool->freelist);
spin_unlock_irqrestore(&io_pool->lock, flags);
if (hio)
efct_hw_io_free(&efct->hw, hio);
atomic_sub_return(1, &efct->xport->io_active_count);
atomic_add_return(1, &efct->xport->io_total_free);
}
/* Find an I/O given it's node and ox_id */
struct efct_io *
efct_io_find_tgt_io(struct efct *efct, struct efct_node *node,
u16 ox_id, u16 rx_id)
{
struct efct_io *io = NULL;
unsigned long flags = 0;
u8 found = false;
spin_lock_irqsave(&node->active_ios_lock, flags);
list_for_each_entry(io, &node->active_ios, list_entry) {
if ((io->cmd_tgt && io->init_task_tag == ox_id) &&
(rx_id == 0xffff || io->tgt_task_tag == rx_id)) {
if (kref_get_unless_zero(&io->ref))
found = true;
break;
}
}
spin_unlock_irqrestore(&node->active_ios_lock, flags);
return found ? io : NULL;
}

View File

@ -0,0 +1,174 @@
/* SPDX-License-Identifier: GPL-2.0 */
/*
* Copyright (C) 2021 Broadcom. All Rights Reserved. The term
* Broadcom refers to Broadcom Inc. and/or its subsidiaries.
*/
#if !defined(__EFCT_IO_H__)
#define __EFCT_IO_H__
#include "efct_lio.h"
#define EFCT_LOG_ENABLE_IO_ERRORS(efct) \
(((efct) != NULL) ? (((efct)->logmask & (1U << 6)) != 0) : 0)
#define io_error_log(io, fmt, ...) \
do { \
if (EFCT_LOG_ENABLE_IO_ERRORS(io->efct)) \
efc_log_warn(io->efct, fmt, ##__VA_ARGS__); \
} while (0)
#define SCSI_CMD_BUF_LENGTH 48
#define SCSI_RSP_BUF_LENGTH (FCP_RESP_WITH_EXT + SCSI_SENSE_BUFFERSIZE)
#define EFCT_NUM_SCSI_IOS 8192
enum efct_io_type {
EFCT_IO_TYPE_IO = 0,
EFCT_IO_TYPE_ELS,
EFCT_IO_TYPE_CT,
EFCT_IO_TYPE_CT_RESP,
EFCT_IO_TYPE_BLS_RESP,
EFCT_IO_TYPE_ABORT,
EFCT_IO_TYPE_MAX,
};
enum efct_els_state {
EFCT_ELS_REQUEST = 0,
EFCT_ELS_REQUEST_DELAYED,
EFCT_ELS_REQUEST_DELAY_ABORT,
EFCT_ELS_REQ_ABORT,
EFCT_ELS_REQ_ABORTED,
EFCT_ELS_ABORT_IO_COMPL,
};
/**
* Scsi target IO object
* @efct: pointer back to efct
* @instance_index: unique instance index value
* @io: IO display name
* @node: pointer to node
* @list_entry: io list entry
* @io_pending_link: io pending list entry
* @ref: reference counter
* @release: release callback function
* @init_task_tag: initiator task tag (OX_ID) for back-end and SCSI logging
* @tgt_task_tag: target task tag (RX_ID) for back-end and SCSI logging
* @hw_tag: HW layer unique IO id
* @tag: unique IO identifier
* @sgl: SGL
* @sgl_allocated: Number of allocated SGEs
* @sgl_count: Number of SGEs in this SGL
* @tgt_io: backend target private IO data
* @exp_xfer_len: expected data transfer length, based on FC header
* @hw_priv: Declarations private to HW/SLI
* @io_type: indicates what this struct efct_io structure is used for
* @hio: hw io object
* @transferred: Number of bytes transferred
* @auto_resp: set if auto_trsp was set
* @low_latency: set if low latency request
* @wq_steering: selected WQ steering request
* @wq_class: selected WQ class if steering is class
* @xfer_req: transfer size for current request
* @scsi_tgt_cb: target callback function
* @scsi_tgt_cb_arg: target callback function argument
* @abort_cb: abort callback function
* @abort_cb_arg: abort callback function argument
* @bls_cb: BLS callback function
* @bls_cb_arg: BLS callback function argument
* @tmf_cmd: TMF command being processed
* @abort_rx_id: rx_id from the ABTS that initiated the command abort
* @cmd_tgt: True if this is a Target command
* @send_abts: when aborting, indicates ABTS is to be sent
* @cmd_ini: True if this is an Initiator command
* @seq_init: True if local node has sequence initiative
* @iparam: iparams for hw io send call
* @hio_type: HW IO type
* @wire_len: wire length
* @hw_cb: saved HW callback
* @io_to_abort: for abort handling, pointer to IO to abort
* @rspbuf: SCSI Response buffer
* @timeout: Timeout value in seconds for this IO
* @cs_ctl: CS_CTL priority for this IO
* @io_free: Is io object in freelist
* @app_id: application id
*/
struct efct_io {
struct efct *efct;
u32 instance_index;
const char *display_name;
struct efct_node *node;
struct list_head list_entry;
struct list_head io_pending_link;
struct kref ref;
void (*release)(struct kref *arg);
u32 init_task_tag;
u32 tgt_task_tag;
u32 hw_tag;
u32 tag;
struct efct_scsi_sgl *sgl;
u32 sgl_allocated;
u32 sgl_count;
struct efct_scsi_tgt_io tgt_io;
u32 exp_xfer_len;
void *hw_priv;
enum efct_io_type io_type;
struct efct_hw_io *hio;
size_t transferred;
bool auto_resp;
bool low_latency;
u8 wq_steering;
u8 wq_class;
u64 xfer_req;
efct_scsi_io_cb_t scsi_tgt_cb;
void *scsi_tgt_cb_arg;
efct_scsi_io_cb_t abort_cb;
void *abort_cb_arg;
efct_scsi_io_cb_t bls_cb;
void *bls_cb_arg;
enum efct_scsi_tmf_cmd tmf_cmd;
u16 abort_rx_id;
bool cmd_tgt;
bool send_abts;
bool cmd_ini;
bool seq_init;
union efct_hw_io_param_u iparam;
enum efct_hw_io_type hio_type;
u64 wire_len;
void *hw_cb;
struct efct_io *io_to_abort;
struct efc_dma rspbuf;
u32 timeout;
u8 cs_ctl;
u8 io_free;
u32 app_id;
};
struct efct_io_cb_arg {
int status;
int ext_status;
void *app;
};
struct efct_io_pool *
efct_io_pool_create(struct efct *efct, u32 num_sgl);
int
efct_io_pool_free(struct efct_io_pool *io_pool);
u32
efct_io_pool_allocated(struct efct_io_pool *io_pool);
struct efct_io *
efct_io_pool_io_alloc(struct efct_io_pool *io_pool);
void
efct_io_pool_io_free(struct efct_io_pool *io_pool, struct efct_io *io);
struct efct_io *
efct_io_find_tgt_io(struct efct *efct, struct efct_node *node,
u16 ox_id, u16 rx_id);
#endif /* __EFCT_IO_H__ */