e6dbe9397e
This reverts commitaa136d0c82
. As I previously[1] pointed out this implementation of XDP_REDIRECT is wrong. XDP_REDIRECT is a facility that must work between different NIC drivers. Another NIC driver can call ndo_xdp_xmit/nicvf_xdp_xmit, but your driver patch assumes payload data (at top of page) will contain a queue index and a DMA addr, this is not true and worse will likely contain garbage. Given you have not fixed this in due time (just reached v4.16-rc1), the only option I see is a revert. [1] http://lkml.kernel.org/r/20171211130902.482513d3@redhat.com Cc: Sunil Goutham <sgoutham@cavium.com> Cc: Christina Jacob <cjacob@caviumnetworks.com> Cc: Aleksey Makarov <aleksey.makarov@cavium.com> Fixes:aa136d0c82
("net: thunderx: Add support for xdp redirect") Signed-off-by: Jesper Dangaard Brouer <brouer@redhat.com> Signed-off-by: David S. Miller <davem@davemloft.net>
378 lines
11 KiB
C
378 lines
11 KiB
C
/*
|
|
* Copyright (C) 2015 Cavium, Inc.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms of version 2 of the GNU General Public License
|
|
* as published by the Free Software Foundation.
|
|
*/
|
|
|
|
#ifndef NICVF_QUEUES_H
|
|
#define NICVF_QUEUES_H
|
|
|
|
#include <linux/netdevice.h>
|
|
#include <linux/iommu.h>
|
|
#include <net/xdp.h>
|
|
#include "q_struct.h"
|
|
|
|
#define MAX_QUEUE_SET 128
|
|
#define MAX_RCV_QUEUES_PER_QS 8
|
|
#define MAX_RCV_BUF_DESC_RINGS_PER_QS 2
|
|
#define MAX_SND_QUEUES_PER_QS 8
|
|
#define MAX_CMP_QUEUES_PER_QS 8
|
|
|
|
/* VF's queue interrupt ranges */
|
|
#define NICVF_INTR_ID_CQ 0
|
|
#define NICVF_INTR_ID_SQ 8
|
|
#define NICVF_INTR_ID_RBDR 16
|
|
#define NICVF_INTR_ID_MISC 18
|
|
#define NICVF_INTR_ID_QS_ERR 19
|
|
|
|
#define for_each_cq_irq(irq) \
|
|
for (irq = NICVF_INTR_ID_CQ; irq < NICVF_INTR_ID_SQ; irq++)
|
|
#define for_each_sq_irq(irq) \
|
|
for (irq = NICVF_INTR_ID_SQ; irq < NICVF_INTR_ID_RBDR; irq++)
|
|
#define for_each_rbdr_irq(irq) \
|
|
for (irq = NICVF_INTR_ID_RBDR; irq < NICVF_INTR_ID_MISC; irq++)
|
|
|
|
#define RBDR_SIZE0 0ULL /* 8K entries */
|
|
#define RBDR_SIZE1 1ULL /* 16K entries */
|
|
#define RBDR_SIZE2 2ULL /* 32K entries */
|
|
#define RBDR_SIZE3 3ULL /* 64K entries */
|
|
#define RBDR_SIZE4 4ULL /* 126K entries */
|
|
#define RBDR_SIZE5 5ULL /* 256K entries */
|
|
#define RBDR_SIZE6 6ULL /* 512K entries */
|
|
|
|
#define SND_QUEUE_SIZE0 0ULL /* 1K entries */
|
|
#define SND_QUEUE_SIZE1 1ULL /* 2K entries */
|
|
#define SND_QUEUE_SIZE2 2ULL /* 4K entries */
|
|
#define SND_QUEUE_SIZE3 3ULL /* 8K entries */
|
|
#define SND_QUEUE_SIZE4 4ULL /* 16K entries */
|
|
#define SND_QUEUE_SIZE5 5ULL /* 32K entries */
|
|
#define SND_QUEUE_SIZE6 6ULL /* 64K entries */
|
|
|
|
#define CMP_QUEUE_SIZE0 0ULL /* 1K entries */
|
|
#define CMP_QUEUE_SIZE1 1ULL /* 2K entries */
|
|
#define CMP_QUEUE_SIZE2 2ULL /* 4K entries */
|
|
#define CMP_QUEUE_SIZE3 3ULL /* 8K entries */
|
|
#define CMP_QUEUE_SIZE4 4ULL /* 16K entries */
|
|
#define CMP_QUEUE_SIZE5 5ULL /* 32K entries */
|
|
#define CMP_QUEUE_SIZE6 6ULL /* 64K entries */
|
|
|
|
/* Default queue count per QS, its lengths and threshold values */
|
|
#define DEFAULT_RBDR_CNT 1
|
|
|
|
#define SND_QSIZE SND_QUEUE_SIZE0
|
|
#define SND_QUEUE_LEN (1ULL << (SND_QSIZE + 10))
|
|
#define MIN_SND_QUEUE_LEN (1ULL << (SND_QUEUE_SIZE0 + 10))
|
|
#define MAX_SND_QUEUE_LEN (1ULL << (SND_QUEUE_SIZE6 + 10))
|
|
#define SND_QUEUE_THRESH 2ULL
|
|
#define MIN_SQ_DESC_PER_PKT_XMIT 2
|
|
/* Since timestamp not enabled, otherwise 2 */
|
|
#define MAX_CQE_PER_PKT_XMIT 1
|
|
|
|
/* Keep CQ and SQ sizes same, if timestamping
|
|
* is enabled this equation will change.
|
|
*/
|
|
#define CMP_QSIZE CMP_QUEUE_SIZE0
|
|
#define CMP_QUEUE_LEN (1ULL << (CMP_QSIZE + 10))
|
|
#define MIN_CMP_QUEUE_LEN (1ULL << (CMP_QUEUE_SIZE0 + 10))
|
|
#define MAX_CMP_QUEUE_LEN (1ULL << (CMP_QUEUE_SIZE6 + 10))
|
|
#define CMP_QUEUE_CQE_THRESH (NAPI_POLL_WEIGHT / 2)
|
|
#define CMP_QUEUE_TIMER_THRESH 80 /* ~2usec */
|
|
|
|
/* No of CQEs that might anyway gets used by HW due to pipelining
|
|
* effects irrespective of PASS/DROP/LEVELS being configured
|
|
*/
|
|
#define CMP_QUEUE_PIPELINE_RSVD 544
|
|
|
|
#define RBDR_SIZE RBDR_SIZE0
|
|
#define RCV_BUF_COUNT (1ULL << (RBDR_SIZE + 13))
|
|
#define MAX_RCV_BUF_COUNT (1ULL << (RBDR_SIZE6 + 13))
|
|
#define RBDR_THRESH (RCV_BUF_COUNT / 2)
|
|
#define DMA_BUFFER_LEN 1536 /* In multiples of 128bytes */
|
|
#define RCV_FRAG_LEN (SKB_DATA_ALIGN(DMA_BUFFER_LEN + NET_SKB_PAD) + \
|
|
SKB_DATA_ALIGN(sizeof(struct skb_shared_info)))
|
|
|
|
#define MAX_CQES_FOR_TX ((SND_QUEUE_LEN / MIN_SQ_DESC_PER_PKT_XMIT) * \
|
|
MAX_CQE_PER_PKT_XMIT)
|
|
|
|
/* RED and Backpressure levels of CQ for pkt reception
|
|
* For CQ, level is a measure of emptiness i.e 0x0 means full
|
|
* eg: For CQ of size 4K, and for pass/drop levels of 160/144
|
|
* HW accepts pkt if unused CQE >= 2560
|
|
* RED accepts pkt if unused CQE < 2304 & >= 2560
|
|
* DROPs pkts if unused CQE < 2304
|
|
*/
|
|
#define RQ_PASS_CQ_LVL 192ULL
|
|
#define RQ_DROP_CQ_LVL 184ULL
|
|
|
|
/* RED and Backpressure levels of RBDR for pkt reception
|
|
* For RBDR, level is a measure of fullness i.e 0x0 means empty
|
|
* eg: For RBDR of size 8K, and for pass/drop levels of 4/0
|
|
* HW accepts pkt if unused RBs >= 256
|
|
* RED accepts pkt if unused RBs < 256 & >= 0
|
|
* DROPs pkts if unused RBs < 0
|
|
*/
|
|
#define RQ_PASS_RBDR_LVL 8ULL
|
|
#define RQ_DROP_RBDR_LVL 0ULL
|
|
|
|
/* Descriptor size in bytes */
|
|
#define SND_QUEUE_DESC_SIZE 16
|
|
#define CMP_QUEUE_DESC_SIZE 512
|
|
|
|
/* Buffer / descriptor alignments */
|
|
#define NICVF_RCV_BUF_ALIGN 7
|
|
#define NICVF_RCV_BUF_ALIGN_BYTES (1ULL << NICVF_RCV_BUF_ALIGN)
|
|
#define NICVF_CQ_BASE_ALIGN_BYTES 512 /* 9 bits */
|
|
#define NICVF_SQ_BASE_ALIGN_BYTES 128 /* 7 bits */
|
|
|
|
#define NICVF_ALIGNED_ADDR(ADDR, ALIGN_BYTES) ALIGN(ADDR, ALIGN_BYTES)
|
|
|
|
/* Queue enable/disable */
|
|
#define NICVF_SQ_EN BIT_ULL(19)
|
|
|
|
/* Queue reset */
|
|
#define NICVF_CQ_RESET BIT_ULL(41)
|
|
#define NICVF_SQ_RESET BIT_ULL(17)
|
|
#define NICVF_RBDR_RESET BIT_ULL(43)
|
|
|
|
enum CQ_RX_ERRLVL_E {
|
|
CQ_ERRLVL_MAC,
|
|
CQ_ERRLVL_L2,
|
|
CQ_ERRLVL_L3,
|
|
CQ_ERRLVL_L4,
|
|
};
|
|
|
|
enum CQ_RX_ERROP_E {
|
|
CQ_RX_ERROP_RE_NONE = 0x0,
|
|
CQ_RX_ERROP_RE_PARTIAL = 0x1,
|
|
CQ_RX_ERROP_RE_JABBER = 0x2,
|
|
CQ_RX_ERROP_RE_FCS = 0x7,
|
|
CQ_RX_ERROP_RE_TERMINATE = 0x9,
|
|
CQ_RX_ERROP_RE_RX_CTL = 0xb,
|
|
CQ_RX_ERROP_PREL2_ERR = 0x1f,
|
|
CQ_RX_ERROP_L2_FRAGMENT = 0x20,
|
|
CQ_RX_ERROP_L2_OVERRUN = 0x21,
|
|
CQ_RX_ERROP_L2_PFCS = 0x22,
|
|
CQ_RX_ERROP_L2_PUNY = 0x23,
|
|
CQ_RX_ERROP_L2_MAL = 0x24,
|
|
CQ_RX_ERROP_L2_OVERSIZE = 0x25,
|
|
CQ_RX_ERROP_L2_UNDERSIZE = 0x26,
|
|
CQ_RX_ERROP_L2_LENMISM = 0x27,
|
|
CQ_RX_ERROP_L2_PCLP = 0x28,
|
|
CQ_RX_ERROP_IP_NOT = 0x41,
|
|
CQ_RX_ERROP_IP_CSUM_ERR = 0x42,
|
|
CQ_RX_ERROP_IP_MAL = 0x43,
|
|
CQ_RX_ERROP_IP_MALD = 0x44,
|
|
CQ_RX_ERROP_IP_HOP = 0x45,
|
|
CQ_RX_ERROP_L3_ICRC = 0x46,
|
|
CQ_RX_ERROP_L3_PCLP = 0x47,
|
|
CQ_RX_ERROP_L4_MAL = 0x61,
|
|
CQ_RX_ERROP_L4_CHK = 0x62,
|
|
CQ_RX_ERROP_UDP_LEN = 0x63,
|
|
CQ_RX_ERROP_L4_PORT = 0x64,
|
|
CQ_RX_ERROP_TCP_FLAG = 0x65,
|
|
CQ_RX_ERROP_TCP_OFFSET = 0x66,
|
|
CQ_RX_ERROP_L4_PCLP = 0x67,
|
|
CQ_RX_ERROP_RBDR_TRUNC = 0x70,
|
|
};
|
|
|
|
enum CQ_TX_ERROP_E {
|
|
CQ_TX_ERROP_GOOD = 0x0,
|
|
CQ_TX_ERROP_DESC_FAULT = 0x10,
|
|
CQ_TX_ERROP_HDR_CONS_ERR = 0x11,
|
|
CQ_TX_ERROP_SUBDC_ERR = 0x12,
|
|
CQ_TX_ERROP_MAX_SIZE_VIOL = 0x13,
|
|
CQ_TX_ERROP_IMM_SIZE_OFLOW = 0x80,
|
|
CQ_TX_ERROP_DATA_SEQUENCE_ERR = 0x81,
|
|
CQ_TX_ERROP_MEM_SEQUENCE_ERR = 0x82,
|
|
CQ_TX_ERROP_LOCK_VIOL = 0x83,
|
|
CQ_TX_ERROP_DATA_FAULT = 0x84,
|
|
CQ_TX_ERROP_TSTMP_CONFLICT = 0x85,
|
|
CQ_TX_ERROP_TSTMP_TIMEOUT = 0x86,
|
|
CQ_TX_ERROP_MEM_FAULT = 0x87,
|
|
CQ_TX_ERROP_CK_OVERLAP = 0x88,
|
|
CQ_TX_ERROP_CK_OFLOW = 0x89,
|
|
CQ_TX_ERROP_ENUM_LAST = 0x8a,
|
|
};
|
|
|
|
enum RQ_SQ_STATS {
|
|
RQ_SQ_STATS_OCTS,
|
|
RQ_SQ_STATS_PKTS,
|
|
};
|
|
|
|
struct rx_tx_queue_stats {
|
|
u64 bytes;
|
|
u64 pkts;
|
|
} ____cacheline_aligned_in_smp;
|
|
|
|
struct q_desc_mem {
|
|
dma_addr_t dma;
|
|
u64 size;
|
|
u32 q_len;
|
|
dma_addr_t phys_base;
|
|
void *base;
|
|
void *unalign_base;
|
|
};
|
|
|
|
struct pgcache {
|
|
struct page *page;
|
|
int ref_count;
|
|
u64 dma_addr;
|
|
};
|
|
|
|
struct rbdr {
|
|
bool enable;
|
|
u32 dma_size;
|
|
u32 frag_len;
|
|
u32 thresh; /* Threshold level for interrupt */
|
|
void *desc;
|
|
u32 head;
|
|
u32 tail;
|
|
struct q_desc_mem dmem;
|
|
bool is_xdp;
|
|
|
|
/* For page recycling */
|
|
int pgidx;
|
|
int pgcnt;
|
|
int pgalloc;
|
|
struct pgcache *pgcache;
|
|
} ____cacheline_aligned_in_smp;
|
|
|
|
struct rcv_queue {
|
|
bool enable;
|
|
struct rbdr *rbdr_start;
|
|
struct rbdr *rbdr_cont;
|
|
bool en_tcp_reassembly;
|
|
u8 cq_qs; /* CQ's QS to which this RQ is assigned */
|
|
u8 cq_idx; /* CQ index (0 to 7) in the QS */
|
|
u8 cont_rbdr_qs; /* Continue buffer ptrs - QS num */
|
|
u8 cont_qs_rbdr_idx; /* RBDR idx in the cont QS */
|
|
u8 start_rbdr_qs; /* First buffer ptrs - QS num */
|
|
u8 start_qs_rbdr_idx; /* RBDR idx in the above QS */
|
|
u8 caching;
|
|
struct rx_tx_queue_stats stats;
|
|
struct xdp_rxq_info xdp_rxq;
|
|
} ____cacheline_aligned_in_smp;
|
|
|
|
struct cmp_queue {
|
|
bool enable;
|
|
u16 thresh;
|
|
spinlock_t lock; /* lock to serialize processing CQEs */
|
|
void *desc;
|
|
struct q_desc_mem dmem;
|
|
int irq;
|
|
} ____cacheline_aligned_in_smp;
|
|
|
|
struct snd_queue {
|
|
bool enable;
|
|
u8 cq_qs; /* CQ's QS to which this SQ is pointing */
|
|
u8 cq_idx; /* CQ index (0 to 7) in the above QS */
|
|
u16 thresh;
|
|
atomic_t free_cnt;
|
|
u32 head;
|
|
u32 tail;
|
|
u64 *skbuff;
|
|
void *desc;
|
|
u64 *xdp_page;
|
|
u16 xdp_desc_cnt;
|
|
u16 xdp_free_cnt;
|
|
bool is_xdp;
|
|
|
|
/* For TSO segment's header */
|
|
char *tso_hdrs;
|
|
dma_addr_t tso_hdrs_phys;
|
|
|
|
cpumask_t affinity_mask;
|
|
struct q_desc_mem dmem;
|
|
struct rx_tx_queue_stats stats;
|
|
} ____cacheline_aligned_in_smp;
|
|
|
|
struct queue_set {
|
|
bool enable;
|
|
bool be_en;
|
|
u8 vnic_id;
|
|
u8 rq_cnt;
|
|
u8 cq_cnt;
|
|
u64 cq_len;
|
|
u8 sq_cnt;
|
|
u64 sq_len;
|
|
u8 rbdr_cnt;
|
|
u64 rbdr_len;
|
|
struct rcv_queue rq[MAX_RCV_QUEUES_PER_QS];
|
|
struct cmp_queue cq[MAX_CMP_QUEUES_PER_QS];
|
|
struct snd_queue sq[MAX_SND_QUEUES_PER_QS];
|
|
struct rbdr rbdr[MAX_RCV_BUF_DESC_RINGS_PER_QS];
|
|
} ____cacheline_aligned_in_smp;
|
|
|
|
#define GET_RBDR_DESC(RING, idx)\
|
|
(&(((struct rbdr_entry_t *)((RING)->desc))[idx]))
|
|
#define GET_SQ_DESC(RING, idx)\
|
|
(&(((struct sq_hdr_subdesc *)((RING)->desc))[idx]))
|
|
#define GET_CQ_DESC(RING, idx)\
|
|
(&(((union cq_desc_t *)((RING)->desc))[idx]))
|
|
|
|
/* CQ status bits */
|
|
#define CQ_WR_FULL BIT(26)
|
|
#define CQ_WR_DISABLE BIT(25)
|
|
#define CQ_WR_FAULT BIT(24)
|
|
#define CQ_CQE_COUNT (0xFFFF << 0)
|
|
|
|
#define CQ_ERR_MASK (CQ_WR_FULL | CQ_WR_DISABLE | CQ_WR_FAULT)
|
|
|
|
static inline u64 nicvf_iova_to_phys(struct nicvf *nic, dma_addr_t dma_addr)
|
|
{
|
|
/* Translation is installed only when IOMMU is present */
|
|
if (nic->iommu_domain)
|
|
return iommu_iova_to_phys(nic->iommu_domain, dma_addr);
|
|
return dma_addr;
|
|
}
|
|
|
|
void nicvf_unmap_sndq_buffers(struct nicvf *nic, struct snd_queue *sq,
|
|
int hdr_sqe, u8 subdesc_cnt);
|
|
void nicvf_config_vlan_stripping(struct nicvf *nic,
|
|
netdev_features_t features);
|
|
int nicvf_set_qset_resources(struct nicvf *nic);
|
|
int nicvf_config_data_transfer(struct nicvf *nic, bool enable);
|
|
void nicvf_qset_config(struct nicvf *nic, bool enable);
|
|
void nicvf_cmp_queue_config(struct nicvf *nic, struct queue_set *qs,
|
|
int qidx, bool enable);
|
|
|
|
void nicvf_sq_enable(struct nicvf *nic, struct snd_queue *sq, int qidx);
|
|
void nicvf_sq_disable(struct nicvf *nic, int qidx);
|
|
void nicvf_put_sq_desc(struct snd_queue *sq, int desc_cnt);
|
|
void nicvf_sq_free_used_descs(struct net_device *netdev,
|
|
struct snd_queue *sq, int qidx);
|
|
int nicvf_sq_append_skb(struct nicvf *nic, struct snd_queue *sq,
|
|
struct sk_buff *skb, u8 sq_num);
|
|
int nicvf_xdp_sq_append_pkt(struct nicvf *nic, struct snd_queue *sq,
|
|
u64 bufaddr, u64 dma_addr, u16 len);
|
|
void nicvf_xdp_sq_doorbell(struct nicvf *nic, struct snd_queue *sq, int sq_num);
|
|
|
|
struct sk_buff *nicvf_get_rcv_skb(struct nicvf *nic,
|
|
struct cqe_rx_t *cqe_rx, bool xdp);
|
|
void nicvf_rbdr_task(unsigned long data);
|
|
void nicvf_rbdr_work(struct work_struct *work);
|
|
|
|
void nicvf_enable_intr(struct nicvf *nic, int int_type, int q_idx);
|
|
void nicvf_disable_intr(struct nicvf *nic, int int_type, int q_idx);
|
|
void nicvf_clear_intr(struct nicvf *nic, int int_type, int q_idx);
|
|
int nicvf_is_intr_enabled(struct nicvf *nic, int int_type, int q_idx);
|
|
|
|
/* Register access APIs */
|
|
void nicvf_reg_write(struct nicvf *nic, u64 offset, u64 val);
|
|
u64 nicvf_reg_read(struct nicvf *nic, u64 offset);
|
|
void nicvf_qset_reg_write(struct nicvf *nic, u64 offset, u64 val);
|
|
u64 nicvf_qset_reg_read(struct nicvf *nic, u64 offset);
|
|
void nicvf_queue_reg_write(struct nicvf *nic, u64 offset,
|
|
u64 qidx, u64 val);
|
|
u64 nicvf_queue_reg_read(struct nicvf *nic,
|
|
u64 offset, u64 qidx);
|
|
|
|
/* Stats */
|
|
void nicvf_update_rq_stats(struct nicvf *nic, int rq_idx);
|
|
void nicvf_update_sq_stats(struct nicvf *nic, int sq_idx);
|
|
int nicvf_check_cqe_rx_errs(struct nicvf *nic, struct cqe_rx_t *cqe_rx);
|
|
int nicvf_check_cqe_tx_errs(struct nicvf *nic, struct cqe_send_t *cqe_tx);
|
|
#endif /* NICVF_QUEUES_H */
|