f-stack/dpdk/drivers/baseband/acc100/rte_acc100_pmd.h

603 lines
17 KiB
C

/* SPDX-License-Identifier: BSD-3-Clause
* Copyright(c) 2020 Intel Corporation
*/
#ifndef _RTE_ACC100_PMD_H_
#define _RTE_ACC100_PMD_H_
#include "acc100_pf_enum.h"
#include "acc100_vf_enum.h"
#include "rte_acc100_cfg.h"
/* Helper macro for logging */
#define rte_bbdev_log(level, fmt, ...) \
rte_log(RTE_LOG_ ## level, acc100_logtype, fmt "\n", \
##__VA_ARGS__)
#ifdef RTE_LIBRTE_BBDEV_DEBUG
#define rte_bbdev_log_debug(fmt, ...) \
rte_bbdev_log(DEBUG, "acc100_pmd: " fmt, \
##__VA_ARGS__)
#else
#define rte_bbdev_log_debug(fmt, ...)
#endif
/* ACC100 PF and VF driver names */
#define ACC100PF_DRIVER_NAME intel_acc100_pf
#define ACC100VF_DRIVER_NAME intel_acc100_vf
/* ACC100 PCI vendor & device IDs */
#define RTE_ACC100_VENDOR_ID (0x8086)
#define RTE_ACC100_PF_DEVICE_ID (0x0d5c)
#define RTE_ACC100_VF_DEVICE_ID (0x0d5d)
/* Define as 1 to use only a single FEC engine */
#ifndef RTE_ACC100_SINGLE_FEC
#define RTE_ACC100_SINGLE_FEC 0
#endif
/* Values used in filling in descriptors */
#define ACC100_DMA_DESC_TYPE 2
#define ACC100_DMA_CODE_BLK_MODE 0
#define ACC100_DMA_BLKID_FCW 1
#define ACC100_DMA_BLKID_IN 2
#define ACC100_DMA_BLKID_OUT_ENC 1
#define ACC100_DMA_BLKID_OUT_HARD 1
#define ACC100_DMA_BLKID_OUT_SOFT 2
#define ACC100_DMA_BLKID_OUT_HARQ 3
#define ACC100_DMA_BLKID_IN_HARQ 3
/* Values used in filling in decode FCWs */
#define ACC100_FCW_TD_VER 1
#define ACC100_FCW_TD_EXT_COLD_REG_EN 1
#define ACC100_FCW_TD_AUTOMAP 0x0f
#define ACC100_FCW_TD_RVIDX_0 2
#define ACC100_FCW_TD_RVIDX_1 26
#define ACC100_FCW_TD_RVIDX_2 50
#define ACC100_FCW_TD_RVIDX_3 74
/* Values used in writing to the registers */
#define ACC100_REG_IRQ_EN_ALL 0x1FF83FF /* Enable all interrupts */
/* ACC100 Specific Dimensioning */
#define ACC100_SIZE_64MBYTE (64*1024*1024)
/* Number of elements in an Info Ring */
#define ACC100_INFO_RING_NUM_ENTRIES 1024
/* Number of elements in HARQ layout memory */
#define ACC100_HARQ_LAYOUT (64*1024*1024)
/* Assume offset for HARQ in memory */
#define ACC100_HARQ_OFFSET (32*1024)
/* Mask used to calculate an index in an Info Ring array (not a byte offset) */
#define ACC100_INFO_RING_MASK (ACC100_INFO_RING_NUM_ENTRIES-1)
/* Number of Virtual Functions ACC100 supports */
#define ACC100_NUM_VFS 16
#define ACC100_NUM_QGRPS 8
#define ACC100_NUM_QGRPS_PER_WORD 8
#define ACC100_NUM_AQS 16
#define MAX_ENQ_BATCH_SIZE 255
/* All ACC100 Registers alignment are 32bits = 4B */
#define ACC100_BYTES_IN_WORD 4
#define ACC100_MAX_E_MBUF 64000
#define ACC100_GRP_ID_SHIFT 10 /* Queue Index Hierarchy */
#define ACC100_VF_ID_SHIFT 4 /* Queue Index Hierarchy */
#define ACC100_VF_OFFSET_QOS 16 /* offset in Memory specific to QoS Mon */
#define ACC100_TMPL_PRI_0 0x03020100
#define ACC100_TMPL_PRI_1 0x07060504
#define ACC100_TMPL_PRI_2 0x0b0a0908
#define ACC100_TMPL_PRI_3 0x0f0e0d0c
#define ACC100_QUEUE_ENABLE 0x80000000 /* Bit to mark Queue as Enabled */
#define ACC100_WORDS_IN_ARAM_SIZE (128 * 1024 / 4)
#define ACC100_FDONE 0x80000000
#define ACC100_SDONE 0x40000000
#define ACC100_NUM_TMPL 32
/* Mapping of signals for the available engines */
#define ACC100_SIG_UL_5G 0
#define ACC100_SIG_UL_5G_LAST 7
#define ACC100_SIG_DL_5G 13
#define ACC100_SIG_DL_5G_LAST 15
#define ACC100_SIG_UL_4G 16
#define ACC100_SIG_UL_4G_LAST 21
#define ACC100_SIG_DL_4G 27
#define ACC100_SIG_DL_4G_LAST 31
#define ACC100_NUM_ACCS 5
#define ACC100_ACCMAP_0 0
#define ACC100_ACCMAP_1 2
#define ACC100_ACCMAP_2 1
#define ACC100_ACCMAP_3 3
#define ACC100_ACCMAP_4 4
#define ACC100_PF_VAL 2
/* max number of iterations to allocate memory block for all rings */
#define ACC100_SW_RING_MEM_ALLOC_ATTEMPTS 5
#define ACC100_MAX_QUEUE_DEPTH 1024
#define ACC100_DMA_MAX_NUM_POINTERS 14
#define ACC100_DMA_DESC_PADDING 8
#define ACC100_FCW_PADDING 12
#define ACC100_DESC_FCW_OFFSET 192
#define ACC100_DESC_SIZE 256
#define ACC100_DESC_OFFSET (ACC100_DESC_SIZE / 64)
#define ACC100_FCW_TE_BLEN 32
#define ACC100_FCW_TD_BLEN 24
#define ACC100_FCW_LE_BLEN 32
#define ACC100_FCW_LD_BLEN 36
#define ACC100_5GUL_SIZE_0 16
#define ACC100_5GUL_SIZE_1 40
#define ACC100_5GUL_OFFSET_0 36
#define ACC100_FCW_VER 2
#define ACC100_MUX_5GDL_DESC 6
#define ACC100_CMP_ENC_SIZE 20
#define ACC100_CMP_DEC_SIZE 24
#define ACC100_ENC_OFFSET (32)
#define ACC100_DEC_OFFSET (80)
#define ACC100_EXT_MEM /* Default option with memory external to CPU */
#define ACC100_HARQ_OFFSET_THRESHOLD 1024
/* Constants from K0 computation from 3GPP 38.212 Table 5.4.2.1-2 */
#define ACC100_N_ZC_1 66 /* N = 66 Zc for BG 1 */
#define ACC100_N_ZC_2 50 /* N = 50 Zc for BG 2 */
#define ACC100_K0_1_1 17 /* K0 fraction numerator for rv 1 and BG 1 */
#define ACC100_K0_1_2 13 /* K0 fraction numerator for rv 1 and BG 2 */
#define ACC100_K0_2_1 33 /* K0 fraction numerator for rv 2 and BG 1 */
#define ACC100_K0_2_2 25 /* K0 fraction numerator for rv 2 and BG 2 */
#define ACC100_K0_3_1 56 /* K0 fraction numerator for rv 3 and BG 1 */
#define ACC100_K0_3_2 43 /* K0 fraction numerator for rv 3 and BG 2 */
/* ACC100 Configuration */
#define ACC100_DDR_ECC_ENABLE
#define ACC100_CFG_DMA_ERROR 0x3D7
#define ACC100_CFG_AXI_CACHE 0x11
#define ACC100_CFG_QMGR_HI_P 0x0F0F
#define ACC100_CFG_PCI_AXI 0xC003
#define ACC100_CFG_PCI_BRIDGE 0x40006033
#define ACC100_ENGINE_OFFSET 0x1000
#define ACC100_RESET_HI 0x20100
#define ACC100_RESET_LO 0x20000
#define ACC100_RESET_HARD 0x1FF
#define ACC100_ENGINES_MAX 9
#define ACC100_LONG_WAIT 1000
#define ACC100_GPEX_AXIMAP_NUM 17
/* ACC100 DMA Descriptor triplet */
struct acc100_dma_triplet {
uint64_t address;
uint32_t blen:20,
res0:4,
last:1,
dma_ext:1,
res1:2,
blkid:4;
} __rte_packed;
/* ACC100 DMA Response Descriptor */
union acc100_dma_rsp_desc {
uint32_t val;
struct {
uint32_t crc_status:1,
synd_ok:1,
dma_err:1,
neg_stop:1,
fcw_err:1,
output_err:1,
input_err:1,
timestampEn:1,
iterCountFrac:8,
iter_cnt:8,
rsrvd3:6,
sdone:1,
fdone:1;
uint32_t add_info_0;
uint32_t add_info_1;
};
};
/* ACC100 Queue Manager Enqueue PCI Register */
union acc100_enqueue_reg_fmt {
uint32_t val;
struct {
uint32_t num_elem:8,
addr_offset:3,
rsrvd:1,
req_elem_addr:20;
};
};
/* FEC 4G Uplink Frame Control Word */
struct __rte_packed acc100_fcw_td {
uint8_t fcw_ver:4,
num_maps:4; /* Unused */
uint8_t filler:6, /* Unused */
rsrvd0:1,
bypass_sb_deint:1;
uint16_t k_pos;
uint16_t k_neg; /* Unused */
uint8_t c_neg; /* Unused */
uint8_t c; /* Unused */
uint32_t ea; /* Unused */
uint32_t eb; /* Unused */
uint8_t cab; /* Unused */
uint8_t k0_start_col; /* Unused */
uint8_t rsrvd1;
uint8_t code_block_mode:1, /* Unused */
turbo_crc_type:1,
rsrvd2:3,
bypass_teq:1, /* Unused */
soft_output_en:1, /* Unused */
ext_td_cold_reg_en:1;
union { /* External Cold register */
uint32_t ext_td_cold_reg;
struct {
uint32_t min_iter:4, /* Unused */
max_iter:4,
ext_scale:5, /* Unused */
rsrvd3:3,
early_stop_en:1, /* Unused */
sw_soft_out_dis:1, /* Unused */
sw_et_cont:1, /* Unused */
sw_soft_out_saturation:1, /* Unused */
half_iter_on:1, /* Unused */
raw_decoder_input_on:1, /* Unused */
rsrvd4:10;
};
};
};
/* FEC 5GNR Uplink Frame Control Word */
struct __rte_packed acc100_fcw_ld {
uint32_t FCWversion:4,
qm:4,
nfiller:11,
BG:1,
Zc:9,
res0:1,
synd_precoder:1,
synd_post:1;
uint32_t ncb:16,
k0:16;
uint32_t rm_e:24,
hcin_en:1,
hcout_en:1,
crc_select:1,
bypass_dec:1,
bypass_intlv:1,
so_en:1,
so_bypass_rm:1,
so_bypass_intlv:1;
uint32_t hcin_offset:16,
hcin_size0:16;
uint32_t hcin_size1:16,
hcin_decomp_mode:3,
llr_pack_mode:1,
hcout_comp_mode:3,
res2:1,
dec_convllr:4,
hcout_convllr:4;
uint32_t itmax:7,
itstop:1,
so_it:7,
res3:1,
hcout_offset:16;
uint32_t hcout_size0:16,
hcout_size1:16;
uint32_t gain_i:8,
gain_h:8,
negstop_th:16;
uint32_t negstop_it:7,
negstop_en:1,
res4:24;
};
/* FEC 4G Downlink Frame Control Word */
struct __rte_packed acc100_fcw_te {
uint16_t k_neg;
uint16_t k_pos;
uint8_t c_neg;
uint8_t c;
uint8_t filler;
uint8_t cab;
uint32_t ea:17,
rsrvd0:15;
uint32_t eb:17,
rsrvd1:15;
uint16_t ncb_neg;
uint16_t ncb_pos;
uint8_t rv_idx0:2,
rsrvd2:2,
rv_idx1:2,
rsrvd3:2;
uint8_t bypass_rv_idx0:1,
bypass_rv_idx1:1,
bypass_rm:1,
rsrvd4:5;
uint8_t rsrvd5:1,
rsrvd6:3,
code_block_crc:1,
rsrvd7:3;
uint8_t code_block_mode:1,
rsrvd8:7;
uint64_t rsrvd9;
};
/* FEC 5GNR Downlink Frame Control Word */
struct __rte_packed acc100_fcw_le {
uint32_t FCWversion:4,
qm:4,
nfiller:11,
BG:1,
Zc:9,
res0:3;
uint32_t ncb:16,
k0:16;
uint32_t rm_e:24,
res1:2,
crc_select:1,
res2:1,
bypass_intlv:1,
res3:3;
uint32_t res4_a:12,
mcb_count:3,
res4_b:17;
uint32_t res5;
uint32_t res6;
uint32_t res7;
uint32_t res8;
};
/* ACC100 DMA Request Descriptor */
struct __rte_packed acc100_dma_req_desc {
union {
struct{
uint32_t type:4,
rsrvd0:26,
sdone:1,
fdone:1;
uint32_t rsrvd1;
uint32_t rsrvd2;
uint32_t pass_param:8,
sdone_enable:1,
irq_enable:1,
timeStampEn:1,
res0:5,
numCBs:4,
res1:4,
m2dlen:4,
d2mlen:4;
};
struct{
uint32_t word0;
uint32_t word1;
uint32_t word2;
uint32_t word3;
};
};
struct acc100_dma_triplet data_ptrs[ACC100_DMA_MAX_NUM_POINTERS];
/* Virtual addresses used to retrieve SW context info */
union {
void *op_addr;
uint64_t pad1; /* pad to 64 bits */
};
/*
* Stores additional information needed for driver processing:
* - last_desc_in_batch - flag used to mark last descriptor (CB)
* in batch
* - cbs_in_tb - stores information about total number of Code Blocks
* in currently processed Transport Block
*/
union {
struct {
union {
struct acc100_fcw_ld fcw_ld;
struct acc100_fcw_td fcw_td;
struct acc100_fcw_le fcw_le;
struct acc100_fcw_te fcw_te;
uint32_t pad2[ACC100_FCW_PADDING];
};
uint32_t last_desc_in_batch :8,
cbs_in_tb:8,
pad4 : 16;
};
uint64_t pad3[ACC100_DMA_DESC_PADDING]; /* pad to 64 bits */
};
};
/* ACC100 DMA Descriptor */
union acc100_dma_desc {
struct acc100_dma_req_desc req;
union acc100_dma_rsp_desc rsp;
uint64_t atom_hdr;
};
/* Union describing Info Ring entry */
union acc100_harq_layout_data {
uint32_t val;
struct {
uint16_t offset;
uint16_t size0;
};
} __rte_packed;
/* Union describing Info Ring entry */
union acc100_info_ring_data {
uint32_t val;
struct {
union {
uint16_t detailed_info;
struct {
uint16_t aq_id: 4;
uint16_t qg_id: 4;
uint16_t vf_id: 6;
uint16_t reserved: 2;
};
};
uint16_t int_nb: 7;
uint16_t msi_0: 1;
uint16_t vf2pf: 6;
uint16_t loop: 1;
uint16_t valid: 1;
};
} __rte_packed;
struct acc100_registry_addr {
unsigned int dma_ring_dl5g_hi;
unsigned int dma_ring_dl5g_lo;
unsigned int dma_ring_ul5g_hi;
unsigned int dma_ring_ul5g_lo;
unsigned int dma_ring_dl4g_hi;
unsigned int dma_ring_dl4g_lo;
unsigned int dma_ring_ul4g_hi;
unsigned int dma_ring_ul4g_lo;
unsigned int ring_size;
unsigned int info_ring_hi;
unsigned int info_ring_lo;
unsigned int info_ring_en;
unsigned int info_ring_ptr;
unsigned int tail_ptrs_dl5g_hi;
unsigned int tail_ptrs_dl5g_lo;
unsigned int tail_ptrs_ul5g_hi;
unsigned int tail_ptrs_ul5g_lo;
unsigned int tail_ptrs_dl4g_hi;
unsigned int tail_ptrs_dl4g_lo;
unsigned int tail_ptrs_ul4g_hi;
unsigned int tail_ptrs_ul4g_lo;
unsigned int depth_log0_offset;
unsigned int depth_log1_offset;
unsigned int qman_group_func;
unsigned int ddr_range;
};
/* Structure holding registry addresses for PF */
static const struct acc100_registry_addr pf_reg_addr = {
.dma_ring_dl5g_hi = HWPfDmaFec5GdlDescBaseHiRegVf,
.dma_ring_dl5g_lo = HWPfDmaFec5GdlDescBaseLoRegVf,
.dma_ring_ul5g_hi = HWPfDmaFec5GulDescBaseHiRegVf,
.dma_ring_ul5g_lo = HWPfDmaFec5GulDescBaseLoRegVf,
.dma_ring_dl4g_hi = HWPfDmaFec4GdlDescBaseHiRegVf,
.dma_ring_dl4g_lo = HWPfDmaFec4GdlDescBaseLoRegVf,
.dma_ring_ul4g_hi = HWPfDmaFec4GulDescBaseHiRegVf,
.dma_ring_ul4g_lo = HWPfDmaFec4GulDescBaseLoRegVf,
.ring_size = HWPfQmgrRingSizeVf,
.info_ring_hi = HWPfHiInfoRingBaseHiRegPf,
.info_ring_lo = HWPfHiInfoRingBaseLoRegPf,
.info_ring_en = HWPfHiInfoRingIntWrEnRegPf,
.info_ring_ptr = HWPfHiInfoRingPointerRegPf,
.tail_ptrs_dl5g_hi = HWPfDmaFec5GdlRespPtrHiRegVf,
.tail_ptrs_dl5g_lo = HWPfDmaFec5GdlRespPtrLoRegVf,
.tail_ptrs_ul5g_hi = HWPfDmaFec5GulRespPtrHiRegVf,
.tail_ptrs_ul5g_lo = HWPfDmaFec5GulRespPtrLoRegVf,
.tail_ptrs_dl4g_hi = HWPfDmaFec4GdlRespPtrHiRegVf,
.tail_ptrs_dl4g_lo = HWPfDmaFec4GdlRespPtrLoRegVf,
.tail_ptrs_ul4g_hi = HWPfDmaFec4GulRespPtrHiRegVf,
.tail_ptrs_ul4g_lo = HWPfDmaFec4GulRespPtrLoRegVf,
.depth_log0_offset = HWPfQmgrGrpDepthLog20Vf,
.depth_log1_offset = HWPfQmgrGrpDepthLog21Vf,
.qman_group_func = HWPfQmgrGrpFunction0,
.ddr_range = HWPfDmaVfDdrBaseRw,
};
/* Structure holding registry addresses for VF */
static const struct acc100_registry_addr vf_reg_addr = {
.dma_ring_dl5g_hi = HWVfDmaFec5GdlDescBaseHiRegVf,
.dma_ring_dl5g_lo = HWVfDmaFec5GdlDescBaseLoRegVf,
.dma_ring_ul5g_hi = HWVfDmaFec5GulDescBaseHiRegVf,
.dma_ring_ul5g_lo = HWVfDmaFec5GulDescBaseLoRegVf,
.dma_ring_dl4g_hi = HWVfDmaFec4GdlDescBaseHiRegVf,
.dma_ring_dl4g_lo = HWVfDmaFec4GdlDescBaseLoRegVf,
.dma_ring_ul4g_hi = HWVfDmaFec4GulDescBaseHiRegVf,
.dma_ring_ul4g_lo = HWVfDmaFec4GulDescBaseLoRegVf,
.ring_size = HWVfQmgrRingSizeVf,
.info_ring_hi = HWVfHiInfoRingBaseHiVf,
.info_ring_lo = HWVfHiInfoRingBaseLoVf,
.info_ring_en = HWVfHiInfoRingIntWrEnVf,
.info_ring_ptr = HWVfHiInfoRingPointerVf,
.tail_ptrs_dl5g_hi = HWVfDmaFec5GdlRespPtrHiRegVf,
.tail_ptrs_dl5g_lo = HWVfDmaFec5GdlRespPtrLoRegVf,
.tail_ptrs_ul5g_hi = HWVfDmaFec5GulRespPtrHiRegVf,
.tail_ptrs_ul5g_lo = HWVfDmaFec5GulRespPtrLoRegVf,
.tail_ptrs_dl4g_hi = HWVfDmaFec4GdlRespPtrHiRegVf,
.tail_ptrs_dl4g_lo = HWVfDmaFec4GdlRespPtrLoRegVf,
.tail_ptrs_ul4g_hi = HWVfDmaFec4GulRespPtrHiRegVf,
.tail_ptrs_ul4g_lo = HWVfDmaFec4GulRespPtrLoRegVf,
.depth_log0_offset = HWVfQmgrGrpDepthLog20Vf,
.depth_log1_offset = HWVfQmgrGrpDepthLog21Vf,
.qman_group_func = HWVfQmgrGrpFunction0Vf,
.ddr_range = HWVfDmaDdrBaseRangeRoVf,
};
/* Structure associated with each queue. */
struct __rte_cache_aligned acc100_queue {
union acc100_dma_desc *ring_addr; /* Virtual address of sw ring */
rte_iova_t ring_addr_iova; /* IOVA address of software ring */
uint32_t sw_ring_head; /* software ring head */
uint32_t sw_ring_tail; /* software ring tail */
/* software ring size (descriptors, not bytes) */
uint32_t sw_ring_depth;
/* mask used to wrap enqueued descriptors on the sw ring */
uint32_t sw_ring_wrap_mask;
/* MMIO register used to enqueue descriptors */
void *mmio_reg_enqueue;
uint8_t vf_id; /* VF ID (max = 63) */
uint8_t qgrp_id; /* Queue Group ID */
uint16_t aq_id; /* Atomic Queue ID */
uint16_t aq_depth; /* Depth of atomic queue */
uint32_t aq_enqueued; /* Count how many "batches" have been enqueued */
uint32_t aq_dequeued; /* Count how many "batches" have been dequeued */
uint32_t irq_enable; /* Enable ops dequeue interrupts if set to 1 */
struct rte_mempool *fcw_mempool; /* FCW mempool */
enum rte_bbdev_op_type op_type; /* Type of this Queue: TE or TD */
/* Internal Buffers for loopback input */
uint8_t *lb_in;
uint8_t *lb_out;
rte_iova_t lb_in_addr_iova;
rte_iova_t lb_out_addr_iova;
struct acc100_device *d;
};
/* Private data structure for each ACC100 device */
struct acc100_device {
void *mmio_base; /**< Base address of MMIO registers (BAR0) */
void *sw_rings_base; /* Base addr of un-aligned memory for sw rings */
void *sw_rings; /* 64MBs of 64MB aligned memory for sw rings */
rte_iova_t sw_rings_iova; /* IOVA address of sw_rings */
/* Virtual address of the info memory routed to the this function under
* operation, whether it is PF or VF.
* HW may DMA information data at this location asynchronously
*/
union acc100_info_ring_data *info_ring;
union acc100_harq_layout_data *harq_layout;
/* Virtual Info Ring head */
uint16_t info_ring_head;
/* Number of bytes available for each queue in device, depending on
* how many queues are enabled with configure()
*/
uint32_t sw_ring_size;
uint32_t ddr_size; /* Size in kB */
uint32_t *tail_ptrs; /* Base address of response tail pointer buffer */
rte_iova_t tail_ptr_iova; /* IOVA address of tail pointers */
/* Max number of entries available for each queue in device, depending
* on how many queues are enabled with configure()
*/
uint32_t sw_ring_max_depth;
struct rte_acc100_conf acc100_conf; /* ACC100 Initial configuration */
/* Bitmap capturing which Queues have already been assigned */
uint16_t q_assigned_bit_map[ACC100_NUM_QGRPS];
bool pf_device; /**< True if this is a PF ACC100 device */
bool configured; /**< True if this ACC100 device is configured */
};
/**
* Structure with details about RTE_BBDEV_EVENT_DEQUEUE event. It's passed to
* the callback function.
*/
struct acc100_deq_intr_details {
uint16_t queue_id;
};
#endif /* _RTE_ACC100_PMD_H_ */