#include <stdlib.h>
#include <string.h>

#include <cassert>
#include <iostream>

#include "i40e_bm.h"
#include "i40e_base_wrapper.h"

using namespace i40e;

extern nicbm::Runner *runner;

lan::lan(i40e_bm &dev_, size_t num_qs_) : dev(dev_), num_qs(num_qs_) {
  rxqs = new lan_queue_rx *[num_qs];
  txqs = new lan_queue_tx *[num_qs];

  for (size_t i = 0; i < num_qs; i++) {
    rxqs[i] = new lan_queue_rx(*this, dev.regs.qrx_tail[i], i,
                               dev.regs.qrx_ena[i], dev.regs.glhmc_lanrxbase[0],
                               dev.regs.qint_rqctl[i]);
    txqs[i] = new lan_queue_tx(*this, dev.regs.qtx_tail[i], i,
                               dev.regs.qtx_ena[i], dev.regs.glhmc_lantxbase[0],
                               dev.regs.qint_tqctl[i]);
  }
}

void lan::reset() {
  for (size_t i = 0; i < num_qs; i++) {
    rxqs[i]->reset();
    txqs[i]->reset();
  }
}

void lan::qena_updated(uint16_t idx, bool rx) {
  std::cerr << "lan: qena updated idx=" << idx << " rx=" << rx << std::endl;
  uint32_t &reg = (rx ? dev.regs.qrx_ena[idx] : dev.regs.qtx_ena[idx]);
  lan_queue_base &q = (rx ? static_cast<lan_queue_base &>(*rxqs[idx])
                          : static_cast<lan_queue_base &>(*txqs[idx]));

  if ((reg & I40E_QRX_ENA_QENA_REQ_MASK) && !q.is_enabled()) {
    q.enable();
  } else if (!(reg & I40E_QRX_ENA_QENA_REQ_MASK) && q.is_enabled()) {
    q.disable();
  }
}

void lan::tail_updated(uint16_t idx, bool rx) {
  std::cerr << "lan: tail updated idx=" << idx << " rx=" << rx << std::endl;
  lan_queue_base &q = (rx ? static_cast<lan_queue_base &>(*rxqs[idx])
                          : static_cast<lan_queue_base &>(*txqs[idx]));
  if (q.is_enabled())
    q.reg_updated();
}

void lan::packet_received(const void *data, size_t len) {
  std::cerr << "lan: packet received len=" << len << std::endl;
  // TODO: steering
  rxqs[0]->packet_received(data, len);
}

lan_queue_base::lan_queue_base(lan &lanmgr_, uint32_t &reg_tail_, size_t idx_,
                               uint32_t &reg_ena_, uint32_t &fpm_basereg_,
                               uint32_t &reg_intqctl_, uint16_t ctx_size_)
    : queue_base(reg_dummy_head, reg_tail_),
      lanmgr(lanmgr_),
      enabling(false),
      idx(idx_),
      reg_ena(reg_ena_),
      fpm_basereg(fpm_basereg_),
      reg_intqctl(reg_intqctl_),
      ctx_size(ctx_size_) {
  ctx = new uint8_t[ctx_size_];
}

void lan_queue_base::reset() {
  enabling = false;
  queue_base::reset();
}

void lan_queue_base::enable() {
  if (enabling || enabled)
    return;

  std::cerr << "lan enabling queue " << idx << std::endl;
  enabling = true;

  // fetch the queue context from host memory: the FPM base register gives the
  // function-private base in 512-byte units, with ctx_size bytes per queue
  qctx_fetch *qf = new qctx_fetch(*this);
  qf->write = false;
  qf->dma_addr = ((fpm_basereg & I40E_GLHMC_LANTXBASE_FPMLANTXBASE_MASK) >>
                  I40E_GLHMC_LANTXBASE_FPMLANTXBASE_SHIFT) *
                 512;
  qf->dma_addr += ctx_size * idx;
  qf->len = ctx_size;
  qf->data = ctx;
  lanmgr.dev.hmc.issue_mem_op(*qf);
}

void lan_queue_base::ctx_fetched() {
  std::cerr << "lan ctx fetched " << idx << std::endl;

  initialize();

  enabling = false;
  enabled = true;
  reg_ena |= I40E_QRX_ENA_QENA_STAT_MASK;

  reg_updated();
}

void lan_queue_base::disable() {
  std::cerr << "lan disabling queue " << idx << std::endl;
  enabled = false;
  // TODO: write back
  reg_ena &= ~I40E_QRX_ENA_QENA_STAT_MASK;
}

void lan_queue_base::interrupt() {
  uint32_t qctl = reg_intqctl;
  std::cerr << "lanq: interrupt intctl=" << qctl << std::endl;
  uint16_t msix_idx = (qctl & I40E_QINT_TQCTL_MSIX_INDX_MASK) >>
                      I40E_QINT_TQCTL_MSIX_INDX_SHIFT;
  uint8_t msix0_idx = (qctl & I40E_QINT_TQCTL_MSIX0_INDX_MASK) >>
                      I40E_QINT_TQCTL_MSIX0_INDX_SHIFT;
  bool cause_ena = !!(qctl & I40E_QINT_TQCTL_CAUSE_ENA_MASK);

  if (!cause_ena) {
    std::cerr << "lanq: interrupt cause disabled" << std::endl;
    return;
  }

  if (msix_idx != 0) {
    std::cerr << "TODO: only int 0 is supported" << std::endl;
    abort();
  }

  // TODO: throttling?
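  // report the queue as an interrupt cause in PFINT_ICR0 and raise MSI
  // vector 0 (per-queue MSI-X vectors other than 0 are rejected above)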
std::cerr << " setting int0.qidx=" << msix0_idx << std::endl; lanmgr.dev.regs.pfint_icr0 |= I40E_PFINT_ICR0_INTEVENT_MASK | (1 << (I40E_PFINT_ICR0_QUEUE_0_SHIFT + msix0_idx)); runner->msi_issue(0); } lan_queue_base::qctx_fetch::qctx_fetch(lan_queue_base &lq_) : lq(lq_) { } void lan_queue_base::qctx_fetch::done() { lq.ctx_fetched(); delete this; } lan_queue_rx::lan_queue_rx(lan &lanmgr_, uint32_t ®_tail_, size_t idx_, uint32_t ®_ena_, uint32_t ®_fpmbase_, uint32_t ®_intqctl_) : lan_queue_base(lanmgr_, reg_tail_, idx_, reg_ena_, reg_fpmbase_, reg_intqctl_, 32), dcache_first_idx(0), dcache_first_pos(0), dcache_first_cnt(0) { } void lan_queue_rx::reset() { dcache_first_idx = 0; dcache_first_pos = 0; dcache_first_cnt = 0; queue_base::reset(); } void lan_queue_rx::initialize() { std::cerr << "lan_queue_rx::initialize()" << std::endl; uint8_t *ctx_p = reinterpret_cast(ctx); uint16_t *head_p = reinterpret_cast(ctx_p + 0); uint64_t *base_p = reinterpret_cast(ctx_p + 4); uint16_t *qlen_p = reinterpret_cast(ctx_p + 11); uint16_t *dbsz_p = reinterpret_cast(ctx_p + 12); uint16_t *hbsz_p = reinterpret_cast(ctx_p + 13); uint32_t *rxmax_p = reinterpret_cast(ctx_p + 21); reg_dummy_head = (*head_p) & ((1 << 13) - 1); base = ((*base_p) & ((1ULL << 57) - 1)) * 128; len = (*qlen_p >> 1) & ((1 << 13) - 1); dbuff_size = (((*dbsz_p) >> 6) & ((1 << 7) - 1)) * 128; hbuff_size = (((*hbsz_p) >> 5) & ((1 << 5) - 1)) * 64; uint8_t dtype = ((*hbsz_p) >> 10) & ((1 << 2) - 1); bool longdesc = !!(((*hbsz_p) >> 12) & 0x1); desc_len = (longdesc ? 32 : 16); crc_strip = !!(((*hbsz_p) >> 13) & 0x1); rxmax = (((*rxmax_p) >> 6) & ((1 << 14) - 1)) * 128; if (!longdesc) { std::cerr << "lan_queue_rx::initialize: currently only 32B descs " " supported" << std::endl; abort(); } if (dtype != 0) { std::cerr << "lan_queue_rx::initialize: no header split supported" << std::endl; abort(); } std::cerr << " head=" << reg_dummy_head << " base=" << base << " len=" << len << " dbsz=" << dbuff_size << " hbsz=" << hbuff_size << " dtype=" << (unsigned) dtype << " longdesc=" << longdesc << " crcstrip=" << crc_strip << " rxmax=" << rxmax << std::endl; } uint32_t lan_queue_rx::max_fetch_capacity() { return DCACHE_SIZE - dcache_first_cnt; } void lan_queue_rx::desc_fetched(void *desc_ptr, uint32_t didx) { std::cerr << "rxq: desc fetched" << std::endl; union i40e_32byte_rx_desc *desc = reinterpret_cast (desc_ptr); assert(dcache_first_cnt < DCACHE_SIZE); std::cerr << " idx=" << dcache_first_idx << " cnt=" << dcache_first_cnt << " didx=" << didx << std::endl; assert((dcache_first_idx + dcache_first_cnt) % len == didx); uint16_t dci = (dcache_first_pos + dcache_first_cnt) % DCACHE_SIZE; dcache[dci].buf = desc->read.pkt_addr; dcache[dci].hbuf = desc->read.hdr_addr; dcache_first_cnt++; } void lan_queue_rx::data_fetched(void *desc, uint32_t didx, void *data) { std::cerr << "rxq: data fetched" << std::endl; } void lan_queue_rx::packet_received(const void *data, size_t pktlen) { if (dcache_first_cnt == 0) { std::cerr << "rqx: empty, dropping packet" << std::endl; return; } std::cerr << "rxq: packet received" << std::endl; union i40e_32byte_rx_desc rxd; memset(&rxd, 0, sizeof(rxd)); rxd.wb.qword1.status_error_len |= (1 << I40E_RX_DESC_STATUS_DD_SHIFT); rxd.wb.qword1.status_error_len |= (1 << I40E_RX_DESC_STATUS_EOF_SHIFT); // TODO: only if checksums are correct rxd.wb.qword1.status_error_len |= (1 << I40E_RX_DESC_STATUS_L3L4P_SHIFT); rxd.wb.qword1.status_error_len |= (pktlen << I40E_RXD_QW1_LENGTH_PBUF_SHIFT); desc_writeback_indirect(&rxd, dcache_first_idx, 
  desc_writeback_indirect(&rxd, dcache_first_idx,
                          dcache[dcache_first_pos].buf, data, pktlen);

  // advance the head of the descriptor cache ring
  dcache_first_pos = (dcache_first_pos + 1) % DCACHE_SIZE;
  dcache_first_idx = (dcache_first_idx + 1) % len;
  dcache_first_cnt--;
}

lan_queue_tx::lan_queue_tx(lan &lanmgr_, uint32_t &reg_tail_, size_t idx_,
                           uint32_t &reg_ena_, uint32_t &reg_fpmbase_,
                           uint32_t &reg_intqctl)
    : lan_queue_base(lanmgr_, reg_tail_, idx_, reg_ena_, reg_fpmbase_,
                     reg_intqctl, 128) {
  desc_len = 16;
}

void lan_queue_tx::initialize() {
  std::cerr << "lan_queue_tx::initialize()" << std::endl;
  uint8_t *ctx_p = reinterpret_cast<uint8_t *>(ctx);

  uint16_t *head_p = reinterpret_cast<uint16_t *>(ctx_p + 0);
  uint64_t *base_p = reinterpret_cast<uint64_t *>(ctx_p + 4);
  uint16_t *hwb_qlen_p = reinterpret_cast<uint16_t *>(ctx_p + 20);
  uint64_t *hwb_addr_p = reinterpret_cast<uint64_t *>(ctx_p + 24);

  // decode the bit-packed tx queue context fetched from the HMC
  reg_dummy_head = (*head_p) & ((1 << 13) - 1);
  base = ((*base_p) & ((1ULL << 57) - 1)) * 128;
  len = ((*hwb_qlen_p) >> 1) & ((1 << 13) - 1);
  hwb = !!(*hwb_qlen_p & (1 << 0));
  hwb_addr = *hwb_addr_p;

  std::cerr << " head=" << reg_dummy_head << " base=" << base
            << " len=" << len << " hwb=" << hwb << " hwb_addr=" << hwb_addr
            << std::endl;
}

void lan_queue_tx::desc_fetched(void *desc_buf, uint32_t didx) {
  std::cerr << "txq: desc fetched" << std::endl;
  struct i40e_tx_desc *desc = reinterpret_cast<struct i40e_tx_desc *>(desc_buf);
  uint64_t d1 = desc->cmd_type_offset_bsz;

  uint8_t dtype = (d1 & I40E_TXD_QW1_DTYPE_MASK) >> I40E_TXD_QW1_DTYPE_SHIFT;
  if (dtype == I40E_TX_DESC_DTYPE_DATA) {
    uint16_t len =
        (d1 & I40E_TXD_QW1_TX_BUF_SZ_MASK) >> I40E_TXD_QW1_TX_BUF_SZ_SHIFT;

    std::cerr << " bufaddr=" << desc->buffer_addr << " len=" << len
              << std::endl;

    data_fetch(desc_buf, didx, desc->buffer_addr, len);
  } else if (dtype == I40E_TX_DESC_DTYPE_CONTEXT) {
    struct i40e_tx_context_desc *ctxd =
        reinterpret_cast<struct i40e_tx_context_desc *>(desc_buf);

    std::cerr << " context descriptor: tp=" << ctxd->tunneling_params
              << " l2t=" << ctxd->l2tag2 << " tctm=" << ctxd->type_cmd_tso_mss
              << std::endl;
    // context descriptors (e.g. for TSO) are not implemented yet
    abort();

    desc->buffer_addr = 0;
    desc->cmd_type_offset_bsz = I40E_TX_DESC_DTYPE_DESC_DONE
                                << I40E_TXD_QW1_DTYPE_SHIFT;
    desc_writeback(desc_buf, didx);
  } else {
    std::cerr << "txq: only support context & data descriptors" << std::endl;
    abort();
  }
}

void lan_queue_tx::data_fetched(void *desc_buf, uint32_t didx, void *data) {
  std::cerr << "txq: data fetched" << std::endl;
  struct i40e_tx_desc *desc = reinterpret_cast<struct i40e_tx_desc *>(desc_buf);
  uint64_t d1 = desc->cmd_type_offset_bsz;

  uint16_t pkt_len =
      (d1 & I40E_TXD_QW1_TX_BUF_SZ_MASK) >> I40E_TXD_QW1_TX_BUF_SZ_SHIFT;

  uint16_t cmd = (d1 & I40E_TXD_QW1_CMD_MASK) >> I40E_TXD_QW1_CMD_SHIFT;
  bool eop = (cmd & I40E_TX_DESC_CMD_EOP);
  uint16_t iipt = cmd & (I40E_TX_DESC_CMD_IIPT_MASK);
  uint16_t l4t = (cmd & I40E_TX_DESC_CMD_L4T_EOFT_MASK);

  uint32_t off = (d1 & I40E_TXD_QW1_OFFSET_MASK) >> I40E_TXD_QW1_OFFSET_SHIFT;
  uint16_t maclen =
      ((off & I40E_TXD_QW1_MACLEN_MASK) >> I40E_TX_DESC_LENGTH_MACLEN_SHIFT) *
      2;
  uint16_t iplen =
      ((off & I40E_TXD_QW1_IPLEN_MASK) >> I40E_TX_DESC_LENGTH_IPLEN_SHIFT) * 4;
  /*uint16_t l4len = (off & I40E_TXD_QW1_L4LEN_MASK) >>
                     I40E_TX_DESC_LENGTH_L4_FC_LEN_SHIFT;*/

  // part of a multi-descriptor packet: accumulate the segments in pktbuf
  if (!eop || pktbuf_len != 0) {
    if (pktbuf_len + pkt_len > MTU) {
      std::cerr << "multi desc packet longer than MTU pbl=" << pktbuf_len
                << " len=" << pkt_len << std::endl;
      abort();
    }

    memcpy(pktbuf + pktbuf_len, data, pkt_len);
    pktbuf_len += pkt_len;

    if (!eop) {
      // not done yet
      goto writeback;
    }

    data = pktbuf;
    pkt_len = pktbuf_len;
  }

  if (l4t == I40E_TX_DESC_CMD_L4T_EOFT_TCP) {
    // TCP checksum offload: fill in the checksum of the TCP segment
    uint16_t tcp_off = maclen + iplen;
    xsum_tcp((uint8_t *)data + tcp_off, pkt_len - tcp_off);
  }
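  // hand the assembled frame to the runner for transmission on the simulated
  // link and release the accumulation buffer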
l4t << " maclen=" << maclen << " iplen=" << iplen<< std::endl; runner->eth_send(data, pkt_len); pktbuf_len = 0; writeback: desc->buffer_addr = 0; desc->cmd_type_offset_bsz = I40E_TX_DESC_DTYPE_DESC_DONE << I40E_TXD_QW1_DTYPE_SHIFT; desc_writeback(desc_buf, didx); } void lan_queue_tx::desc_writeback(const void *desc, uint32_t didx) { if (!hwb) { // if head index writeback is disabled we need to write descriptor back lan_queue_base::desc_writeback(desc, idx); } else { // else we just need to write the index back dma_hwb *dma = new dma_hwb(*this, didx, (didx + 1) % len); dma->dma_addr = hwb_addr; std::cerr << "hwb=" << *((uint32_t *) dma->data) << std::endl; runner->issue_dma(*dma); } } lan_queue_tx::dma_hwb::dma_hwb(lan_queue_tx &queue_, uint32_t index_, uint32_t next) : queue(queue_), head(index_), next_head(next) { data = &next_head; len = 4; write = true; } lan_queue_tx::dma_hwb::~dma_hwb() { } void lan_queue_tx::dma_hwb::done() { std::cerr << "txq: tx head written back" << std::endl; queue.desc_written_back(head); delete this; }