"examples/inference/run_text_generation_server_345M.sh" did not exist on "ef59b68720a787eebbc7bbf186f333f807aaf02e"
i40e_lan.cc 14 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
#include <stdlib.h>
#include <string.h>
#include <cassert>
#include <iostream>

#include "i40e_bm.h"

#include "i40e_base_wrapper.h"

using namespace i40e;

extern nicbm::Runner *runner;

lan::lan(i40e_bm &dev_, size_t num_qs_)
15
    : dev(dev_), log("lan"), num_qs(num_qs_)
16
{
17
18
19
20
21
    rxqs = new lan_queue_rx *[num_qs];
    txqs = new lan_queue_tx *[num_qs];

    for (size_t i = 0; i < num_qs; i++) {
        rxqs[i] = new lan_queue_rx(*this, dev.regs.qrx_tail[i], i,
22
23
                dev.regs.qrx_ena[i], dev.regs.glhmc_lanrxbase[0],
                dev.regs.qint_rqctl[i]);
24
        txqs[i] = new lan_queue_tx(*this, dev.regs.qtx_tail[i], i,
25
26
                dev.regs.qtx_ena[i], dev.regs.glhmc_lantxbase[0],
                dev.regs.qint_tqctl[i]);
27
    }
28
29
}

30
31
32
33
34
35
36
37
void lan::reset()
{
    for (size_t i = 0; i < num_qs; i++) {
        rxqs[i]->reset();
        txqs[i]->reset();
    }
}

38
39
void lan::qena_updated(uint16_t idx, bool rx)
{
40
#ifdef DEBUG_LAN
41
    log << " qena updated idx=" << idx << " rx=" << rx << logger::endl;
42
#endif
43
44
45
46
47
48
49
50
51
    uint32_t &reg = (rx ? dev.regs.qrx_ena[idx] : dev.regs.qtx_ena[idx]);
    lan_queue_base &q = (rx ? static_cast<lan_queue_base &>(*rxqs[idx]) :
        static_cast<lan_queue_base &>(*txqs[idx]));

    if ((reg & I40E_QRX_ENA_QENA_REQ_MASK) && !q.is_enabled()) {
        q.enable();
    } else if (!(reg & I40E_QRX_ENA_QENA_REQ_MASK) && q.is_enabled()) {
        q.disable();
    }
52
53
54
55
}

void lan::tail_updated(uint16_t idx, bool rx)
{
56
#ifdef DEBUG_LAN
57
    log << " tail updated idx=" << idx << " rx=" << rx << logger::endl;
58
#endif
59
60
61
62
63
64
65
66

    lan_queue_base &q = (rx ? static_cast<lan_queue_base &>(*rxqs[idx]) :
        static_cast<lan_queue_base &>(*txqs[idx]));

    if (q.is_enabled())
        q.reg_updated();
}

67
68
void lan::packet_received(const void *data, size_t len)
{
69
#ifdef DEBUG_LAN
70
    log << " packet received len=" << len << logger::endl;
71
#endif
72
73
74
75
76

    // TODO: steering
    rxqs[0]->packet_received(data, len);
}

77
78
lan_queue_base::lan_queue_base(lan &lanmgr_, const std::string &qtype,
        uint32_t &reg_tail_, size_t idx_,
79
80
        uint32_t &reg_ena_, uint32_t &fpm_basereg_, uint32_t &reg_intqctl_,
        uint16_t ctx_size_)
81
82
    : queue_base(qtype + std::to_string(idx_), reg_dummy_head, reg_tail_),
    lanmgr(lanmgr_), enabling(false),
83
    idx(idx_), reg_ena(reg_ena_), fpm_basereg(fpm_basereg_),
84
    reg_intqctl(reg_intqctl_), ctx_size(ctx_size_)
85
86
87
88
{
    ctx = new uint8_t[ctx_size_];
}

89
90
91
92
93
94
void lan_queue_base::reset()
{
    enabling = false;
    queue_base::reset();
}

95
96
97
98
99
void lan_queue_base::enable()
{
    if (enabling || enabled)
        return;

100
#ifdef DEBUG_LAN
101
    log << " lan enabling queue " << idx << logger::endl;
102
#endif
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
    enabling = true;

    qctx_fetch *qf = new qctx_fetch(*this);
    qf->write = false;
    qf->dma_addr = ((fpm_basereg & I40E_GLHMC_LANTXBASE_FPMLANTXBASE_MASK) >>
        I40E_GLHMC_LANTXBASE_FPMLANTXBASE_SHIFT) * 512;
    qf->dma_addr += ctx_size * idx;
    qf->len = ctx_size;
    qf->data = ctx;

    lanmgr.dev.hmc.issue_mem_op(*qf);
}

void lan_queue_base::ctx_fetched()
{
118
#ifdef DEBUG_LAN
119
    log << " lan ctx fetched " << idx << logger::endl;
120
#endif
121
122
123
124
125
126
127
128
129
130
131
132

    initialize();

    enabling = false;
    enabled = true;
    reg_ena |= I40E_QRX_ENA_QENA_STAT_MASK;

    reg_updated();
}

void lan_queue_base::disable()
{
133
#ifdef DEBUG_LAN
134
    log << " lan disabling queue " << idx << logger::endl;
135
#endif
136
137
138
139
140
    enabled = false;
    // TODO: write back
    reg_ena &= ~I40E_QRX_ENA_QENA_STAT_MASK;
}

141
142
143
void lan_queue_base::interrupt()
{
    uint32_t qctl = reg_intqctl;
144
#ifdef DEBUG_LAN
145
    log << " interrupt intctl=" << qctl << logger::endl;
146
#endif
147
148
149
150
151
152
153
154

    uint16_t msix_idx = (qctl & I40E_QINT_TQCTL_MSIX_INDX_MASK) >>
        I40E_QINT_TQCTL_ITR_INDX_SHIFT;
    uint8_t msix0_idx = (qctl & I40E_QINT_TQCTL_MSIX0_INDX_MASK) >>
        I40E_QINT_TQCTL_MSIX0_INDX_SHIFT;
    bool cause_ena = !!(qctl & I40E_QINT_TQCTL_CAUSE_ENA_MASK);

    if (!cause_ena) {
155
#ifdef DEBUG_LAN
156
        log << " interrupt cause disabled" << logger::endl;
157
#endif
158
159
160
161
        return;
    }

    if (msix_idx != 0) {
162
        log << "TODO: only int 0 is supported" << logger::endl;
163
164
165
166
        abort();
    }

    // TODO throttling?
167
#ifdef DEBUG_LAN
168
    log << "   setting int0.qidx=" << msix0_idx << logger::endl;
169
#endif
170
171
172
173
174
    lanmgr.dev.regs.pfint_icr0 |= I40E_PFINT_ICR0_INTEVENT_MASK |
        (1 << (I40E_PFINT_ICR0_QUEUE_0_SHIFT + msix0_idx));
    runner->msi_issue(0);
}

175
176
177
178
179
180
181
182
183
184
185
186
lan_queue_base::qctx_fetch::qctx_fetch(lan_queue_base &lq_)
    : lq(lq_)
{
}

void lan_queue_base::qctx_fetch::done()
{
    lq.ctx_fetched();
    delete this;
}

lan_queue_rx::lan_queue_rx(lan &lanmgr_, uint32_t &reg_tail_, size_t idx_,
187
        uint32_t &reg_ena_, uint32_t &reg_fpmbase_, uint32_t &reg_intqctl_)
188
    : lan_queue_base(lanmgr_, "rxq", reg_tail_, idx_, reg_ena_, reg_fpmbase_,
189
            reg_intqctl_, 32)
190
{
191
192
193
    // use larger value for initialization
    desc_len = 32;
    ctxs_init();
194
195
}

196
197
void lan_queue_rx::reset()
{
198
    dcache.clear();
199
200
201
    queue_base::reset();
}

202
203
void lan_queue_rx::initialize()
{
204
#ifdef DEBUG_LAN
205
    log << " initialize()" << logger::endl;
206
#endif
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
    uint8_t *ctx_p = reinterpret_cast<uint8_t *>(ctx);

    uint16_t *head_p = reinterpret_cast<uint16_t *>(ctx_p + 0);
    uint64_t *base_p = reinterpret_cast<uint64_t *>(ctx_p + 4);
    uint16_t *qlen_p = reinterpret_cast<uint16_t *>(ctx_p + 11);
    uint16_t *dbsz_p = reinterpret_cast<uint16_t *>(ctx_p + 12);
    uint16_t *hbsz_p = reinterpret_cast<uint16_t *>(ctx_p + 13);
    uint32_t *rxmax_p = reinterpret_cast<uint32_t *>(ctx_p + 21);

    reg_dummy_head = (*head_p) & ((1 << 13) - 1);

    base = ((*base_p) & ((1ULL << 57) - 1)) * 128;
    len = (*qlen_p >> 1) & ((1 << 13) - 1);

    dbuff_size = (((*dbsz_p) >> 6) & ((1 << 7) - 1)) * 128;
    hbuff_size = (((*hbsz_p) >> 5) & ((1 << 5) - 1)) * 64;
    uint8_t dtype = ((*hbsz_p) >> 10) & ((1 << 2) - 1);
    bool longdesc = !!(((*hbsz_p) >> 12) & 0x1);
    desc_len = (longdesc ? 32 : 16);
    crc_strip = !!(((*hbsz_p) >> 13) & 0x1);
    rxmax = (((*rxmax_p) >> 6) & ((1 << 14) - 1)) * 128;

    if (!longdesc) {
230
231
        log << "lan_queue_rx::initialize: currently only 32B descs "
            " supported" << logger::endl;
232
233
234
        abort();
    }
    if (dtype != 0) {
235
236
        log << "lan_queue_rx::initialize: no header split supported"
            << logger::endl;
237
238
239
        abort();
    }

240
#ifdef DEBUG_LAN
241
    log << "  head=" << reg_dummy_head << " base=" << base <<
242
243
        " len=" << len << " dbsz=" << dbuff_size << " hbsz=" << hbuff_size <<
        " dtype=" << (unsigned) dtype << " longdesc=" << longdesc <<
244
        " crcstrip=" << crc_strip << " rxmax=" << rxmax << logger::endl;
245
#endif
246
247
}

248
queue_base::desc_ctx &lan_queue_rx::desc_ctx_create()
249
{
250
    return *new rx_desc_ctx(*this);
251
252
}

253
void lan_queue_rx::packet_received(const void *data, size_t pktlen)
254
{
255
    if (dcache.empty()) {
256
#ifdef DEBUG_LAN
257
        log << " empty, dropping packet" << logger::endl;
258
#endif
259
260
        return;
    }
261

262
    rx_desc_ctx &ctx = *dcache.front();
263

264
#ifdef DEBUG_LAN
265
266
    log << " packet received didx=" << ctx.index << " cnt=" <<
        dcache.size() << logger::endl;
267
#endif
268

269
270
    dcache.pop_front();
    ctx.packet_received(data, pktlen);
271
272
}

273
274
lan_queue_rx::rx_desc_ctx::rx_desc_ctx(lan_queue_rx &queue_)
    : desc_ctx(queue_), rq(queue_)
275
276
277
{
}

278
void lan_queue_rx::rx_desc_ctx::data_written(uint64_t addr, size_t len)
279
{
280
281
    processed();
}
282

283
284
285
286
void lan_queue_rx::rx_desc_ctx::process()
{
    rq.dcache.push_back(this);
}
287

288
289
290
291
292
293
294
295
296
297
298
299
300
void lan_queue_rx::rx_desc_ctx::packet_received(const void *data, size_t pktlen)
{
    union i40e_32byte_rx_desc *rxd = reinterpret_cast<
        union i40e_32byte_rx_desc *> (desc);

    uint64_t addr = rxd->read.pkt_addr;

    memset(rxd, 0, sizeof(*rxd));
    rxd->wb.qword1.status_error_len |= (1 << I40E_RX_DESC_STATUS_DD_SHIFT);
    rxd->wb.qword1.status_error_len |= (1 << I40E_RX_DESC_STATUS_EOF_SHIFT);
    // TODO: only if checksums are correct
    rxd->wb.qword1.status_error_len |= (1 << I40E_RX_DESC_STATUS_L3L4P_SHIFT);
    rxd->wb.qword1.status_error_len |= (pktlen << I40E_RXD_QW1_LENGTH_PBUF_SHIFT);
301

302
    data_write(addr, pktlen, data);
303
304
}

305
lan_queue_tx::lan_queue_tx(lan &lanmgr_, uint32_t &reg_tail_, size_t idx_,
306
        uint32_t &reg_ena_, uint32_t &reg_fpmbase_, uint32_t &reg_intqctl)
307
    : lan_queue_base(lanmgr_, "txq", reg_tail_, idx_, reg_ena_, reg_fpmbase_,
308
            reg_intqctl, 128)
309
310
{
    desc_len = 16;
311
    ctxs_init();
312
313
}

Antoine Kaufmann's avatar
Antoine Kaufmann committed
314
315
void lan_queue_tx::reset()
{
316
    ready_segments.clear();
Antoine Kaufmann's avatar
Antoine Kaufmann committed
317
318
319
    queue_base::reset();
}

320
321
void lan_queue_tx::initialize()
{
322
#ifdef DEBUG_LAN
323
    log << " initialize()" << logger::endl;
324
#endif
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
    uint8_t *ctx_p = reinterpret_cast<uint8_t *>(ctx);

    uint16_t *head_p = reinterpret_cast<uint16_t *>(ctx_p + 0);
    uint64_t *base_p = reinterpret_cast<uint64_t *>(ctx_p + 4);
    uint16_t *hwb_qlen_p = reinterpret_cast<uint16_t *>(ctx_p + 20);
    uint64_t *hwb_addr_p = reinterpret_cast<uint64_t *>(ctx_p + 24);

    reg_dummy_head = (*head_p) & ((1 << 13) - 1);

    base = ((*base_p) & ((1ULL << 57) - 1)) * 128;
    len = ((*hwb_qlen_p) >> 1) & ((1 << 13) - 1);

    hwb = !!(*hwb_qlen_p & (1 << 0));
    hwb_addr = *hwb_addr_p;

340
#ifdef DEBUG_LAN
341
    log << "  head=" << reg_dummy_head << " base=" << base <<
342
        " len=" << len << " hwb=" << hwb << " hwb_addr=" << hwb_addr <<
343
        logger::endl;
344
#endif
345
}
346

347
queue_base::desc_ctx &lan_queue_tx::desc_ctx_create()
348
{
349
350
    return *new tx_desc_ctx(*this);
}
351

352
353
354
355
356
357
358
359
360
361
362
363
void lan_queue_tx::do_writeback(uint32_t first_idx, uint32_t first_pos,
        uint32_t cnt)
{
    if (!hwb) {
        // if head index writeback is disabled we need to write descriptor back
        lan_queue_base::do_writeback(first_idx, first_pos, cnt);
    } else {
        // else we just need to write the index back
        dma_hwb *dma = new dma_hwb(*this, first_pos, cnt,
                (first_idx + cnt) % len);
        dma->dma_addr = hwb_addr;

364
#ifdef DEBUG_LAN
365
        log << " hwb=" << *((uint32_t *) dma->data) << logger::endl;
366
#endif
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
        runner->issue_dma(*dma);
    }
}

bool lan_queue_tx::trigger_tx_packet()
{
    size_t n = ready_segments.size();
    if (n == 0)
        return false;

    size_t dcnt;
    bool eop = false;
    uint64_t d1;
    uint16_t iipt, l4t, total_len = 0;
    for (dcnt = 0; dcnt < n && !eop; dcnt++) {
        tx_desc_ctx *rd = ready_segments.at(dcnt);

        d1 = rd->d->cmd_type_offset_bsz;
385
#ifdef DEBUG_LAN
386
387
        log << " data fetched didx=" << rd->index << " d1=" <<
            d1 << logger::endl;
388
#endif
389
390
391
392

        uint16_t pkt_len = (d1 & I40E_TXD_QW1_TX_BUF_SZ_MASK) >>
            I40E_TXD_QW1_TX_BUF_SZ_SHIFT;
        if (total_len + pkt_len > MTU) {
393
            log << "txq: trigger_tx_packet too large" << logger::endl;
394
395
            abort();
        }
396

397
398
399
400
401
402
403
        memcpy(pktbuf + total_len, rd->data, pkt_len);

        uint16_t cmd = (d1 & I40E_TXD_QW1_CMD_MASK) >> I40E_TXD_QW1_CMD_SHIFT;
        eop = (cmd & I40E_TX_DESC_CMD_EOP);
        iipt = cmd & (I40E_TX_DESC_CMD_IIPT_MASK);
        l4t = (cmd & I40E_TX_DESC_CMD_L4T_EOFT_MASK);

404
#ifdef DEBUG_LAN
405
406
        log << "    eop=" << eop << " len=" << pkt_len <<
            logger::endl;
407
#endif
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427

        total_len += pkt_len;
    }

    if (!eop)
        return false;

    uint32_t off = (d1 & I40E_TXD_QW1_OFFSET_MASK) >> I40E_TXD_QW1_OFFSET_SHIFT;
    uint16_t maclen = ((off & I40E_TXD_QW1_MACLEN_MASK) >>
        I40E_TX_DESC_LENGTH_MACLEN_SHIFT) * 2;
    uint16_t iplen = ((off & I40E_TXD_QW1_IPLEN_MASK) >>
        I40E_TX_DESC_LENGTH_IPLEN_SHIFT) * 4;
    /*uint16_t l4len = (off & I40E_TXD_QW1_L4LEN_MASK) >>
        I40E_TX_DESC_LENGTH_L4_FC_LEN_SHIFT;*/


    if (l4t == I40E_TX_DESC_CMD_L4T_EOFT_TCP) {
        uint16_t tcp_off = maclen + iplen;
        xsum_tcp(pktbuf + tcp_off, total_len - tcp_off);
    }
428
#ifdef DEBUG_LAN
429
430
    log << "    iipt=" << iipt << " l4t=" << l4t <<
        " maclen=" << maclen << " iplen=" << iplen<< logger::endl;
431
432
433
#else
    (void) iipt;
#endif
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459

    runner->eth_send(pktbuf, total_len);

    while (dcnt-- > 0) {
        ready_segments.front()->processed();
        ready_segments.pop_front();
    }

    return true;
}

void lan_queue_tx::trigger_tx()
{
    while (trigger_tx_packet());
}

lan_queue_tx::tx_desc_ctx::tx_desc_ctx(lan_queue_tx &queue_)
    : desc_ctx(queue_), tq(queue_)
{
    d = reinterpret_cast<struct i40e_tx_desc *>(desc);
}

void lan_queue_tx::tx_desc_ctx::prepare()
{
    uint64_t d1 = d->cmd_type_offset_bsz;

460
#ifdef DEBUG_LAN
461
462
    queue.log << " desc fetched didx=" << index << " d1=" <<
        d1 << logger::endl;
463
#endif
464

465
    uint8_t dtype = (d1 & I40E_TXD_QW1_DTYPE_MASK) >> I40E_TXD_QW1_DTYPE_SHIFT;
Antoine Kaufmann's avatar
Antoine Kaufmann committed
466
467
468
469
    if (dtype == I40E_TX_DESC_DTYPE_DATA) {
        uint16_t len = (d1 & I40E_TXD_QW1_TX_BUF_SZ_MASK) >>
            I40E_TXD_QW1_TX_BUF_SZ_SHIFT;

470
#ifdef DEBUG_LAN
471
472
        queue.log << "  bufaddr=" << d->buffer_addr <<
            " len=" << len << logger::endl;
473
#endif
Antoine Kaufmann's avatar
Antoine Kaufmann committed
474

475
        data_fetch(d->buffer_addr, len);
Antoine Kaufmann's avatar
Antoine Kaufmann committed
476
477
    } else if (dtype == I40E_TX_DESC_DTYPE_CONTEXT) {
        struct i40e_tx_context_desc *ctxd =
478
            reinterpret_cast<struct i40e_tx_context_desc *> (d);
479
480
        queue.log << "  context descriptor: tp=" << ctxd->tunneling_params <<
            " l2t=" << ctxd->l2tag2 << " tctm=" << ctxd->type_cmd_tso_mss << logger::endl;
481
482
        abort();

483
        /*desc->buffer_addr = 0;
Antoine Kaufmann's avatar
Antoine Kaufmann committed
484
485
486
        desc->cmd_type_offset_bsz = I40E_TX_DESC_DTYPE_DESC_DONE <<
            I40E_TXD_QW1_DTYPE_SHIFT;

487
        desc_writeback(desc_buf, didx);*/
Antoine Kaufmann's avatar
Antoine Kaufmann committed
488
    } else {
489
        queue.log << "txq: only support context & data descriptors" << logger::endl;
490
491
        abort();
    }
492
493
494
495
496
497
498
499
500

}

void lan_queue_tx::tx_desc_ctx::process()
{
    tq.ready_segments.push_back(this);
    tq.trigger_tx();
}

501
502
503
504
505
506
507
void lan_queue_tx::tx_desc_ctx::processed()
{
    d->cmd_type_offset_bsz = I40E_TX_DESC_DTYPE_DESC_DONE <<
        I40E_TXD_QW1_DTYPE_SHIFT;
    desc_ctx::processed();
}

508
509
510
lan_queue_tx::dma_hwb::dma_hwb(lan_queue_tx &queue_, uint32_t pos_,
        uint32_t cnt_, uint32_t nh_)
    : queue(queue_), pos(pos_), cnt(cnt_), next_head(nh_)
511
512
513
514
515
516
517
518
519
520
521
522
{
    data = &next_head;
    len = 4;
    write = true;
}

lan_queue_tx::dma_hwb::~dma_hwb()
{
}

void lan_queue_tx::dma_hwb::done()
{
523
#ifdef DEBUG_LAN
524
    queue.log << " tx head written back" << logger::endl;
525
#endif
526
    queue.writeback_done(pos, cnt);
527
    queue.trigger();
528
529
    delete this;
}