update source to Ceph Pacific 16.2.2
index d0d73b304643fd26468b224681322912d8921d9f..8b46105b6353f8906c541f8460777cae5f92f11c 100644
@@ -7,13 +7,72 @@
 
 #include <rte_ethdev_driver.h>
 
-#ifndef __hot
-#define __hot  __attribute__((hot))
-#endif
+#define OFFLOAD_FLAGS                                  \
+       uint16_t rx_offload_flags;                      \
+       uint16_t tx_offload_flags
+
+#define BIT(nr) (1UL << (nr))
+
+#define OCCTX_RX_OFFLOAD_NONE          (0)
+#define OCCTX_RX_MULTI_SEG_F           BIT(0)
+#define OCCTX_RX_OFFLOAD_CSUM_F        BIT(1)
+#define OCCTX_RX_VLAN_FLTR_F           BIT(2)
+
+#define OCCTX_TX_OFFLOAD_NONE          (0)
+#define OCCTX_TX_MULTI_SEG_F           BIT(0)
+#define OCCTX_TX_OFFLOAD_L3_L4_CSUM_F  BIT(1)
+#define OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F BIT(2)
+#define OCCTX_TX_OFFLOAD_MBUF_NOFF_F   BIT(3)
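+
+/* Compile-time Rx/Tx offload flags: the OCCTX_*_FASTPATH_MODES tables at
+ * the end of this header OR subsets of these into dedicated burst
+ * functions, so branches for untaken offloads compile out.
+ */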
 
 /* Packet type table */
 #define PTYPE_SIZE     OCCTX_PKI_LTYPE_LAST
 
+/* octeontx send header sub descriptor structure */
+RTE_STD_C11
+union octeontx_send_hdr_w0_u {
+       uint64_t u;
+       struct {
+               uint64_t total   : 16;
+               uint64_t markptr : 8;
+               uint64_t l3ptr   : 8;
+               uint64_t l4ptr   : 8;
+               uint64_t ii      : 1;
+               uint64_t shp_dis : 1;
+               uint64_t ckle    : 1;
+               uint64_t cklf    : 2;
+               uint64_t ckl3    : 1;
+               uint64_t ckl4    : 2;
+               uint64_t p       : 1;
+               uint64_t format  : 7;
+               uint64_t tstamp  : 1;
+               uint64_t tso_eom : 1;
+               uint64_t df      : 1;
+               uint64_t tso     : 1;
+               uint64_t n2      : 1;
+               uint64_t scntn1  : 3;
+       };
+};
+
+RTE_STD_C11
+union octeontx_send_hdr_w1_u {
+       uint64_t u;
+       struct {
+               uint64_t tso_mss : 14;
+               uint64_t shp_ra  : 2;
+               uint64_t tso_sb  : 8;
+               uint64_t leptr   : 8;
+               uint64_t lfptr   : 8;
+               uint64_t shp_chg : 9;
+               uint64_t tso_fn  : 7;
+               uint64_t l2len   : 8;
+       };
+};
+
+struct octeontx_send_hdr_s {
+       union octeontx_send_hdr_w0_u w0;
+       union octeontx_send_hdr_w1_u w1;
+};
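+
+/* PKO_SEND_HDR_S fills the first two 64-bit words of the PKO command
+ * buffer; octeontx_tx_checksum_offload() below programs the header
+ * pointers (l3ptr/l4ptr/leptr/lfptr) and the ckl3/ckl4/ckle/cklf
+ * checksum enables in place.
+ */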
+
 static const uint32_t __rte_cache_aligned
 ptype_table[PTYPE_SIZE][PTYPE_SIZE][PTYPE_SIZE] = {
        [LC_NONE][LE_NONE][LF_NONE] = RTE_PTYPE_UNKNOWN,
@@ -100,43 +159,346 @@ ptype_table[PTYPE_SIZE][PTYPE_SIZE][PTYPE_SIZE] = {
 
 };
 
-static __rte_always_inline int
-__octeontx_xmit_pkts(void *lmtline_va, void *ioreg_va, int64_t *fc_status_va,
-                       struct rte_mbuf *tx_pkt)
+
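+/* Detach an indirect mbuf from its direct parent and restore its embedded
+ * data buffer; returns 0 when the parent's last reference went away (so
+ * PKO may free the data buffer), 1 while other references remain.
+ */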
+static __rte_always_inline uint64_t
+octeontx_pktmbuf_detach(struct rte_mbuf *m)
+{
+       struct rte_mempool *mp = m->pool;
+       uint32_t mbuf_size, buf_len;
+       struct rte_mbuf *md;
+       uint16_t priv_size;
+       uint16_t refcount;
+
+       /* Update refcount of direct mbuf */
+       md = rte_mbuf_from_indirect(m);
+       refcount = rte_mbuf_refcnt_update(md, -1);
+
+       priv_size = rte_pktmbuf_priv_size(mp);
+       mbuf_size = (uint32_t)(sizeof(struct rte_mbuf) + priv_size);
+       buf_len = rte_pktmbuf_data_room_size(mp);
+
+       m->priv_size = priv_size;
+       m->buf_addr = (char *)m + mbuf_size;
+       m->buf_iova = rte_mempool_virt2iova(m) + mbuf_size;
+       m->buf_len = (uint16_t)buf_len;
+       rte_pktmbuf_reset_headroom(m);
+       m->data_len = 0;
+       m->ol_flags = 0;
+       m->next = NULL;
+       m->nb_segs = 1;
+
+       /* The indirect mbuf is now safe to free */
+       rte_pktmbuf_free(m);
+
+       if (refcount == 0) {
+               rte_mbuf_refcnt_set(md, 1);
+               md->data_len = 0;
+               md->ol_flags = 0;
+               md->next = NULL;
+               md->nb_segs = 1;
+               return 0;
+       } else {
+               return 1;
+       }
+}
+
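+/* Per-segment free decision when OCCTX_TX_OFFLOAD_MBUF_NOFF_F is set:
+ * returns 0 when PKO may free the buffer, 1 when it must be kept; the
+ * callers shift this value into SEND_HDR[DF] or SG_DESC[I].
+ */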
+static __rte_always_inline uint64_t
+octeontx_prefree_seg(struct rte_mbuf *m)
+{
+       if (likely(rte_mbuf_refcnt_read(m) == 1)) {
+               if (!RTE_MBUF_DIRECT(m))
+                       return octeontx_pktmbuf_detach(m);
+
+               m->next = NULL;
+               m->nb_segs = 1;
+               return 0;
+       } else if (rte_mbuf_refcnt_update(m, -1) == 0) {
+               if (!RTE_MBUF_DIRECT(m))
+                       return octeontx_pktmbuf_detach(m);
+
+               rte_mbuf_refcnt_set(m, 1);
+               m->next = NULL;
+               m->nb_segs = 1;
+               return 0;
+       }
+
+       /* Mbuf still has other references, so it must not be freed */
+       return 1;
+}
+
+static __rte_always_inline void
+octeontx_tx_checksum_offload(uint64_t *cmd_buf, const uint16_t flags,
+                            struct rte_mbuf *m)
+{
+       struct octeontx_send_hdr_s *send_hdr =
+                               (struct octeontx_send_hdr_s *)cmd_buf;
+       uint64_t ol_flags = m->ol_flags;
+
+       /* PKO Checksum L4 Algorithm Enumeration
+        * 0x0 - No checksum
+        * 0x1 - UDP L4 checksum
+        * 0x2 - TCP L4 checksum
+        * 0x3 - SCTP L4 checksum
+        */
+       const uint8_t csum = (!(((ol_flags ^ PKT_TX_UDP_CKSUM) >> 52) & 0x3) +
+                     (!(((ol_flags ^ PKT_TX_TCP_CKSUM) >> 52) & 0x3) * 2) +
+                     (!(((ol_flags ^ PKT_TX_SCTP_CKSUM) >> 52) & 0x3) * 3));
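+
+       /* ol_flags bits 52:53 hold PKT_TX_L4_MASK; XOR-ing with a specific
+        * PKT_TX_*_CKSUM value clears those bits only on an exact match, so
+        * at most one of the three terms above contributes its weight.
+        */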
+
+       const uint8_t is_tunnel_parsed = (!!(ol_flags & PKT_TX_TUNNEL_GTP) ||
+                                     !!(ol_flags & PKT_TX_TUNNEL_VXLAN_GPE) ||
+                                     !!(ol_flags & PKT_TX_TUNNEL_VXLAN) ||
+                                     !!(ol_flags & PKT_TX_TUNNEL_GRE) ||
+                                     !!(ol_flags & PKT_TX_TUNNEL_GENEVE) ||
+                                     !!(ol_flags & PKT_TX_TUNNEL_IP) ||
+                                     !!(ol_flags & PKT_TX_TUNNEL_IPIP));
+
+       const uint8_t csum_outer = (!!(ol_flags & PKT_TX_OUTER_UDP_CKSUM) ||
+                                   !!(ol_flags & PKT_TX_TUNNEL_UDP));
+       const uint8_t outer_l2_len = m->outer_l2_len;
+       const uint8_t l2_len = m->l2_len;
+
+       if ((flags & OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F) &&
+           (flags & OCCTX_TX_OFFLOAD_L3_L4_CSUM_F)) {
+               if (is_tunnel_parsed) {
+                       /* Outer L3 */
+                       send_hdr->w0.l3ptr = outer_l2_len;
+                       send_hdr->w0.l4ptr = outer_l2_len + m->outer_l3_len;
+                       /* Set ckl3 for PKO to calculate IPV4 header checksum */
+                       send_hdr->w0.ckl3 = !!(ol_flags & PKT_TX_OUTER_IPV4);
+
+                       /* Outer L4 */
+                       send_hdr->w0.ckl4 = csum_outer;
+
+                       /* Inner L3 */
+                       send_hdr->w1.leptr = send_hdr->w0.l4ptr + l2_len;
+                       send_hdr->w1.lfptr = send_hdr->w1.leptr + m->l3_len;
+                       /* Set ckle for PKO to calculate inner IPV4 header
+                        * checksum.
+                        */
+                       send_hdr->w0.ckle = !!(ol_flags & PKT_TX_IPV4);
+
+                       /* Inner L4 */
+                       send_hdr->w0.cklf = csum;
+               } else {
+                       /* Inner L3 */
+                       send_hdr->w0.l3ptr = l2_len;
+                       send_hdr->w0.l4ptr = l2_len + m->l3_len;
+                       /* Set ckl3 for PKO to calculate IPV4 header checksum */
+                       send_hdr->w0.ckl3 = !!(ol_flags & PKT_TX_IPV4);
+
+                       /* Inner L4 */
+                       send_hdr->w0.ckl4 = csum;
+               }
+       } else if (flags & OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F) {
+               /* Outer L3 */
+               send_hdr->w0.l3ptr = outer_l2_len;
+               send_hdr->w0.l4ptr = outer_l2_len + m->outer_l3_len;
+               /* Set ckl3 for PKO to calculate IPV4 header checksum */
+               send_hdr->w0.ckl3 = !!(ol_flags & PKT_TX_OUTER_IPV4);
+
+               /* Outer L4 */
+               send_hdr->w0.ckl4 = csum_outer;
+       } else if (flags & OCCTX_TX_OFFLOAD_L3_L4_CSUM_F) {
+               /* Inner L3 */
+               send_hdr->w0.l3ptr = l2_len;
+               send_hdr->w0.l4ptr = l2_len + m->l3_len;
+               /* Set ckl3 for PKO to calculate IPV4 header checksum */
+               send_hdr->w0.ckl3 = !!(ol_flags & PKT_TX_IPV4);
+
+               /* Inner L4 */
+               send_hdr->w0.ckl4 = csum;
+       }
+}
+
+static __rte_always_inline uint16_t
+__octeontx_xmit_prepare(struct rte_mbuf *tx_pkt, uint64_t *cmd_buf,
+                       const uint16_t flag)
 {
-       uint64_t cmd_buf[4] __rte_cache_aligned;
-       uint16_t gaura_id;
+       uint16_t gaura_id, nb_desc = 0;
 
-       if (unlikely(*((volatile int64_t *)fc_status_va) < 0))
-               return -ENOSPC;
+       /* Setup PKO_SEND_HDR_S */
+       cmd_buf[nb_desc++] = tx_pkt->data_len & 0xffff;
+       cmd_buf[nb_desc++] = 0x0;
 
+       /* Enable tx checksum offload */
+       if ((flag & OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F) ||
+           (flag & OCCTX_TX_OFFLOAD_L3_L4_CSUM_F))
+               octeontx_tx_checksum_offload(cmd_buf, flag, tx_pkt);
+
+       /* SEND_HDR[DF] controls whether the buffer is freed, as
+        * SG_DESC[I] and SEND_HDR[II] are clear.
+        */
+       if (flag & OCCTX_TX_OFFLOAD_MBUF_NOFF_F)
+               cmd_buf[0] |= (octeontx_prefree_seg(tx_pkt) << 58);
+
+       /* Mark mempool object as "put" since it is freed by PKO */
+       if (!(cmd_buf[0] & (1ULL << 58)))
+               __mempool_check_cookies(tx_pkt->pool, (void **)&tx_pkt,
+                                       1, 0);
        /* Get the gaura Id */
-       gaura_id = octeontx_fpa_bufpool_gpool((uintptr_t)tx_pkt->pool->pool_id);
+       gaura_id = octeontx_fpa_bufpool_gpool((uintptr_t)
+                                             tx_pkt->pool->pool_id);
+
+       /* Setup PKO_SEND_BUFLINK_S */
+       cmd_buf[nb_desc++] = PKO_SEND_BUFLINK_SUBDC |
+               PKO_SEND_BUFLINK_LDTYPE(0x1ull) |
+               PKO_SEND_BUFLINK_GAUAR((long)gaura_id) |
+               tx_pkt->data_len;
+       cmd_buf[nb_desc++] = rte_mbuf_data_iova(tx_pkt);
+
+       return nb_desc;
+}
+
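+/* Multi-segment variant: each segment adds a PKO_SEND_GATHER_S word pair
+ * after the two header words, which is why the mseg entries in
+ * OCCTX_TX_FASTPATH_MODES below reserve 14 command words instead of 4.
+ */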
+static __rte_always_inline uint16_t
+__octeontx_xmit_mseg_prepare(struct rte_mbuf *tx_pkt, uint64_t *cmd_buf,
+                       const uint16_t flag)
+{
+       uint16_t nb_segs, nb_desc = 0;
+       uint16_t gaura_id, len = 0;
+       struct rte_mbuf *m_next = NULL;
 
+       nb_segs = tx_pkt->nb_segs;
        /* Setup PKO_SEND_HDR_S */
-       cmd_buf[0] = tx_pkt->data_len & 0xffff;
-       cmd_buf[1] = 0x0;
+       cmd_buf[nb_desc++] = tx_pkt->pkt_len & 0xffff;
+       cmd_buf[nb_desc++] = 0x0;
 
-       /* Set don't free bit if reference count > 1 */
-       if (rte_mbuf_refcnt_read(tx_pkt) > 1)
-               cmd_buf[0] |= (1ULL << 58); /* SET DF */
+       /* Enable tx checksum offload */
+       if ((flag & OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F) ||
+           (flag & OCCTX_TX_OFFLOAD_L3_L4_CSUM_F))
+               octeontx_tx_checksum_offload(cmd_buf, flag, tx_pkt);
 
-       /* Setup PKO_SEND_GATHER_S */
-       cmd_buf[(1 << 1) | 1] = rte_mbuf_data_iova(tx_pkt);
-       cmd_buf[(1 << 1) | 0] = PKO_SEND_GATHER_SUBDC |
-                               PKO_SEND_GATHER_LDTYPE(0x1ull) |
-                               PKO_SEND_GATHER_GAUAR((long)gaura_id) |
-                               tx_pkt->data_len;
+       do {
+               m_next = tx_pkt->next;
+               /* Handle the case where segments belong to different
+                * pools, e.g. after fragmentation.
+                */
+               gaura_id = octeontx_fpa_bufpool_gpool((uintptr_t)
+                                                     tx_pkt->pool->pool_id);
 
-       octeontx_reg_lmtst(lmtline_va, ioreg_va, cmd_buf, PKO_CMD_SZ);
+               /* Setup PKO_SEND_GATHER_S */
+               cmd_buf[nb_desc] = PKO_SEND_GATHER_SUBDC                 |
+                                  PKO_SEND_GATHER_LDTYPE(0x1ull)        |
+                                  PKO_SEND_GATHER_GAUAR((long)gaura_id) |
+                                  tx_pkt->data_len;
 
-       return 0;
+               /* SG_DESC[I] controls whether the buffer is freed, as
+                * SEND_HDR[DF] and SEND_HDR[II] are clear.
+                */
+               if (flag & OCCTX_TX_OFFLOAD_MBUF_NOFF_F) {
+                       cmd_buf[nb_desc] |=
+                            (octeontx_prefree_seg(tx_pkt) << 57);
+               }
+
+               /* Mark mempool object as "put" since it is freed by
+                * PKO.
+                */
+               if (!(cmd_buf[nb_desc] & (1ULL << 57))) {
+                       tx_pkt->next = NULL;
+                       __mempool_check_cookies(tx_pkt->pool,
+                                               (void **)&tx_pkt, 1, 0);
+               }
+               nb_desc++;
+
+               cmd_buf[nb_desc++] = rte_mbuf_data_iova(tx_pkt);
+
+               nb_segs--;
+               len += tx_pkt->data_len;
+               tx_pkt = m_next;
+       } while (nb_segs);
+
+       return nb_desc;
 }
 
-uint16_t
-octeontx_xmit_pkts(void *tx_queue, struct rte_mbuf **tx_pkts, uint16_t nb_pkts);
+static __rte_always_inline uint16_t
+__octeontx_xmit_pkts(void *tx_queue, struct rte_mbuf **tx_pkts,
+                    uint16_t nb_pkts, uint64_t *cmd_buf,
+                    const uint16_t flags)
+{
+       struct octeontx_txq *txq = tx_queue;
+       octeontx_dq_t *dq = &txq->dq;
+       uint16_t count = 0, nb_desc;
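+
+       /* Order preceding mbuf and descriptor stores before the LMTST below */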
+       rte_cio_wmb();
+
+       while (count < nb_pkts) {
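+               /* Stop early on PKO flow-control backpressure */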
+               if (unlikely(*((volatile int64_t *)dq->fc_status_va) < 0))
+                       break;
+
+               if (flags & OCCTX_TX_MULTI_SEG_F) {
+                       nb_desc = __octeontx_xmit_mseg_prepare(tx_pkts[count],
+                                                              cmd_buf, flags);
+               } else {
+                       nb_desc = __octeontx_xmit_prepare(tx_pkts[count],
+                                                         cmd_buf, flags);
+               }
+
+               octeontx_reg_lmtst(dq->lmtline_va, dq->ioreg_va, cmd_buf,
+                                  nb_desc);
+
+               count++;
+       }
+       return count;
+}
 
 uint16_t
 octeontx_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts, uint16_t nb_pkts);
 
-#endif /* __OCTEONTX_RXTX_H__ */
+#define L3L4CSUM_F   OCCTX_TX_OFFLOAD_L3_L4_CSUM_F
+#define OL3OL4CSUM_F OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F
+#define NOFF_F       OCCTX_TX_OFFLOAD_MBUF_NOFF_F
+#define MULT_F       OCCTX_TX_MULTI_SEG_F
+
+/* [NOFF] [OL3OL4CSUM_F] [L3L4CSUM_F] [MULTI_SEG] */
+#define OCCTX_TX_FASTPATH_MODES                                               \
+T(no_offload,                     0, 0, 0, 0,  4,                             \
+                                  OCCTX_TX_OFFLOAD_NONE)                      \
+T(mseg,                           0, 0, 0, 1,  14,                            \
+                                  MULT_F)                                     \
+T(l3l4csum,                       0, 0, 1, 0,  4,                             \
+                                  L3L4CSUM_F)                                 \
+T(l3l4csum_mseg,                  0, 0, 1, 1,  14,                            \
+                                  L3L4CSUM_F | MULT_F)                        \
+T(ol3ol4csum,                     0, 1, 0, 0,  4,                             \
+                                  OL3OL4CSUM_F)                               \
+T(ol3ol4csum_mseg,                0, 1, 0, 1,  14,                            \
+                                  OL3OL4CSUM_F | MULT_F)                      \
+T(ol3ol4csum_l3l4csum,            0, 1, 1, 0,  4,                             \
+                                  OL3OL4CSUM_F | L3L4CSUM_F)                  \
+T(ol3ol4csum_l3l4csum_mseg,       0, 1, 1, 1,  14,                            \
+                                  OL3OL4CSUM_F | L3L4CSUM_F | MULT_F)         \
+T(noff,                           1, 0, 0, 0,  4,                             \
+                                  NOFF_F)                                     \
+T(noff_mseg,                      1, 0, 0, 1,  14,                            \
+                                  NOFF_F | MULT_F)                            \
+T(noff_l3l4csum,                  1, 0, 1, 0,  4,                             \
+                                  NOFF_F | L3L4CSUM_F)                        \
+T(noff_l3l4csum_mseg,             1, 0, 1, 1,  14,                            \
+                                  NOFF_F | L3L4CSUM_F | MULT_F)               \
+T(noff_ol3ol4csum,                1, 1, 0, 0,  4,                             \
+                                  NOFF_F | OL3OL4CSUM_F)                      \
+T(noff_ol3ol4csum_mseg,           1, 1, 0, 1,  14,                            \
+                                  NOFF_F | OL3OL4CSUM_F | MULT_F)             \
+T(noff_ol3ol4csum_l3l4csum,       1, 1, 1, 0,  4,                             \
+                                  NOFF_F | OL3OL4CSUM_F | L3L4CSUM_F)         \
+T(noff_ol3ol4csum_l3l4csum_mseg,  1, 1, 1, 1,  14,                            \
+                                  NOFF_F | OL3OL4CSUM_F | L3L4CSUM_F |        \
+                                  MULT_F)
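+
+/* The T() entries above form an X-macro table. A minimal sketch of how a
+ * consumer could expand it into one specialized burst function per mode
+ * (the real expansion lives in the driver sources, and the attributes
+ * used there may differ):
+ *
+ *   #define T(name, f3, f2, f1, f0, sz, flags)                           \
+ *   static uint16_t octeontx_xmit_pkts_ ## name(void *tx_queue,          \
+ *                   struct rte_mbuf **tx_pkts, uint16_t pkts)            \
+ *   {                                                                    \
+ *           uint64_t cmd[(sz)];                                          \
+ *           return __octeontx_xmit_pkts(tx_queue, tx_pkts, pkts,         \
+ *                                       cmd, (flags));                   \
+ *   }
+ *
+ *   OCCTX_TX_FASTPATH_MODES
+ *   #undef T
+ */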
+
+/* RX offload macros */
+#define VLAN_FLTR_F    OCCTX_RX_VLAN_FLTR_F
+#define CSUM_F         OCCTX_RX_OFFLOAD_CSUM_F
+#define MULT_RX_F      OCCTX_RX_MULTI_SEG_F
+
+/* [VLAN_FLTR] [CSUM_F] [MULTI_SEG] */
+#define OCCTX_RX_FASTPATH_MODES                                               \
+R(no_offload,     0, 0, 0,  OCCTX_RX_OFFLOAD_NONE)                            \
+R(mseg,           0, 0, 1,  MULT_RX_F)                                        \
+R(csum,           0, 1, 0,  CSUM_F)                                           \
+R(csum_mseg,      0, 1, 1,  CSUM_F | MULT_RX_F)                               \
+R(vlan,           1, 0, 0,  VLAN_FLTR_F)                                      \
+R(vlan_mseg,      1, 0, 1,  VLAN_FLTR_F | MULT_RX_F)                          \
+R(vlan_csum,      1, 1, 0,  VLAN_FLTR_F | CSUM_F)                             \
+R(vlan_csum_mseg, 1, 1, 1,  VLAN_FLTR_F | CSUM_F | MULT_RX_F)
+
+#endif /* __OCTEONTX_RXTX_H__ */