get:
Show a patch.

patch:
Update a patch.

put:
Update a patch.

GET /api/patches/76662/?format=api
HTTP 200 OK
Allow: GET, PUT, PATCH, HEAD, OPTIONS
Content-Type: application/json
Vary: Accept

{
    "id": 76662,
    "url": "http://patches.dpdk.org/api/patches/76662/?format=api",
    "web_url": "http://patches.dpdk.org/project/dpdk/patch/20200907091711.5980-2-junyux.jiang@intel.com/",
    "project": {
        "id": 1,
        "url": "http://patches.dpdk.org/api/projects/1/?format=api",
        "name": "DPDK",
        "link_name": "dpdk",
        "list_id": "dev.dpdk.org",
        "list_email": "dev@dpdk.org",
        "web_url": "http://core.dpdk.org",
        "scm_url": "git://dpdk.org/dpdk",
        "webscm_url": "http://git.dpdk.org/dpdk",
        "list_archive_url": "https://inbox.dpdk.org/dev",
        "list_archive_url_format": "https://inbox.dpdk.org/dev/{}",
        "commit_url_format": ""
    },
    "msgid": "<20200907091711.5980-2-junyux.jiang@intel.com>",
    "list_archive_url": "https://inbox.dpdk.org/dev/20200907091711.5980-2-junyux.jiang@intel.com",
    "date": "2020-09-07T09:17:07",
    "name": "[v2,1/5] net/ice: support flex Rx descriptor RxDID #22",
    "commit_ref": null,
    "pull_url": null,
    "state": "superseded",
    "archived": true,
    "hash": "d7128971be7f4a6a67d0b370af71b86db10522c4",
    "submitter": {
        "id": 1408,
        "url": "http://patches.dpdk.org/api/people/1408/?format=api",
        "name": "Junyu Jiang",
        "email": "junyux.jiang@intel.com"
    },
    "delegate": {
        "id": 1540,
        "url": "http://patches.dpdk.org/api/users/1540/?format=api",
        "username": "qzhan15",
        "first_name": "Qi",
        "last_name": "Zhang",
        "email": "qi.z.zhang@intel.com"
    },
    "mbox": "http://patches.dpdk.org/project/dpdk/patch/20200907091711.5980-2-junyux.jiang@intel.com/mbox/",
    "series": [
        {
            "id": 11987,
            "url": "http://patches.dpdk.org/api/series/11987/?format=api",
            "web_url": "http://patches.dpdk.org/project/dpdk/list/?series=11987",
            "date": "2020-09-07T09:17:06",
            "name": "supports RxDID #22 and FDID",
            "version": 2,
            "mbox": "http://patches.dpdk.org/series/11987/mbox/"
        }
    ],
    "comments": "http://patches.dpdk.org/api/patches/76662/comments/",
    "check": "success",
    "checks": "http://patches.dpdk.org/api/patches/76662/checks/",
    "tags": {},
    "related": [],
    "headers": {
        "Return-Path": "<dev-bounces@dpdk.org>",
        "X-Original-To": "patchwork@inbox.dpdk.org",
        "Delivered-To": "patchwork@inbox.dpdk.org",
        "Received": [
            "from dpdk.org (dpdk.org [92.243.14.124])\n\tby inbox.dpdk.org (Postfix) with ESMTP id 50710A04B9;\n\tMon,  7 Sep 2020 11:26:44 +0200 (CEST)",
            "from [92.243.14.124] (localhost [127.0.0.1])\n\tby dpdk.org (Postfix) with ESMTP id 2D7DF1C0CE;\n\tMon,  7 Sep 2020 11:26:38 +0200 (CEST)",
            "from mga14.intel.com (mga14.intel.com [192.55.52.115])\n by dpdk.org (Postfix) with ESMTP id C6C0A1BE0C\n for <dev@dpdk.org>; Mon,  7 Sep 2020 11:26:35 +0200 (CEST)",
            "from fmsmga001.fm.intel.com ([10.253.24.23])\n by fmsmga103.fm.intel.com with ESMTP/TLS/ECDHE-RSA-AES256-GCM-SHA384;\n 07 Sep 2020 02:26:35 -0700",
            "from unknown (HELO intel.sh.intel.com) ([10.239.255.60])\n by fmsmga001.fm.intel.com with ESMTP; 07 Sep 2020 02:26:33 -0700"
        ],
        "IronPort-SDR": [
            "\n gcHBbyl2uX2XqA5EkuwWmvcLbHoRqiJ3VDjzMF82IMqmmVQ5LDtQ/9Yu9uQmhutEKkP5k+Rg4A\n VWRkGA54awqg==",
            "\n AigOIg9dz+vXgLBGF1xxbrryvyDrIN81I42aEqliiWpWIwFkb/YKGdtPqK52mSAZSl7bukiR0X\n dDhGxl7a3IbA=="
        ],
        "X-IronPort-AV": [
            "E=McAfee;i=\"6000,8403,9736\"; a=\"157241149\"",
            "E=Sophos;i=\"5.76,401,1592895600\"; d=\"scan'208\";a=\"157241149\"",
            "E=Sophos;i=\"5.76,401,1592895600\"; d=\"scan'208\";a=\"406783281\""
        ],
        "X-Amp-Result": "SKIPPED(no attachment in message)",
        "X-Amp-File-Uploaded": "False",
        "X-ExtLoop1": "1",
        "From": "Junyu Jiang <junyux.jiang@intel.com>",
        "To": "dev@dpdk.org",
        "Cc": "Qi Zhang <qi.z.zhang@intel.com>, Qiming Yang <qiming.yang@intel.com>,\n Guinan Sun <guinanx.sun@intel.com>, Junyu Jiang <junyux.jiang@intel.com>",
        "Date": "Mon,  7 Sep 2020 09:17:07 +0000",
        "Message-Id": "<20200907091711.5980-2-junyux.jiang@intel.com>",
        "X-Mailer": "git-send-email 2.17.1",
        "In-Reply-To": "<20200907091711.5980-1-junyux.jiang@intel.com>",
        "References": "<20200826075501.50052-1-guinanx.sun@intel.com>\n <20200907091711.5980-1-junyux.jiang@intel.com>",
        "Subject": "[dpdk-dev] [PATCH v2 1/5] net/ice: support flex Rx descriptor RxDID\n\t#22",
        "X-BeenThere": "dev@dpdk.org",
        "X-Mailman-Version": "2.1.15",
        "Precedence": "list",
        "List-Id": "DPDK patches and discussions <dev.dpdk.org>",
        "List-Unsubscribe": "<https://mails.dpdk.org/options/dev>,\n <mailto:dev-request@dpdk.org?subject=unsubscribe>",
        "List-Archive": "<http://mails.dpdk.org/archives/dev/>",
        "List-Post": "<mailto:dev@dpdk.org>",
        "List-Help": "<mailto:dev-request@dpdk.org?subject=help>",
        "List-Subscribe": "<https://mails.dpdk.org/listinfo/dev>,\n <mailto:dev-request@dpdk.org?subject=subscribe>",
        "Errors-To": "dev-bounces@dpdk.org",
        "Sender": "\"dev\" <dev-bounces@dpdk.org>"
    },
    "content": "This patch supports RxDID #22 by the following changes:\n-add structure and macro definition for RxDID #22,\n-support RxDID #22 format in normal path,\n-change RSS hash parsing from RxDID #22 in AVX/SSE data path.\n\nSigned-off-by: Junyu Jiang <junyux.jiang@intel.com>\n---\n drivers/net/ice/ice_rxtx.c          | 16 ++---\n drivers/net/ice/ice_rxtx.h          | 42 +++++++++++++\n drivers/net/ice/ice_rxtx_vec_avx2.c | 98 +++++++++++++++++++++++++++--\n drivers/net/ice/ice_rxtx_vec_sse.c  | 89 +++++++++++++++++++++-----\n 4 files changed, 218 insertions(+), 27 deletions(-)",
    "diff": "diff --git a/drivers/net/ice/ice_rxtx.c b/drivers/net/ice/ice_rxtx.c\nindex 2e1f06d2c..a31a976a1 100644\n--- a/drivers/net/ice/ice_rxtx.c\n+++ b/drivers/net/ice/ice_rxtx.c\n@@ -50,7 +50,7 @@ static inline uint8_t\n ice_proto_xtr_type_to_rxdid(uint8_t xtr_type)\n {\n \tstatic uint8_t rxdid_map[] = {\n-\t\t[PROTO_XTR_NONE]      = ICE_RXDID_COMMS_GENERIC,\n+\t\t[PROTO_XTR_NONE]      = ICE_RXDID_COMMS_OVS,\n \t\t[PROTO_XTR_VLAN]      = ICE_RXDID_COMMS_AUX_VLAN,\n \t\t[PROTO_XTR_IPV4]      = ICE_RXDID_COMMS_AUX_IPV4,\n \t\t[PROTO_XTR_IPV6]      = ICE_RXDID_COMMS_AUX_IPV6,\n@@ -59,7 +59,7 @@ ice_proto_xtr_type_to_rxdid(uint8_t xtr_type)\n \t};\n \n \treturn xtr_type < RTE_DIM(rxdid_map) ?\n-\t\t\t\trxdid_map[xtr_type] : ICE_RXDID_COMMS_GENERIC;\n+\t\t\t\trxdid_map[xtr_type] : ICE_RXDID_COMMS_OVS;\n }\n \n static enum ice_status\n@@ -72,7 +72,7 @@ ice_program_hw_rx_queue(struct ice_rx_queue *rxq)\n \tenum ice_status err;\n \tuint16_t buf_size, len;\n \tstruct rte_eth_rxmode *rxmode = &dev->data->dev_conf.rxmode;\n-\tuint32_t rxdid = ICE_RXDID_COMMS_GENERIC;\n+\tuint32_t rxdid = ICE_RXDID_COMMS_OVS;\n \tuint32_t regval;\n \n \t/* Set buffer size as the head split is disabled. */\n@@ -1309,7 +1309,7 @@ ice_rxd_to_vlan_tci(struct rte_mbuf *mb, volatile union ice_rx_flex_desc *rxdp)\n \n static void\n ice_rxd_to_proto_xtr(struct rte_mbuf *mb,\n-\t\t     volatile struct ice_32b_rx_flex_desc_comms *desc)\n+\t\t     volatile struct ice_32b_rx_flex_desc_comms_ovs *desc)\n {\n \tuint16_t stat_err = rte_le_to_cpu_16(desc->status_error1);\n \tuint32_t metadata;\n@@ -1338,8 +1338,9 @@ static inline void\n ice_rxd_to_pkt_fields(struct rte_mbuf *mb,\n \t\t      volatile union ice_rx_flex_desc *rxdp)\n {\n-\tvolatile struct ice_32b_rx_flex_desc_comms *desc =\n-\t\t\t(volatile struct ice_32b_rx_flex_desc_comms *)rxdp;\n+\tvolatile struct ice_32b_rx_flex_desc_comms_ovs *desc =\n+\t\t\t(volatile struct ice_32b_rx_flex_desc_comms_ovs *)rxdp;\n+#ifndef RTE_LIBRTE_ICE_16BYTE_RX_DESC\n \tuint16_t stat_err;\n \n \tstat_err = rte_le_to_cpu_16(desc->status_error0);\n@@ -1347,13 +1348,14 @@ ice_rxd_to_pkt_fields(struct rte_mbuf *mb,\n \t\tmb->ol_flags |= PKT_RX_RSS_HASH;\n \t\tmb->hash.rss = rte_le_to_cpu_32(desc->rss_hash);\n \t}\n+#endif\n \n-#ifndef RTE_LIBRTE_ICE_16BYTE_RX_DESC\n \tif (desc->flow_id != 0xFFFFFFFF) {\n \t\tmb->ol_flags |= PKT_RX_FDIR | PKT_RX_FDIR_ID;\n \t\tmb->hash.fdir.hi = rte_le_to_cpu_32(desc->flow_id);\n \t}\n \n+#ifndef RTE_LIBRTE_ICE_16BYTE_RX_DESC\n \tif (unlikely(rte_net_ice_dynf_proto_xtr_metadata_avail()))\n \t\tice_rxd_to_proto_xtr(mb, desc);\n #endif\ndiff --git a/drivers/net/ice/ice_rxtx.h b/drivers/net/ice/ice_rxtx.h\nindex 2fdcfb7d0..e21ba152d 100644\n--- a/drivers/net/ice/ice_rxtx.h\n+++ b/drivers/net/ice/ice_rxtx.h\n@@ -38,6 +38,8 @@\n \n #define ICE_FDIR_PKT_LEN\t512\n \n+#define ICE_RXDID_COMMS_OVS\t22\n+\n typedef void (*ice_rx_release_mbufs_t)(struct ice_rx_queue *rxq);\n typedef void (*ice_tx_release_mbufs_t)(struct ice_tx_queue *txq);\n \n@@ -135,6 +137,46 @@ union ice_tx_offload {\n \t};\n };\n \n+/* Rx Flex Descriptor for Comms Package Profile\n+ * RxDID Profile ID 22 (swap Hash and FlowID)\n+ * Flex-field 0: Flow ID lower 16-bits\n+ * Flex-field 1: Flow ID upper 16-bits\n+ * Flex-field 2: RSS hash lower 16-bits\n+ * Flex-field 3: RSS hash upper 16-bits\n+ * Flex-field 4: AUX0\n+ * Flex-field 5: AUX1\n+ */\n+struct ice_32b_rx_flex_desc_comms_ovs {\n+\t/* Qword 0 */\n+\tu8 rxdid;\n+\tu8 mir_id_umb_cast;\n+\t__le16 ptype_flexi_flags0;\n+\t__le16 pkt_len;\n+\t__le16 hdr_len_sph_flex_flags1;\n+\n+\t/* Qword 1 */\n+\t__le16 status_error0;\n+\t__le16 l2tag1;\n+\t__le32 flow_id;\n+\n+\t/* Qword 2 */\n+\t__le16 status_error1;\n+\tu8 flexi_flags2;\n+\tu8 ts_low;\n+\t__le16 l2tag2_1st;\n+\t__le16 l2tag2_2nd;\n+\n+\t/* Qword 3 */\n+\t__le32 rss_hash;\n+\tunion {\n+\t\tstruct {\n+\t\t\t__le16 aux0;\n+\t\t\t__le16 aux1;\n+\t\t} flex;\n+\t\t__le32 ts_high;\n+\t} flex_ts;\n+};\n+\n int ice_rx_queue_setup(struct rte_eth_dev *dev,\n \t\t       uint16_t queue_idx,\n \t\t       uint16_t nb_desc,\ndiff --git a/drivers/net/ice/ice_rxtx_vec_avx2.c b/drivers/net/ice/ice_rxtx_vec_avx2.c\nindex be50677c2..07d129e3f 100644\n--- a/drivers/net/ice/ice_rxtx_vec_avx2.c\n+++ b/drivers/net/ice/ice_rxtx_vec_avx2.c\n@@ -191,8 +191,8 @@ _ice_recv_raw_pkts_vec_avx2(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \tconst __m256i shuf_msk =\n \t\t_mm256_set_epi8\n \t\t\t(/* first descriptor */\n-\t\t\t 15, 14,\n-\t\t\t 13, 12,\t/* octet 12~15, 32 bits rss */\n+\t\t\t 0xFF, 0xFF,\n+\t\t\t 0xFF, 0xFF,\t/* rss hash parsed separately */\n \t\t\t 11, 10,\t/* octet 10~11, 16 bits vlan_macip */\n \t\t\t 5, 4,\t\t/* octet 4~5, 16 bits data_len */\n \t\t\t 0xFF, 0xFF,\t/* skip hi 16 bits pkt_len, zero out */\n@@ -200,8 +200,8 @@ _ice_recv_raw_pkts_vec_avx2(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \t\t\t 0xFF, 0xFF,\t/* pkt_type set as unknown */\n \t\t\t 0xFF, 0xFF,\t/*pkt_type set as unknown */\n \t\t\t /* second descriptor */\n-\t\t\t 15, 14,\n-\t\t\t 13, 12,\t/* octet 12~15, 32 bits rss */\n+\t\t\t 0xFF, 0xFF,\n+\t\t\t 0xFF, 0xFF,\t/* rss hash parsed separately */\n \t\t\t 11, 10,\t/* octet 10~11, 16 bits vlan_macip */\n \t\t\t 5, 4,\t\t/* octet 4~5, 16 bits data_len */\n \t\t\t 0xFF, 0xFF,\t/* skip hi 16 bits pkt_len, zero out */\n@@ -461,6 +461,96 @@ _ice_recv_raw_pkts_vec_avx2(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \t\t/* merge flags */\n \t\tconst __m256i mbuf_flags = _mm256_or_si256(l3_l4_flags,\n \t\t\t\trss_vlan_flags);\n+\n+#ifndef RTE_LIBRTE_ICE_16BYTE_RX_DESC\n+\t\t/**\n+\t\t * needs to load 2nd 16B of each desc for RSS hash parsing,\n+\t\t * will cause performance drop to get into this context.\n+\t\t */\n+\t\tif (rxq->vsi->adapter->eth_dev->data->dev_conf.rxmode.offloads &\n+\t\t\t\tDEV_RX_OFFLOAD_RSS_HASH) {\n+\t\t\t/* load bottom half of every 32B desc */\n+\t\t\tconst __m128i raw_desc_bh7 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[7].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh6 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[6].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh5 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[5].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh4 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[4].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh3 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[3].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh2 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[2].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh1 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[1].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh0 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[0].wb.status_error1));\n+\n+\t\t\t__m256i raw_desc_bh6_7 =\n+\t\t\t\t_mm256_inserti128_si256\n+\t\t\t\t\t(_mm256_castsi128_si256(raw_desc_bh6),\n+\t\t\t\t\traw_desc_bh7, 1);\n+\t\t\t__m256i raw_desc_bh4_5 =\n+\t\t\t\t_mm256_inserti128_si256\n+\t\t\t\t\t(_mm256_castsi128_si256(raw_desc_bh4),\n+\t\t\t\t\traw_desc_bh5, 1);\n+\t\t\t__m256i raw_desc_bh2_3 =\n+\t\t\t\t_mm256_inserti128_si256\n+\t\t\t\t\t(_mm256_castsi128_si256(raw_desc_bh2),\n+\t\t\t\t\traw_desc_bh3, 1);\n+\t\t\t__m256i raw_desc_bh0_1 =\n+\t\t\t\t_mm256_inserti128_si256\n+\t\t\t\t\t(_mm256_castsi128_si256(raw_desc_bh0),\n+\t\t\t\t\traw_desc_bh1, 1);\n+\n+\t\t\t/**\n+\t\t\t * to shift the 32b RSS hash value to the\n+\t\t\t * highest 32b of each 128b before mask\n+\t\t\t */\n+\t\t\t__m256i rss_hash6_7 =\n+\t\t\t\t_mm256_slli_epi64(raw_desc_bh6_7, 32);\n+\t\t\t__m256i rss_hash4_5 =\n+\t\t\t\t_mm256_slli_epi64(raw_desc_bh4_5, 32);\n+\t\t\t__m256i rss_hash2_3 =\n+\t\t\t\t_mm256_slli_epi64(raw_desc_bh2_3, 32);\n+\t\t\t__m256i rss_hash0_1 =\n+\t\t\t\t_mm256_slli_epi64(raw_desc_bh0_1, 32);\n+\n+\t\t\t__m256i rss_hash_msk =\n+\t\t\t\t_mm256_set_epi32(0xFFFFFFFF, 0, 0, 0,\n+\t\t\t\t\t\t 0xFFFFFFFF, 0, 0, 0);\n+\n+\t\t\trss_hash6_7 = _mm256_and_si256\n+\t\t\t\t\t(rss_hash6_7, rss_hash_msk);\n+\t\t\trss_hash4_5 = _mm256_and_si256\n+\t\t\t\t\t(rss_hash4_5, rss_hash_msk);\n+\t\t\trss_hash2_3 = _mm256_and_si256\n+\t\t\t\t\t(rss_hash2_3, rss_hash_msk);\n+\t\t\trss_hash0_1 = _mm256_and_si256\n+\t\t\t\t\t(rss_hash0_1, rss_hash_msk);\n+\n+\t\t\tmb6_7 = _mm256_or_si256(mb6_7, rss_hash6_7);\n+\t\t\tmb4_5 = _mm256_or_si256(mb4_5, rss_hash4_5);\n+\t\t\tmb2_3 = _mm256_or_si256(mb2_3, rss_hash2_3);\n+\t\t\tmb0_1 = _mm256_or_si256(mb0_1, rss_hash0_1);\n+\t\t} /* if() on RSS hash parsing */\n+#endif\n \t\t/**\n \t\t * At this point, we have the 8 sets of flags in the low 16-bits\n \t\t * of each 32-bit value in vlan0.\ndiff --git a/drivers/net/ice/ice_rxtx_vec_sse.c b/drivers/net/ice/ice_rxtx_vec_sse.c\nindex 382ef31f3..fffb27138 100644\n--- a/drivers/net/ice/ice_rxtx_vec_sse.c\n+++ b/drivers/net/ice/ice_rxtx_vec_sse.c\n@@ -230,7 +230,8 @@ _ice_recv_raw_pkts_vec(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \tconst __m128i zero = _mm_setzero_si128();\n \t/* mask to shuffle from desc. to mbuf */\n \tconst __m128i shuf_msk = _mm_set_epi8\n-\t\t\t(15, 14, 13, 12,  /* octet 12~15, 32 bits rss */\n+\t\t\t(0xFF, 0xFF,\n+\t\t\t 0xFF, 0xFF,  /* rss hash parsed separately */\n \t\t\t 11, 10,      /* octet 10~11, 16 bits vlan_macip */\n \t\t\t 5, 4,        /* octet 4~5, 16 bits data_len */\n \t\t\t 0xFF, 0xFF,  /* skip high 16 bits pkt_len, zero out */\n@@ -321,7 +322,7 @@ _ice_recv_raw_pkts_vec(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \t     pos += ICE_DESCS_PER_LOOP,\n \t     rxdp += ICE_DESCS_PER_LOOP) {\n \t\t__m128i descs[ICE_DESCS_PER_LOOP];\n-\t\t__m128i pkt_mb1, pkt_mb2, pkt_mb3, pkt_mb4;\n+\t\t__m128i pkt_mb0, pkt_mb1, pkt_mb2, pkt_mb3;\n \t\t__m128i staterr, sterr_tmp1, sterr_tmp2;\n \t\t/* 2 64 bit or 4 32 bit mbuf pointers in one XMM reg. */\n \t\t__m128i mbp1;\n@@ -367,8 +368,12 @@ _ice_recv_raw_pkts_vec(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \t\trte_compiler_barrier();\n \n \t\t/* D.1 pkt 3,4 convert format from desc to pktmbuf */\n-\t\tpkt_mb4 = _mm_shuffle_epi8(descs[3], shuf_msk);\n-\t\tpkt_mb3 = _mm_shuffle_epi8(descs[2], shuf_msk);\n+\t\tpkt_mb3 = _mm_shuffle_epi8(descs[3], shuf_msk);\n+\t\tpkt_mb2 = _mm_shuffle_epi8(descs[2], shuf_msk);\n+\n+\t\t/* D.1 pkt 1,2 convert format from desc to pktmbuf */\n+\t\tpkt_mb1 = _mm_shuffle_epi8(descs[1], shuf_msk);\n+\t\tpkt_mb0 = _mm_shuffle_epi8(descs[0], shuf_msk);\n \n \t\t/* C.1 4=>2 filter staterr info only */\n \t\tsterr_tmp2 = _mm_unpackhi_epi32(descs[3], descs[2]);\n@@ -378,12 +383,68 @@ _ice_recv_raw_pkts_vec(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \t\tice_rx_desc_to_olflags_v(rxq, descs, &rx_pkts[pos]);\n \n \t\t/* D.2 pkt 3,4 set in_port/nb_seg and remove crc */\n-\t\tpkt_mb4 = _mm_add_epi16(pkt_mb4, crc_adjust);\n \t\tpkt_mb3 = _mm_add_epi16(pkt_mb3, crc_adjust);\n+\t\tpkt_mb2 = _mm_add_epi16(pkt_mb2, crc_adjust);\n \n-\t\t/* D.1 pkt 1,2 convert format from desc to pktmbuf */\n-\t\tpkt_mb2 = _mm_shuffle_epi8(descs[1], shuf_msk);\n-\t\tpkt_mb1 = _mm_shuffle_epi8(descs[0], shuf_msk);\n+\t\t/* D.2 pkt 1,2 set in_port/nb_seg and remove crc */\n+\t\tpkt_mb1 = _mm_add_epi16(pkt_mb1, crc_adjust);\n+\t\tpkt_mb0 = _mm_add_epi16(pkt_mb0, crc_adjust);\n+\n+#ifndef RTE_LIBRTE_ICE_16BYTE_RX_DESC\n+\t\t/**\n+\t\t * needs to load 2nd 16B of each desc for RSS hash parsing,\n+\t\t * will cause performance drop to get into this context.\n+\t\t */\n+\t\tif (rxq->vsi->adapter->eth_dev->data->dev_conf.rxmode.offloads &\n+\t\t\t\tDEV_RX_OFFLOAD_RSS_HASH) {\n+\t\t\t/* load bottom half of every 32B desc */\n+\t\t\tconst __m128i raw_desc_bh3 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[3].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh2 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[2].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh1 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[1].wb.status_error1));\n+\t\t\trte_compiler_barrier();\n+\t\t\tconst __m128i raw_desc_bh0 =\n+\t\t\t\t_mm_load_si128\n+\t\t\t\t\t((void *)(&rxdp[0].wb.status_error1));\n+\n+\t\t\t/**\n+\t\t\t * to shift the 32b RSS hash value to the\n+\t\t\t * highest 32b of each 128b before mask\n+\t\t\t */\n+\t\t\t__m128i rss_hash3 =\n+\t\t\t\t_mm_slli_epi64(raw_desc_bh3, 32);\n+\t\t\t__m128i rss_hash2 =\n+\t\t\t\t_mm_slli_epi64(raw_desc_bh2, 32);\n+\t\t\t__m128i rss_hash1 =\n+\t\t\t\t_mm_slli_epi64(raw_desc_bh1, 32);\n+\t\t\t__m128i rss_hash0 =\n+\t\t\t\t_mm_slli_epi64(raw_desc_bh0, 32);\n+\n+\t\t\t__m128i rss_hash_msk =\n+\t\t\t\t_mm_set_epi32(0xFFFFFFFF, 0, 0, 0);\n+\n+\t\t\trss_hash3 = _mm_and_si128\n+\t\t\t\t\t(rss_hash3, rss_hash_msk);\n+\t\t\trss_hash2 = _mm_and_si128\n+\t\t\t\t\t(rss_hash2, rss_hash_msk);\n+\t\t\trss_hash1 = _mm_and_si128\n+\t\t\t\t\t(rss_hash1, rss_hash_msk);\n+\t\t\trss_hash0 = _mm_and_si128\n+\t\t\t\t\t(rss_hash0, rss_hash_msk);\n+\n+\t\t\tpkt_mb3 = _mm_or_si128(pkt_mb3, rss_hash3);\n+\t\t\tpkt_mb2 = _mm_or_si128(pkt_mb2, rss_hash2);\n+\t\t\tpkt_mb1 = _mm_or_si128(pkt_mb1, rss_hash1);\n+\t\t\tpkt_mb0 = _mm_or_si128(pkt_mb0, rss_hash0);\n+\t\t} /* if() on RSS hash parsing */\n+#endif\n \n \t\t/* C.2 get 4 pkts staterr value  */\n \t\tstaterr = _mm_unpacklo_epi32(sterr_tmp1, sterr_tmp2);\n@@ -391,14 +452,10 @@ _ice_recv_raw_pkts_vec(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \t\t/* D.3 copy final 3,4 data to rx_pkts */\n \t\t_mm_storeu_si128\n \t\t\t((void *)&rx_pkts[pos + 3]->rx_descriptor_fields1,\n-\t\t\t pkt_mb4);\n+\t\t\t pkt_mb3);\n \t\t_mm_storeu_si128\n \t\t\t((void *)&rx_pkts[pos + 2]->rx_descriptor_fields1,\n-\t\t\t pkt_mb3);\n-\n-\t\t/* D.2 pkt 1,2 set in_port/nb_seg and remove crc */\n-\t\tpkt_mb2 = _mm_add_epi16(pkt_mb2, crc_adjust);\n-\t\tpkt_mb1 = _mm_add_epi16(pkt_mb1, crc_adjust);\n+\t\t\t pkt_mb2);\n \n \t\t/* C* extract and record EOP bit */\n \t\tif (split_packet) {\n@@ -422,9 +479,9 @@ _ice_recv_raw_pkts_vec(struct ice_rx_queue *rxq, struct rte_mbuf **rx_pkts,\n \t\t/* D.3 copy final 1,2 data to rx_pkts */\n \t\t_mm_storeu_si128\n \t\t\t((void *)&rx_pkts[pos + 1]->rx_descriptor_fields1,\n-\t\t\t pkt_mb2);\n+\t\t\t pkt_mb1);\n \t\t_mm_storeu_si128((void *)&rx_pkts[pos]->rx_descriptor_fields1,\n-\t\t\t\t pkt_mb1);\n+\t\t\t\t pkt_mb0);\n \t\tice_rx_desc_to_ptype_v(descs, &rx_pkts[pos], ptype_tbl);\n \t\t/* C.4 calc avaialbe number of desc */\n \t\tvar = __builtin_popcountll(_mm_cvtsi128_si64(staterr));\n",
    "prefixes": [
        "v2",
        "1/5"
    ]
}