net/mlx5e: SHAMPO, Re-enable HW-GRO

Add back HW-GRO to the reported features.

As the current implementation of HW-GRO uses KSMs with a specific fixed buffer size (256B) to map its headers buffer, we report the feature only if the NIC supports KSM and the minimum value for buffer size is below the requested one.

iperf3 bandwidth comparison:

+---------+--------+--------+-----------+
| streams | SW GRO | HW GRO | Unit      |
|---------+--------+--------+-----------|
| 1       | 36     | 42     | Gbits/sec |
| 4       | 34     | 39     | Gbits/sec |
| 8       | 31     | 35     | Gbits/sec |
+---------+--------+--------+-----------+

A downstream patch will add skb fragment coalescing which will improve performance considerably.

Benchmark details:
- VM based setup
- CPU: Intel(R) Xeon(R) Platinum 8380 CPU, 24 cores
- NIC: ConnectX-7 100GbE
- iperf3 and irq running on same CPU over a single receive queue

Signed-off-by: Yoray Zack <yorayz@nvidia.com>
Signed-off-by: Tariq Toukan <tariqt@nvidia.com>
Link: https://lore.kernel.org/r/20240603212219.1037656-14-tariqt@nvidia.com
Signed-off-by: Jakub Kicinski <kuba@kernel.org>
author: Yoray Zack <yorayz@nvidia.com> 2024-06-04 00:22:18 +0300
committer: Jakub Kicinski <kuba@kernel.org> 2024-06-05 20:20:46 -0700
commit: 99be56171fa9ffea494dfe3d4a7f6e7e51630c2e (patch)
tree: b1288b786bf10d0d31facc6cd8dffc4b0b4acc7c /include/linux
parent: 758191c9ea7bcc45dd99398a538ae4ab27c4029e (diff)
download: linux-99be56171fa9ffea494dfe3d4a7f6e7e51630c2e.tar.gz
linux-99be56171fa9ffea494dfe3d4a7f6e7e51630c2e.tar.bz2
linux-99be56171fa9ffea494dfe3d4a7f6e7e51630c2e.zip
1 files changed, 11 insertions, 5 deletions
diff --git a/include/linux/mlx5/mlx5_ifc.h b/include/linux/mlx5/mlx5_ifc.h
index 5df52e15f7d6..17acd0f3ca8e 100644
--- a/include/linux/mlx5/mlx5_ifc.h
+++ b/include/linux/mlx5/mlx5_ifc.h
@@ -1526,8 +1526,7 @@ struct mlx5_ifc_cmd_hca_cap_bits {
 	u8         ts_cqe_to_dest_cqn[0x1];
 	u8         reserved_at_b3[0x6];
 	u8         go_back_n[0x1];
-	u8         shampo[0x1];
-	u8         reserved_at_bb[0x5];
+	u8         reserved_at_ba[0x6];
 
 	u8         max_sgl_for_optimized_performance[0x8];
 	u8         log_max_cq_sz[0x8];
@@ -1744,7 +1743,9 @@ struct mlx5_ifc_cmd_hca_cap_bits {
 	u8         reserved_at_280[0x10];
 	u8         max_wqe_sz_sq[0x10];
 
-	u8         reserved_at_2a0[0x10];
+	u8         reserved_at_2a0[0xb];
+	u8         shampo[0x1];
+	u8         reserved_at_2ac[0x4];
 	u8         max_wqe_sz_rq[0x10];
 
 	u8         max_flow_counter_31_16[0x10];
@@ -2017,7 +2018,8 @@ struct mlx5_ifc_cmd_hca_cap_2_bits {
 	u8	   reserved_at_250[0x10];
 
 	u8	   reserved_at_260[0x120];
-	u8	   reserved_at_380[0x10];
+	u8	   reserved_at_380[0xb];
+	u8	   min_mkey_log_entity_size_fixed_buffer[0x5];
 	u8	   ec_vf_vport_base[0x10];
 
 	u8	   reserved_at_3a0[0x10];
@@ -2029,7 +2031,11 @@ struct mlx5_ifc_cmd_hca_cap_2_bits {
 	u8	   pcc_ifa2[0x1];
 	u8	   reserved_at_3f1[0xf];
 
-	u8	   reserved_at_400[0x400];
+	u8	   reserved_at_400[0x1];
+	u8	   min_mkey_log_entity_size_fixed_buffer_valid[0x1];
+	u8	   reserved_at_402[0x1e];
+
+	u8	   reserved_at_420[0x3e0];
 };
 
 enum mlx5_ifc_flow_destination_type {
author	Yoray Zack <yorayz@nvidia.com>	2024-06-04 00:22:18 +0300
committer	Jakub Kicinski <kuba@kernel.org>	2024-06-05 20:20:46 -0700
commit	99be56171fa9ffea494dfe3d4a7f6e7e51630c2e (patch)
tree	b1288b786bf10d0d31facc6cd8dffc4b0b4acc7c /include/linux
parent	758191c9ea7bcc45dd99398a538ae4ab27c4029e (diff)
download	linux-99be56171fa9ffea494dfe3d4a7f6e7e51630c2e.tar.gz linux-99be56171fa9ffea494dfe3d4a7f6e7e51630c2e.tar.bz2 linux-99be56171fa9ffea494dfe3d4a7f6e7e51630c2e.zip