mlx5_en_main.c revision 353191
/*-
 * Copyright (c) 2015-2018 Mellanox Technologies. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS `AS IS' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $FreeBSD: stable/11/sys/dev/mlx5/mlx5_en/mlx5_en_main.c 353191 2019-10-07 08:41:53Z hselasky $
 */

#include "en.h"

#include <sys/sockio.h>
#include <machine/atomic.h>

#ifndef ETH_DRIVER_VERSION
#define ETH_DRIVER_VERSION "3.5.1"
#endif
#define DRIVER_RELDATE "April 2019"

static const char mlx5e_version[] = "mlx5en: Mellanox Ethernet driver "
	ETH_DRIVER_VERSION " (" DRIVER_RELDATE ")\n";

static int mlx5e_get_wqe_sz(struct mlx5e_priv *priv, u32 *wqe_sz, u32 *nsegs);

struct mlx5e_channel_param {
	struct mlx5e_rq_param rq;
	struct mlx5e_sq_param sq;
	struct mlx5e_cq_param rx_cq;
	struct mlx5e_cq_param tx_cq;
};

struct media {
	u32	subtype;
	u64	baudrate;
};

static const struct media mlx5e_mode_table[MLX5E_LINK_SPEEDS_NUMBER][MLX5E_LINK_MODES_NUMBER] = {

	[MLX5E_1000BASE_CX_SGMII][MLX5E_SGMII] = {
		.subtype = IFM_1000_CX_SGMII,
		.baudrate = IF_Mbps(1000ULL),
	},
	[MLX5E_1000BASE_KX][MLX5E_KX] = {
		.subtype = IFM_1000_KX,
		.baudrate = IF_Mbps(1000ULL),
	},
	[MLX5E_10GBASE_CX4][MLX5E_CX4] = {
		.subtype = IFM_10G_CX4,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_KX4][MLX5E_KX4] = {
		.subtype = IFM_10G_KX4,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_KR][MLX5E_KR] = {
		.subtype = IFM_10G_KR,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_20GBASE_KR2][MLX5E_KR2] = {
		.subtype = IFM_20G_KR2,
		.baudrate = IF_Gbps(20ULL),
	},
	[MLX5E_40GBASE_CR4][MLX5E_CR4] = {
		.subtype = IFM_40G_CR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_40GBASE_KR4][MLX5E_KR4] = {
		.subtype = IFM_40G_KR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_56GBASE_R4][MLX5E_R] = {
		.subtype = IFM_56G_R4,
		.baudrate = IF_Gbps(56ULL),
	},
	[MLX5E_10GBASE_CR][MLX5E_CR1] = {
		.subtype = IFM_10G_CR1,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_SR][MLX5E_SR] = {
		.subtype = IFM_10G_SR,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_ER_LR][MLX5E_ER] = {
		.subtype = IFM_10G_ER,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_ER_LR][MLX5E_LR] = {
		.subtype = IFM_10G_LR,
		.baudrate = IF_Gbps(10ULL),
	},
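	/*
	 * Note: this table and mlx5e_ext_mode_table below are indexed
	 * by [PTYS speed bit][cable/module type]. mlx5e_update_carrier()
	 * selects a row via ilog2() of the operational protocol mask
	 * and scans the columns for the first entry with a non-zero
	 * baudrate.
	 */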
	[MLX5E_40GBASE_SR4][MLX5E_SR4] = {
		.subtype = IFM_40G_SR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_40GBASE_LR4_ER4][MLX5E_LR4] = {
		.subtype = IFM_40G_LR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_40GBASE_LR4_ER4][MLX5E_ER4] = {
		.subtype = IFM_40G_ER4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_100GBASE_CR4][MLX5E_CR4] = {
		.subtype = IFM_100G_CR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_100GBASE_SR4][MLX5E_SR4] = {
		.subtype = IFM_100G_SR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_100GBASE_KR4][MLX5E_KR4] = {
		.subtype = IFM_100G_KR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_100GBASE_LR4][MLX5E_LR4] = {
		.subtype = IFM_100G_LR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_100BASE_TX][MLX5E_TX] = {
		.subtype = IFM_100_TX,
		.baudrate = IF_Mbps(100ULL),
	},
	[MLX5E_1000BASE_T][MLX5E_T] = {
		.subtype = IFM_1000_T,
		.baudrate = IF_Mbps(1000ULL),
	},
	[MLX5E_10GBASE_T][MLX5E_T] = {
		.subtype = IFM_10G_T,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_25GBASE_CR][MLX5E_CR] = {
		.subtype = IFM_25G_CR,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GBASE_KR][MLX5E_KR] = {
		.subtype = IFM_25G_KR,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GBASE_SR][MLX5E_SR] = {
		.subtype = IFM_25G_SR,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_50GBASE_CR2][MLX5E_CR2] = {
		.subtype = IFM_50G_CR2,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GBASE_KR2][MLX5E_KR2] = {
		.subtype = IFM_50G_KR2,
		.baudrate = IF_Gbps(50ULL),
	},
};

static const struct media mlx5e_ext_mode_table[MLX5E_EXT_LINK_SPEEDS_NUMBER][MLX5E_LINK_MODES_NUMBER] = {
	[MLX5E_SGMII_100M][MLX5E_SGMII] = {
		.subtype = IFM_100_SGMII,
		.baudrate = IF_Mbps(100),
	},
	[MLX5E_1000BASE_X_SGMII][MLX5E_KX] = {
		.subtype = IFM_1000_KX,
		.baudrate = IF_Mbps(1000),
	},
	[MLX5E_1000BASE_X_SGMII][MLX5E_CX_SGMII] = {
		.subtype = IFM_1000_CX_SGMII,
		.baudrate = IF_Mbps(1000),
	},
	[MLX5E_1000BASE_X_SGMII][MLX5E_CX] = {
		.subtype = IFM_1000_CX,
		.baudrate = IF_Mbps(1000),
	},
	[MLX5E_1000BASE_X_SGMII][MLX5E_LX] = {
		.subtype = IFM_1000_LX,
		.baudrate = IF_Mbps(1000),
	},
	[MLX5E_1000BASE_X_SGMII][MLX5E_SX] = {
		.subtype = IFM_1000_SX,
		.baudrate = IF_Mbps(1000),
	},
	[MLX5E_1000BASE_X_SGMII][MLX5E_T] = {
		.subtype = IFM_1000_T,
		.baudrate = IF_Mbps(1000),
	},
	[MLX5E_5GBASE_R][MLX5E_T] = {
		.subtype = IFM_5000_T,
		.baudrate = IF_Mbps(5000),
	},
	[MLX5E_5GBASE_R][MLX5E_KR] = {
		.subtype = IFM_5000_KR,
		.baudrate = IF_Mbps(5000),
	},
	[MLX5E_5GBASE_R][MLX5E_KR1] = {
		.subtype = IFM_5000_KR1,
		.baudrate = IF_Mbps(5000),
	},
	[MLX5E_5GBASE_R][MLX5E_KR_S] = {
		.subtype = IFM_5000_KR_S,
		.baudrate = IF_Mbps(5000),
	},
	[MLX5E_10GBASE_XFI_XAUI_1][MLX5E_ER] = {
		.subtype = IFM_10G_ER,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_XFI_XAUI_1][MLX5E_KR] = {
		.subtype = IFM_10G_KR,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_XFI_XAUI_1][MLX5E_LR] = {
		.subtype = IFM_10G_LR,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_XFI_XAUI_1][MLX5E_SR] = {
		.subtype = IFM_10G_SR,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_XFI_XAUI_1][MLX5E_T] = {
		.subtype = IFM_10G_T,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_XFI_XAUI_1][MLX5E_AOC] = {
		.subtype = IFM_10G_AOC,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_10GBASE_XFI_XAUI_1][MLX5E_CR1] = {
		.subtype = IFM_10G_CR1,
		.baudrate = IF_Gbps(10ULL),
	},
	[MLX5E_40GBASE_XLAUI_4_XLPPI_4][MLX5E_CR4] = {
		.subtype = IFM_40G_CR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_40GBASE_XLAUI_4_XLPPI_4][MLX5E_KR4] = {
		.subtype = IFM_40G_KR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_40GBASE_XLAUI_4_XLPPI_4][MLX5E_LR4] = {
		.subtype = IFM_40G_LR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_40GBASE_XLAUI_4_XLPPI_4][MLX5E_SR4] = {
		.subtype = IFM_40G_SR4,
		.baudrate = IF_Gbps(40ULL),
	},
	[MLX5E_40GBASE_XLAUI_4_XLPPI_4][MLX5E_ER4] = {
		.subtype = IFM_40G_ER4,
		.baudrate = IF_Gbps(40ULL),
	},

	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_CR] = {
		.subtype = IFM_25G_CR,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_KR] = {
		.subtype = IFM_25G_KR,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_SR] = {
		.subtype = IFM_25G_SR,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_ACC] = {
		.subtype = IFM_25G_ACC,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_AOC] = {
		.subtype = IFM_25G_AOC,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_CR1] = {
		.subtype = IFM_25G_CR1,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_CR_S] = {
		.subtype = IFM_25G_CR_S,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_KR1] = {
		.subtype = IFM_25G_KR1,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_KR_S] = {
		.subtype = IFM_25G_KR_S,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_LR] = {
		.subtype = IFM_25G_LR,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_25GAUI_1_25GBASE_CR_KR][MLX5E_T] = {
		.subtype = IFM_25G_T,
		.baudrate = IF_Gbps(25ULL),
	},
	[MLX5E_50GAUI_2_LAUI_2_50GBASE_CR2_KR2][MLX5E_CR2] = {
		.subtype = IFM_50G_CR2,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_2_LAUI_2_50GBASE_CR2_KR2][MLX5E_KR2] = {
		.subtype = IFM_50G_KR2,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_2_LAUI_2_50GBASE_CR2_KR2][MLX5E_SR2] = {
		.subtype = IFM_50G_SR2,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_2_LAUI_2_50GBASE_CR2_KR2][MLX5E_LR2] = {
		.subtype = IFM_50G_LR2,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_1_LAUI_1_50GBASE_CR_KR][MLX5E_LR] = {
		.subtype = IFM_50G_LR,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_1_LAUI_1_50GBASE_CR_KR][MLX5E_SR] = {
		.subtype = IFM_50G_SR,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_1_LAUI_1_50GBASE_CR_KR][MLX5E_CP] = {
		.subtype = IFM_50G_CP,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_1_LAUI_1_50GBASE_CR_KR][MLX5E_FR] = {
		.subtype = IFM_50G_FR,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_50GAUI_1_LAUI_1_50GBASE_CR_KR][MLX5E_KR_PAM4] = {
		.subtype = IFM_50G_KR_PAM4,
		.baudrate = IF_Gbps(50ULL),
	},
	[MLX5E_CAUI_4_100GBASE_CR4_KR4][MLX5E_CR4] = {
		.subtype = IFM_100G_CR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_CAUI_4_100GBASE_CR4_KR4][MLX5E_KR4] = {
		.subtype = IFM_100G_KR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_CAUI_4_100GBASE_CR4_KR4][MLX5E_LR4] = {
		.subtype = IFM_100G_LR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_CAUI_4_100GBASE_CR4_KR4][MLX5E_SR4] = {
		.subtype = IFM_100G_SR4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_100GAUI_2_100GBASE_CR2_KR2][MLX5E_SR2] = {
		.subtype = IFM_100G_SR2,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_100GAUI_2_100GBASE_CR2_KR2][MLX5E_CP2] = {
		.subtype = IFM_100G_CP2,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_100GAUI_2_100GBASE_CR2_KR2][MLX5E_KR2_PAM4] = {
		.subtype = IFM_100G_KR2_PAM4,
		.baudrate = IF_Gbps(100ULL),
	},
	[MLX5E_200GAUI_4_200GBASE_CR4_KR4][MLX5E_DR4] = {
		.subtype = IFM_200G_DR4,
		.baudrate = IF_Gbps(200ULL),
	},
	[MLX5E_200GAUI_4_200GBASE_CR4_KR4][MLX5E_LR4] = {
		.subtype = IFM_200G_LR4,
		.baudrate = IF_Gbps(200ULL),
	},
	[MLX5E_200GAUI_4_200GBASE_CR4_KR4][MLX5E_SR4] = {
		.subtype = IFM_200G_SR4,
		.baudrate = IF_Gbps(200ULL),
	},
	[MLX5E_200GAUI_4_200GBASE_CR4_KR4][MLX5E_FR4] = {
		.subtype = IFM_200G_FR4,
		.baudrate = IF_Gbps(200ULL),
	},
	[MLX5E_200GAUI_4_200GBASE_CR4_KR4][MLX5E_CR4_PAM4] = {
		.subtype = IFM_200G_CR4_PAM4,
		.baudrate = IF_Gbps(200ULL),
	},
	[MLX5E_200GAUI_4_200GBASE_CR4_KR4][MLX5E_KR4_PAM4] = {
		.subtype = IFM_200G_KR4_PAM4,
		.baudrate = IF_Gbps(200ULL),
	},
};

MALLOC_DEFINE(M_MLX5EN, "MLX5EN", "MLX5 Ethernet");

static void
mlx5e_update_carrier(struct mlx5e_priv *priv)
{
	struct mlx5_core_dev *mdev = priv->mdev;
	u32 out[MLX5_ST_SZ_DW(ptys_reg)];
	u32 eth_proto_oper;
	int error;
	u8 port_state;
	u8 is_er_type;
	u8 i, j;
	bool ext;
	struct media media_entry = {};

	port_state = mlx5_query_vport_state(mdev,
	    MLX5_QUERY_VPORT_STATE_IN_OP_MOD_VNIC_VPORT, 0);

	if (port_state == VPORT_STATE_UP) {
		priv->media_status_last |= IFM_ACTIVE;
	} else {
		priv->media_status_last &= ~IFM_ACTIVE;
		priv->media_active_last = IFM_ETHER;
		if_link_state_change(priv->ifp, LINK_STATE_DOWN);
		return;
	}

	error = mlx5_query_port_ptys(mdev, out, sizeof(out),
	    MLX5_PTYS_EN, 1);
	if (error) {
		priv->media_active_last = IFM_ETHER;
		priv->ifp->if_baudrate = 1;
		if_printf(priv->ifp, "%s: query port ptys failed: "
		    "0x%x\n", __func__, error);
		return;
	}

	ext = MLX5_CAP_PCAM_FEATURE(mdev, ptys_extended_ethernet);
	eth_proto_oper = MLX5_GET_ETH_PROTO(ptys_reg, out, ext,
	    eth_proto_oper);

	i = ilog2(eth_proto_oper);
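	/*
	 * Only one protocol bit is expected to be set in
	 * eth_proto_oper while the link is up, so ilog2() yields the
	 * speed row to look up in the media tables above.
	 */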
	for (j = 0; j != MLX5E_LINK_MODES_NUMBER; j++) {
		media_entry = ext ? mlx5e_ext_mode_table[i][j] :
		    mlx5e_mode_table[i][j];
		if (media_entry.baudrate != 0)
			break;
	}

	if (media_entry.subtype == 0) {
		if_printf(priv->ifp, "%s: Could not find operational "
		    "media subtype\n", __func__);
		return;
	}

	switch (media_entry.subtype) {
	case IFM_10G_ER:
		error = mlx5_query_pddr_range_info(mdev, 1, &is_er_type);
		if (error != 0) {
			if_printf(priv->ifp, "%s: query port pddr failed: %d\n",
			    __func__, error);
		}
		if (error != 0 || is_er_type == 0)
			media_entry.subtype = IFM_10G_LR;
		break;
	case IFM_40G_LR4:
		error = mlx5_query_pddr_range_info(mdev, 1, &is_er_type);
		if (error != 0) {
			if_printf(priv->ifp, "%s: query port pddr failed: %d\n",
			    __func__, error);
		}
		if (error == 0 && is_er_type != 0)
			media_entry.subtype = IFM_40G_ER4;
		break;
	}
	priv->media_active_last = media_entry.subtype | IFM_ETHER | IFM_FDX;
	priv->ifp->if_baudrate = media_entry.baudrate;

	if_link_state_change(priv->ifp, LINK_STATE_UP);
}

static void
mlx5e_media_status(struct ifnet *dev, struct ifmediareq *ifmr)
{
	struct mlx5e_priv *priv = dev->if_softc;

	ifmr->ifm_status = priv->media_status_last;
	ifmr->ifm_active = priv->media_active_last |
	    (priv->params.rx_pauseframe_control ? IFM_ETH_RXPAUSE : 0) |
	    (priv->params.tx_pauseframe_control ? IFM_ETH_TXPAUSE : 0);
}

static u32
mlx5e_find_link_mode(u32 subtype, bool ext)
{
	u32 i;
	u32 j;
	u32 link_mode = 0;
	u32 speeds_num = 0;
	struct media media_entry = {};

	switch (subtype) {
	case IFM_10G_LR:
		subtype = IFM_10G_ER;
		break;
	case IFM_40G_ER4:
		subtype = IFM_40G_LR4;
		break;
	}

	speeds_num = ext ? MLX5E_EXT_LINK_SPEEDS_NUMBER :
	    MLX5E_LINK_SPEEDS_NUMBER;
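	/*
	 * Scan the whole table: the same IFM_* subtype may be
	 * reachable through several speed rows, and every matching
	 * row must be OR'ed into the PTYS protocol mask requested
	 * from firmware.
	 */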
	for (i = 0; i != speeds_num; i++) {
		for (j = 0; j < MLX5E_LINK_MODES_NUMBER; ++j) {
			media_entry = ext ? mlx5e_ext_mode_table[i][j] :
			    mlx5e_mode_table[i][j];
			if (media_entry.baudrate == 0)
				continue;
			if (media_entry.subtype == subtype) {
				link_mode |= MLX5E_PROT_MASK(i);
			}
		}
	}

	return (link_mode);
}

static int
mlx5e_set_port_pause_and_pfc(struct mlx5e_priv *priv)
{
	return (mlx5_set_port_pause_and_pfc(priv->mdev, 1,
	    priv->params.rx_pauseframe_control,
	    priv->params.tx_pauseframe_control,
	    priv->params.rx_priority_flow_control,
	    priv->params.tx_priority_flow_control));
}

static int
mlx5e_set_port_pfc(struct mlx5e_priv *priv)
{
	int error;

	if (priv->gone != 0) {
		error = -ENXIO;
	} else if (priv->params.rx_pauseframe_control ||
	    priv->params.tx_pauseframe_control) {
		if_printf(priv->ifp,
		    "Global pauseframes must be disabled before "
		    "enabling PFC.\n");
		error = -EINVAL;
	} else {
		error = mlx5e_set_port_pause_and_pfc(priv);
	}
	return (error);
}

static int
mlx5e_media_change(struct ifnet *dev)
{
	struct mlx5e_priv *priv = dev->if_softc;
	struct mlx5_core_dev *mdev = priv->mdev;
	u32 eth_proto_cap;
	u32 link_mode;
	u32 out[MLX5_ST_SZ_DW(ptys_reg)];
	int was_opened;
	int locked;
	int error;
	bool ext;

	locked = PRIV_LOCKED(priv);
	if (!locked)
		PRIV_LOCK(priv);

	if (IFM_TYPE(priv->media.ifm_media) != IFM_ETHER) {
		error = EINVAL;
		goto done;
	}

	error = mlx5_query_port_ptys(mdev, out, sizeof(out),
	    MLX5_PTYS_EN, 1);
	if (error != 0) {
		if_printf(dev, "Query port media capability failed\n");
		goto done;
	}

	ext = MLX5_CAP_PCAM_FEATURE(mdev, ptys_extended_ethernet);
	link_mode = mlx5e_find_link_mode(IFM_SUBTYPE(priv->media.ifm_media), ext);

	/* query supported capabilities */
	eth_proto_cap = MLX5_GET_ETH_PROTO(ptys_reg, out, ext,
	    eth_proto_capability);

	/* check for autoselect */
	if (IFM_SUBTYPE(priv->media.ifm_media) == IFM_AUTO) {
		link_mode = eth_proto_cap;
		if (link_mode == 0) {
			if_printf(dev, "Port media capability is zero\n");
			error = EINVAL;
			goto done;
		}
	} else {
		link_mode = link_mode & eth_proto_cap;
		if (link_mode == 0) {
			if_printf(dev, "Unsupported link mode requested\n");
			error = EINVAL;
			goto done;
		}
	}
	if (priv->media.ifm_media & (IFM_ETH_RXPAUSE | IFM_ETH_TXPAUSE)) {
		/* check if PFC is enabled */
		if (priv->params.rx_priority_flow_control ||
		    priv->params.tx_priority_flow_control) {
			if_printf(dev, "PFC must be disabled before enabling global pauseframes.\n");
			error = EINVAL;
			goto done;
		}
	}
	/* update pauseframe control bits */
	priv->params.rx_pauseframe_control =
	    (priv->media.ifm_media & IFM_ETH_RXPAUSE) ? 1 : 0;
	priv->params.tx_pauseframe_control =
	    (priv->media.ifm_media & IFM_ETH_TXPAUSE) ? 1 : 0;
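	/*
	 * Note: the sequence below briefly forces the port down, as
	 * changes to the PTYS admin protocol mask are expected to take
	 * effect on the next port-up transition.
	 */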
	/* check if device is opened */
	was_opened = test_bit(MLX5E_STATE_OPENED, &priv->state);

	/* reconfigure the hardware */
	mlx5_set_port_status(mdev, MLX5_PORT_DOWN);
	mlx5_set_port_proto(mdev, link_mode, MLX5_PTYS_EN, ext);
	error = -mlx5e_set_port_pause_and_pfc(priv);
	if (was_opened)
		mlx5_set_port_status(mdev, MLX5_PORT_UP);

done:
	if (!locked)
		PRIV_UNLOCK(priv);
	return (error);
}

static void
mlx5e_update_carrier_work(struct work_struct *work)
{
	struct mlx5e_priv *priv = container_of(work, struct mlx5e_priv,
	    update_carrier_work);

	PRIV_LOCK(priv);
	if (test_bit(MLX5E_STATE_OPENED, &priv->state))
		mlx5e_update_carrier(priv);
	PRIV_UNLOCK(priv);
}

#define	MLX5E_PCIE_PERF_GET_64(a,b,c,d,e,f) \
	s_debug->c = MLX5_GET64(mpcnt_reg, out, counter_set.f.c);

#define	MLX5E_PCIE_PERF_GET_32(a,b,c,d,e,f) \
	s_debug->c = MLX5_GET(mpcnt_reg, out, counter_set.f.c);

static void
mlx5e_update_pcie_counters(struct mlx5e_priv *priv)
{
	struct mlx5_core_dev *mdev = priv->mdev;
	struct mlx5e_port_stats_debug *s_debug = &priv->stats.port_stats_debug;
	const unsigned sz = MLX5_ST_SZ_BYTES(mpcnt_reg);
	void *out;
	void *in;
	int err;

	/* allocate firmware request structures */
	in = mlx5_vzalloc(sz);
	out = mlx5_vzalloc(sz);
	if (in == NULL || out == NULL)
		goto free_out;

	MLX5_SET(mpcnt_reg, in, grp, MLX5_PCIE_PERFORMANCE_COUNTERS_GROUP);
	err = mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_MPCNT, 0, 0);
	if (err != 0)
		goto free_out;

	MLX5E_PCIE_PERFORMANCE_COUNTERS_64(MLX5E_PCIE_PERF_GET_64)
	MLX5E_PCIE_PERFORMANCE_COUNTERS_32(MLX5E_PCIE_PERF_GET_32)

	MLX5_SET(mpcnt_reg, in, grp, MLX5_PCIE_TIMERS_AND_STATES_COUNTERS_GROUP);
	err = mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_MPCNT, 0, 0);
	if (err != 0)
		goto free_out;

	MLX5E_PCIE_TIMERS_AND_STATES_COUNTERS_32(MLX5E_PCIE_PERF_GET_32)

	MLX5_SET(mpcnt_reg, in, grp, MLX5_PCIE_LANE_COUNTERS_GROUP);
	err = mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_MPCNT, 0, 0);
	if (err != 0)
		goto free_out;

	MLX5E_PCIE_LANE_COUNTERS_32(MLX5E_PCIE_PERF_GET_32)

free_out:
	/* free firmware request structures */
	kvfree(in);
	kvfree(out);
}

/*
 * This function reads the physical port counters from the firmware
 * using a pre-defined layout defined by various MLX5E_PPORT_XXX()
 * macros. The output is converted from big-endian 64-bit values into
 * host endian ones and stored in the "priv->stats.pport" structure.
 */
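/*
 * Layout note: the IEEE 802.3 group is copied starting at offset
 * MLX5E_PPORT_PER_PRIO_STATS_NUM within "s->arg", leaving the first
 * slots free for the per-priority counters gathered at the end of
 * this function.
 */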
static void
mlx5e_update_pport_counters(struct mlx5e_priv *priv)
{
	struct mlx5_core_dev *mdev = priv->mdev;
	struct mlx5e_pport_stats *s = &priv->stats.pport;
	struct mlx5e_port_stats_debug *s_debug = &priv->stats.port_stats_debug;
	u32 *in;
	u32 *out;
	const u64 *ptr;
	unsigned sz = MLX5_ST_SZ_BYTES(ppcnt_reg);
	unsigned x;
	unsigned y;
	unsigned z;

	/* allocate firmware request structures */
	in = mlx5_vzalloc(sz);
	out = mlx5_vzalloc(sz);
	if (in == NULL || out == NULL)
		goto free_out;

	/*
	 * Get pointer to the 64-bit counter set which is located at a
	 * fixed offset in the output firmware request structure:
	 */
	ptr = (const uint64_t *)MLX5_ADDR_OF(ppcnt_reg, out, counter_set);

	MLX5_SET(ppcnt_reg, in, local_port, 1);

	/* read IEEE802_3 counter group using predefined counter layout */
	MLX5_SET(ppcnt_reg, in, grp, MLX5_IEEE_802_3_COUNTERS_GROUP);
	mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
	for (x = 0, y = MLX5E_PPORT_PER_PRIO_STATS_NUM;
	    x != MLX5E_PPORT_IEEE802_3_STATS_NUM; x++, y++)
		s->arg[y] = be64toh(ptr[x]);

	/* read RFC2819 counter group using predefined counter layout */
	MLX5_SET(ppcnt_reg, in, grp, MLX5_RFC_2819_COUNTERS_GROUP);
	mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
	for (x = 0; x != MLX5E_PPORT_RFC2819_STATS_NUM; x++, y++)
		s->arg[y] = be64toh(ptr[x]);

	for (y = 0; x != MLX5E_PPORT_RFC2819_STATS_NUM +
	    MLX5E_PPORT_RFC2819_STATS_DEBUG_NUM; x++, y++)
		s_debug->arg[y] = be64toh(ptr[x]);

	/* read RFC2863 counter group using predefined counter layout */
	MLX5_SET(ppcnt_reg, in, grp, MLX5_RFC_2863_COUNTERS_GROUP);
	mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
	for (x = 0; x != MLX5E_PPORT_RFC2863_STATS_DEBUG_NUM; x++, y++)
		s_debug->arg[y] = be64toh(ptr[x]);

	/* read physical layer stats counter group using predefined counter layout */
	MLX5_SET(ppcnt_reg, in, grp, MLX5_PHYSICAL_LAYER_COUNTERS_GROUP);
	mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
	for (x = 0; x != MLX5E_PPORT_PHYSICAL_LAYER_STATS_DEBUG_NUM; x++, y++)
		s_debug->arg[y] = be64toh(ptr[x]);

	/* read Extended Ethernet counter group using predefined counter layout */
	MLX5_SET(ppcnt_reg, in, grp, MLX5_ETHERNET_EXTENDED_COUNTERS_GROUP);
	mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
	for (x = 0; x != MLX5E_PPORT_ETHERNET_EXTENDED_STATS_DEBUG_NUM; x++, y++)
		s_debug->arg[y] = be64toh(ptr[x]);

	/* read Extended Statistical Group */
	if (MLX5_CAP_GEN(mdev, pcam_reg) &&
	    MLX5_CAP_PCAM_FEATURE(mdev, ppcnt_statistical_group) &&
	    MLX5_CAP_PCAM_FEATURE(mdev, per_lane_error_counters)) {
		/* read Extended Statistical counter group using predefined counter layout */
		MLX5_SET(ppcnt_reg, in, grp, MLX5_PHYSICAL_LAYER_STATISTICAL_GROUP);
		mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);

		for (x = 0; x != MLX5E_PPORT_STATISTICAL_DEBUG_NUM; x++, y++)
			s_debug->arg[y] = be64toh(ptr[x]);
	}

	/* read PCIE counters */
	mlx5e_update_pcie_counters(priv);

	/* read per-priority counters */
	MLX5_SET(ppcnt_reg, in, grp, MLX5_PER_PRIORITY_COUNTERS_GROUP);

	/* iterate all the priorities */
	for (y = z = 0; z != MLX5E_PPORT_PER_PRIO_STATS_NUM_PRIO; z++) {
		MLX5_SET(ppcnt_reg, in, prio_tc, z);
		mlx5_core_access_reg(mdev, in, sz, out, sz,
		    MLX5_REG_PPCNT, 0, 0);

		/* read per priority stats counter group using predefined counter layout */
		for (x = 0; x != (MLX5E_PPORT_PER_PRIO_STATS_NUM /
		    MLX5E_PPORT_PER_PRIO_STATS_NUM_PRIO); x++, y++)
			s->arg[y] = be64toh(ptr[x]);
	}

free_out:
	/* free firmware request structures */
	kvfree(in);
	kvfree(out);
}

static void
mlx5e_grp_vnic_env_update_stats(struct mlx5e_priv *priv)
{
	u32 out[MLX5_ST_SZ_DW(query_vnic_env_out)] = {};
	u32 in[MLX5_ST_SZ_DW(query_vnic_env_in)] = {};

	if (!MLX5_CAP_GEN(priv->mdev, nic_receive_steering_discard))
		return;

	MLX5_SET(query_vnic_env_in, in, opcode,
	    MLX5_CMD_OP_QUERY_VNIC_ENV);
	MLX5_SET(query_vnic_env_in, in, op_mod, 0);
	MLX5_SET(query_vnic_env_in, in, other_vport, 0);

	if (mlx5_cmd_exec(priv->mdev, in, sizeof(in), out, sizeof(out)) != 0)
		return;

	priv->stats.vport.rx_steer_missed_packets =
	    MLX5_GET64(query_vnic_env_out, out,
	    vport_env.nic_receive_steering_discard);
}

/*
 * This function is called regularly to collect all statistics
 * counters from the firmware. The values can be viewed through the
 * sysctl interface. Execution is serialized using the priv's global
 * configuration lock.
 */
static void
mlx5e_update_stats_locked(struct mlx5e_priv *priv)
{
	struct mlx5_core_dev *mdev = priv->mdev;
	struct mlx5e_vport_stats *s = &priv->stats.vport;
	struct mlx5e_sq_stats *sq_stats;
	struct buf_ring *sq_br;
#if (__FreeBSD_version < 1100000)
	struct ifnet *ifp = priv->ifp;
#endif

	u32 in[MLX5_ST_SZ_DW(query_vport_counter_in)];
	u32 *out;
	int outlen = MLX5_ST_SZ_BYTES(query_vport_counter_out);
	u64 tso_packets = 0;
	u64 tso_bytes = 0;
	u64 tx_queue_dropped = 0;
	u64 tx_defragged = 0;
	u64 tx_offload_none = 0;
	u64 lro_packets = 0;
	u64 lro_bytes = 0;
	u64 sw_lro_queued = 0;
	u64 sw_lro_flushed = 0;
	u64 rx_csum_none = 0;
	u64 rx_wqe_err = 0;
	u64 rx_packets = 0;
	u64 rx_bytes = 0;
	u32 rx_out_of_buffer = 0;
	int i;
	int j;

	out = mlx5_vzalloc(outlen);
	if (out == NULL)
		goto free_out;

	/* Collect the SW counters first and then the HW ones, for consistency */
	for (i = 0; i < priv->params.num_channels; i++) {
		struct mlx5e_channel *pch = priv->channel + i;
		struct mlx5e_rq *rq = &pch->rq;
		struct mlx5e_rq_stats *rq_stats = &pch->rq.stats;

		/* collect stats from LRO */
		rq_stats->sw_lro_queued = rq->lro.lro_queued;
		rq_stats->sw_lro_flushed = rq->lro.lro_flushed;
		sw_lro_queued += rq_stats->sw_lro_queued;
		sw_lro_flushed += rq_stats->sw_lro_flushed;
		lro_packets += rq_stats->lro_packets;
		lro_bytes += rq_stats->lro_bytes;
		rx_csum_none += rq_stats->csum_none;
		rx_wqe_err += rq_stats->wqe_err;
		rx_packets += rq_stats->packets;
		rx_bytes += rq_stats->bytes;

		for (j = 0; j < priv->num_tc; j++) {
			sq_stats = &pch->sq[j].stats;
			sq_br = pch->sq[j].br;

			tso_packets += sq_stats->tso_packets;
			tso_bytes += sq_stats->tso_bytes;
			tx_queue_dropped += sq_stats->dropped;
			if (sq_br != NULL)
				tx_queue_dropped += sq_br->br_drops;
			tx_defragged += sq_stats->defragged;
			tx_offload_none += sq_stats->csum_offload_none;
		}
	}

	/* update counters */
	s->tso_packets = tso_packets;
	s->tso_bytes = tso_bytes;
	s->tx_queue_dropped = tx_queue_dropped;
	s->tx_defragged = tx_defragged;
	s->lro_packets = lro_packets;
	s->lro_bytes = lro_bytes;
	s->sw_lro_queued = sw_lro_queued;
	s->sw_lro_flushed = sw_lro_flushed;
	s->rx_csum_none = rx_csum_none;
	s->rx_wqe_err = rx_wqe_err;
	s->rx_packets = rx_packets;
	s->rx_bytes = rx_bytes;

	mlx5e_grp_vnic_env_update_stats(priv);

	/* HW counters */
	memset(in, 0, sizeof(in));

	MLX5_SET(query_vport_counter_in, in, opcode,
	    MLX5_CMD_OP_QUERY_VPORT_COUNTER);
	MLX5_SET(query_vport_counter_in, in, op_mod, 0);
	MLX5_SET(query_vport_counter_in, in, other_vport, 0);

	memset(out, 0, outlen);

	/* get number of out-of-buffer drops first */
	if (test_bit(MLX5E_STATE_OPENED, &priv->state) != 0 &&
	    mlx5_vport_query_out_of_rx_buffer(mdev, priv->counter_set_id,
	    &rx_out_of_buffer) == 0) {
		s->rx_out_of_buffer = rx_out_of_buffer;
	}

	/* get port statistics */
	if (mlx5_cmd_exec(mdev, in, sizeof(in), out, outlen) == 0) {
#define	MLX5_GET_CTR(out, x) \
	MLX5_GET64(query_vport_counter_out, out, x)

		s->rx_error_packets =
		    MLX5_GET_CTR(out, received_errors.packets);
		s->rx_error_bytes =
		    MLX5_GET_CTR(out, received_errors.octets);
		s->tx_error_packets =
		    MLX5_GET_CTR(out, transmit_errors.packets);
		s->tx_error_bytes =
		    MLX5_GET_CTR(out, transmit_errors.octets);

		s->rx_unicast_packets =
		    MLX5_GET_CTR(out, received_eth_unicast.packets);
		s->rx_unicast_bytes =
		    MLX5_GET_CTR(out, received_eth_unicast.octets);
		s->tx_unicast_packets =
		    MLX5_GET_CTR(out, transmitted_eth_unicast.packets);
		s->tx_unicast_bytes =
		    MLX5_GET_CTR(out, transmitted_eth_unicast.octets);

		s->rx_multicast_packets =
		    MLX5_GET_CTR(out, received_eth_multicast.packets);
		s->rx_multicast_bytes =
		    MLX5_GET_CTR(out, received_eth_multicast.octets);
		s->tx_multicast_packets =
		    MLX5_GET_CTR(out, transmitted_eth_multicast.packets);
		s->tx_multicast_bytes =
		    MLX5_GET_CTR(out, transmitted_eth_multicast.octets);

		s->rx_broadcast_packets =
		    MLX5_GET_CTR(out, received_eth_broadcast.packets);
		s->rx_broadcast_bytes =
		    MLX5_GET_CTR(out, received_eth_broadcast.octets);
		s->tx_broadcast_packets =
		    MLX5_GET_CTR(out, transmitted_eth_broadcast.packets);
		s->tx_broadcast_bytes =
		    MLX5_GET_CTR(out, transmitted_eth_broadcast.octets);

		s->tx_packets = s->tx_unicast_packets +
		    s->tx_multicast_packets + s->tx_broadcast_packets;
		s->tx_bytes = s->tx_unicast_bytes + s->tx_multicast_bytes +
		    s->tx_broadcast_bytes;

		/* Update calculated offload counters */
		s->tx_csum_offload = s->tx_packets - tx_offload_none;
		s->rx_csum_good = s->rx_packets - s->rx_csum_none;
	}

	/* Get physical port counters */
	mlx5e_update_pport_counters(priv);

	s->tx_jumbo_packets =
	    priv->stats.port_stats_debug.tx_stat_p1519to2047octets +
	    priv->stats.port_stats_debug.tx_stat_p2048to4095octets +
	    priv->stats.port_stats_debug.tx_stat_p4096to8191octets +
	    priv->stats.port_stats_debug.tx_stat_p8192to10239octets;

#if (__FreeBSD_version < 1100000)
	/* no get_counters interface in fbsd 10 */
	ifp->if_ipackets = s->rx_packets;
	ifp->if_ierrors = priv->stats.pport.in_range_len_errors +
	    priv->stats.pport.out_of_range_len +
	    priv->stats.pport.too_long_errors +
	    priv->stats.pport.check_seq_err +
	    priv->stats.pport.alignment_err;
	ifp->if_iqdrops = s->rx_out_of_buffer;
	ifp->if_opackets = s->tx_packets;
	ifp->if_oerrors = priv->stats.port_stats_debug.out_discards;
	ifp->if_snd.ifq_drops = s->tx_queue_dropped;
	ifp->if_ibytes = s->rx_bytes;
	ifp->if_obytes = s->tx_bytes;
	ifp->if_collisions =
	    priv->stats.pport.collisions;
#endif

free_out:
	kvfree(out);

	/* Update diagnostics, if any */
	if (priv->params_ethtool.diag_pci_enable ||
	    priv->params_ethtool.diag_general_enable) {
		int error = mlx5_core_get_diagnostics_full(mdev,
		    priv->params_ethtool.diag_pci_enable ? &priv->params_pci : NULL,
		    priv->params_ethtool.diag_general_enable ? &priv->params_general : NULL);
		if (error != 0)
			if_printf(priv->ifp, "Failed reading diagnostics: %d\n", error);
	}
}

static void
mlx5e_update_stats_work(struct work_struct *work)
{
	struct mlx5e_priv *priv;

	priv = container_of(work, struct mlx5e_priv, update_stats_work);
	PRIV_LOCK(priv);
	if (test_bit(MLX5E_STATE_OPENED, &priv->state) != 0)
		mlx5e_update_stats_locked(priv);
	PRIV_UNLOCK(priv);
}

static void
mlx5e_update_stats(void *arg)
{
	struct mlx5e_priv *priv = arg;

	queue_work(priv->wq, &priv->update_stats_work);

	callout_reset(&priv->watchdog, hz, &mlx5e_update_stats, priv);
}

static void
mlx5e_async_event_sub(struct mlx5e_priv *priv,
    enum mlx5_dev_event event)
{
	switch (event) {
	case MLX5_DEV_EVENT_PORT_UP:
	case MLX5_DEV_EVENT_PORT_DOWN:
		queue_work(priv->wq, &priv->update_carrier_work);
		break;

	default:
		break;
	}
}

static void
mlx5e_async_event(struct mlx5_core_dev *mdev, void *vpriv,
    enum mlx5_dev_event event, unsigned long param)
{
	struct mlx5e_priv *priv = vpriv;

	mtx_lock(&priv->async_events_mtx);
	if (test_bit(MLX5E_STATE_ASYNC_EVENTS_ENABLE, &priv->state))
		mlx5e_async_event_sub(priv, event);
	mtx_unlock(&priv->async_events_mtx);
}

static void
mlx5e_enable_async_events(struct mlx5e_priv *priv)
{
	set_bit(MLX5E_STATE_ASYNC_EVENTS_ENABLE, &priv->state);
}

static void
mlx5e_disable_async_events(struct mlx5e_priv *priv)
{
	mtx_lock(&priv->async_events_mtx);
	clear_bit(MLX5E_STATE_ASYNC_EVENTS_ENABLE, &priv->state);
	mtx_unlock(&priv->async_events_mtx);
}

static const char *mlx5e_rq_stats_desc[] = {
	MLX5E_RQ_STATS(MLX5E_STATS_DESC)
};

static int
mlx5e_create_rq(struct mlx5e_channel *c,
    struct mlx5e_rq_param *param,
    struct mlx5e_rq *rq)
{
	struct mlx5e_priv *priv = c->priv;
	struct mlx5_core_dev *mdev = priv->mdev;
	char buffer[16];
	void *rqc = param->rqc;
	void *rqc_wq = MLX5_ADDR_OF(rqc, rqc, wq);
	int wq_sz;
	int err;
	int i;
	u32 nsegs, wqe_sz;

	err = mlx5e_get_wqe_sz(priv, &wqe_sz, &nsegs);
	if (err != 0)
		goto done;

	/* Create DMA descriptor TAG */
	if ((err = -bus_dma_tag_create(
	    bus_get_dma_tag(mdev->pdev->dev.bsddev),
	    1,				/* any alignment */
	    0,				/* no boundary */
	    BUS_SPACE_MAXADDR,		/* lowaddr */
	    BUS_SPACE_MAXADDR,		/* highaddr */
	    NULL, NULL,			/* filter, filterarg */
	    nsegs * MLX5E_MAX_RX_BYTES,	/* maxsize */
	    nsegs,			/* nsegments */
	    nsegs * MLX5E_MAX_RX_BYTES,	/* maxsegsize */
	    0,				/* flags */
	    NULL, NULL,			/* lockfunc, lockfuncarg */
	    &rq->dma_tag)))
		goto done;

	err = mlx5_wq_ll_create(mdev, &param->wq, rqc_wq, &rq->wq,
	    &rq->wq_ctrl);
	if (err)
		goto err_free_dma_tag;

	rq->wq.db = &rq->wq.db[MLX5_RCV_DBR];
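	/*
	 * The doorbell record is shared between the receive and send
	 * sides; MLX5_RCV_DBR selects the receive half of the pair.
	 */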
	err = mlx5e_get_wqe_sz(priv, &rq->wqe_sz, &rq->nsegs);
	if (err != 0)
		goto err_rq_wq_destroy;

	wq_sz = mlx5_wq_ll_get_size(&rq->wq);

	err = -tcp_lro_init_args(&rq->lro, c->ifp, TCP_LRO_ENTRIES, wq_sz);
	if (err)
		goto err_rq_wq_destroy;

	rq->mbuf = malloc(wq_sz * sizeof(rq->mbuf[0]), M_MLX5EN, M_WAITOK | M_ZERO);
	for (i = 0; i != wq_sz; i++) {
		struct mlx5e_rx_wqe *wqe = mlx5_wq_ll_get_wqe(&rq->wq, i);
		int j;

		err = -bus_dmamap_create(rq->dma_tag, 0, &rq->mbuf[i].dma_map);
		if (err != 0) {
			while (i--)
				bus_dmamap_destroy(rq->dma_tag, rq->mbuf[i].dma_map);
			goto err_rq_mbuf_free;
		}

		/* set value for constant fields */
		for (j = 0; j < rq->nsegs; j++)
			wqe->data[j].lkey = c->mkey_be;
	}

	INIT_WORK(&rq->dim.work, mlx5e_dim_work);
	if (priv->params.rx_cq_moderation_mode < 2) {
		rq->dim.mode = NET_DIM_CQ_PERIOD_MODE_DISABLED;
	} else {
		void *cqc = container_of(param,
		    struct mlx5e_channel_param, rq)->rx_cq.cqc;

		switch (MLX5_GET(cqc, cqc, cq_period_mode)) {
		case MLX5_CQ_PERIOD_MODE_START_FROM_EQE:
			rq->dim.mode = NET_DIM_CQ_PERIOD_MODE_START_FROM_EQE;
			break;
		case MLX5_CQ_PERIOD_MODE_START_FROM_CQE:
			rq->dim.mode = NET_DIM_CQ_PERIOD_MODE_START_FROM_CQE;
			break;
		default:
			rq->dim.mode = NET_DIM_CQ_PERIOD_MODE_DISABLED;
			break;
		}
	}

	rq->ifp = c->ifp;
	rq->channel = c;
	rq->ix = c->ix;

	snprintf(buffer, sizeof(buffer), "rxstat%d", c->ix);
	mlx5e_create_stats(&rq->stats.ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet),
	    buffer, mlx5e_rq_stats_desc, MLX5E_RQ_STATS_NUM,
	    rq->stats.arg);
	return (0);

err_rq_mbuf_free:
	free(rq->mbuf, M_MLX5EN);
	tcp_lro_free(&rq->lro);
err_rq_wq_destroy:
	mlx5_wq_destroy(&rq->wq_ctrl);
err_free_dma_tag:
	bus_dma_tag_destroy(rq->dma_tag);
done:
	return (err);
}

static void
mlx5e_destroy_rq(struct mlx5e_rq *rq)
{
	int wq_sz;
	int i;

	/* destroy all sysctl nodes */
	sysctl_ctx_free(&rq->stats.ctx);

	/* free leftover LRO packets, if any */
	tcp_lro_free(&rq->lro);

	wq_sz = mlx5_wq_ll_get_size(&rq->wq);
	for (i = 0; i != wq_sz; i++) {
		if (rq->mbuf[i].mbuf != NULL) {
			bus_dmamap_unload(rq->dma_tag, rq->mbuf[i].dma_map);
			m_freem(rq->mbuf[i].mbuf);
		}
		bus_dmamap_destroy(rq->dma_tag, rq->mbuf[i].dma_map);
	}
	free(rq->mbuf, M_MLX5EN);
	mlx5_wq_destroy(&rq->wq_ctrl);
	bus_dma_tag_destroy(rq->dma_tag);
}

static int
mlx5e_enable_rq(struct mlx5e_rq *rq, struct mlx5e_rq_param *param)
{
	struct mlx5e_channel *c = rq->channel;
	struct mlx5e_priv *priv = c->priv;
	struct mlx5_core_dev *mdev = priv->mdev;

	void *in;
	void *rqc;
	void *wq;
	int inlen;
	int err;

	inlen = MLX5_ST_SZ_BYTES(create_rq_in) +
	    sizeof(u64) * rq->wq_ctrl.buf.npages;
	in = mlx5_vzalloc(inlen);
	if (in == NULL)
		return (-ENOMEM);

	rqc = MLX5_ADDR_OF(create_rq_in, in, ctx);
	wq = MLX5_ADDR_OF(rqc, rqc, wq);

	memcpy(rqc, param->rqc, sizeof(param->rqc));

	MLX5_SET(rqc, rqc, cqn, c->rq.cq.mcq.cqn);
	MLX5_SET(rqc, rqc, state, MLX5_RQC_STATE_RST);
	MLX5_SET(rqc, rqc, flush_in_error_en, 1);
	if (priv->counter_set_id >= 0)
		MLX5_SET(rqc, rqc, counter_set_id, priv->counter_set_id);
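	/*
	 * Hand the WQ buffer to firmware: the page shift is encoded
	 * relative to the base PAGE_SHIFT, and the PAS array below is
	 * filled with the physical addresses of the WQ buffer pages.
	 */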
	MLX5_SET(wq, wq, log_wq_pg_sz, rq->wq_ctrl.buf.page_shift -
	    PAGE_SHIFT);
	MLX5_SET64(wq, wq, dbr_addr, rq->wq_ctrl.db.dma);

	mlx5_fill_page_array(&rq->wq_ctrl.buf,
	    (__be64 *) MLX5_ADDR_OF(wq, wq, pas));

	err = mlx5_core_create_rq(mdev, in, inlen, &rq->rqn);

	kvfree(in);

	return (err);
}

static int
mlx5e_modify_rq(struct mlx5e_rq *rq, int curr_state, int next_state)
{
	struct mlx5e_channel *c = rq->channel;
	struct mlx5e_priv *priv = c->priv;
	struct mlx5_core_dev *mdev = priv->mdev;

	void *in;
	void *rqc;
	int inlen;
	int err;

	inlen = MLX5_ST_SZ_BYTES(modify_rq_in);
	in = mlx5_vzalloc(inlen);
	if (in == NULL)
		return (-ENOMEM);

	rqc = MLX5_ADDR_OF(modify_rq_in, in, ctx);

	MLX5_SET(modify_rq_in, in, rqn, rq->rqn);
	MLX5_SET(modify_rq_in, in, rq_state, curr_state);
	MLX5_SET(rqc, rqc, state, next_state);

	err = mlx5_core_modify_rq(mdev, in, inlen);

	kvfree(in);

	return (err);
}

static void
mlx5e_disable_rq(struct mlx5e_rq *rq)
{
	struct mlx5e_channel *c = rq->channel;
	struct mlx5e_priv *priv = c->priv;
	struct mlx5_core_dev *mdev = priv->mdev;

	mlx5_core_destroy_rq(mdev, rq->rqn);
}

static int
mlx5e_wait_for_min_rx_wqes(struct mlx5e_rq *rq)
{
	struct mlx5e_channel *c = rq->channel;
	struct mlx5e_priv *priv = c->priv;
	struct mlx5_wq_ll *wq = &rq->wq;
	int i;

	for (i = 0; i < 1000; i++) {
		if (wq->cur_sz >= priv->params.min_rx_wqes)
			return (0);

		msleep(4);
	}
	return (-ETIMEDOUT);
}

static int
mlx5e_open_rq(struct mlx5e_channel *c,
    struct mlx5e_rq_param *param,
    struct mlx5e_rq *rq)
{
	int err;

	err = mlx5e_create_rq(c, param, rq);
	if (err)
		return (err);

	err = mlx5e_enable_rq(rq, param);
	if (err)
		goto err_destroy_rq;

	err = mlx5e_modify_rq(rq, MLX5_RQC_STATE_RST, MLX5_RQC_STATE_RDY);
	if (err)
		goto err_disable_rq;

	c->rq.enabled = 1;

	return (0);

err_disable_rq:
	mlx5e_disable_rq(rq);
err_destroy_rq:
	mlx5e_destroy_rq(rq);

	return (err);
}

static void
mlx5e_close_rq(struct mlx5e_rq *rq)
{
	mtx_lock(&rq->mtx);
	rq->enabled = 0;
	callout_stop(&rq->watchdog);
	mtx_unlock(&rq->mtx);

	callout_drain(&rq->watchdog);

	mlx5e_modify_rq(rq, MLX5_RQC_STATE_RDY, MLX5_RQC_STATE_ERR);
}

static void
mlx5e_close_rq_wait(struct mlx5e_rq *rq)
{

	mlx5e_disable_rq(rq);
	mlx5e_close_cq(&rq->cq);
	cancel_work_sync(&rq->dim.work);
	mlx5e_destroy_rq(rq);
}

void
mlx5e_free_sq_db(struct mlx5e_sq *sq)
{
	int wq_sz = mlx5_wq_cyc_get_size(&sq->wq);
	int x;

	for (x = 0; x != wq_sz; x++) {
		if (sq->mbuf[x].mbuf != NULL) {
			bus_dmamap_unload(sq->dma_tag, sq->mbuf[x].dma_map);
			m_freem(sq->mbuf[x].mbuf);
		}
		bus_dmamap_destroy(sq->dma_tag, sq->mbuf[x].dma_map);
	}
	free(sq->mbuf, M_MLX5EN);
}

int
mlx5e_alloc_sq_db(struct mlx5e_sq *sq)
{
	int wq_sz = mlx5_wq_cyc_get_size(&sq->wq);
	int err;
	int x;

	sq->mbuf = malloc(wq_sz * sizeof(sq->mbuf[0]), M_MLX5EN, M_WAITOK | M_ZERO);

	/* Create DMA descriptor MAPs */
	for (x = 0; x != wq_sz; x++) {
		err = -bus_dmamap_create(sq->dma_tag, 0,
		    &sq->mbuf[x].dma_map);
		if (err != 0) {
			while (x--)
				bus_dmamap_destroy(sq->dma_tag, sq->mbuf[x].dma_map);
			free(sq->mbuf, M_MLX5EN);
			return (err);
		}
	}
	return (0);
}

static const char *mlx5e_sq_stats_desc[] = {
	MLX5E_SQ_STATS(MLX5E_STATS_DESC)
};

void
mlx5e_update_sq_inline(struct mlx5e_sq *sq)
{
	sq->max_inline = sq->priv->params.tx_max_inline;
	sq->min_inline_mode = sq->priv->params.tx_min_inline_mode;

	/*
	 * Check if trust state is DSCP or if inline mode is NONE which
	 * indicates CX-5 or newer hardware.
	 */
	if (sq->priv->params_ethtool.trust_state != MLX5_QPTS_TRUST_PCP ||
	    sq->min_inline_mode == MLX5_INLINE_MODE_NONE) {
		if (MLX5_CAP_ETH(sq->priv->mdev, wqe_vlan_insert))
			sq->min_insert_caps = MLX5E_INSERT_VLAN | MLX5E_INSERT_NON_VLAN;
		else
			sq->min_insert_caps = MLX5E_INSERT_NON_VLAN;
	} else {
		sq->min_insert_caps = 0;
	}
}

static void
mlx5e_refresh_sq_inline_sub(struct mlx5e_priv *priv, struct mlx5e_channel *c)
{
	int i;

	for (i = 0; i != c->num_tc; i++) {
		mtx_lock(&c->sq[i].lock);
		mlx5e_update_sq_inline(&c->sq[i]);
		mtx_unlock(&c->sq[i].lock);
	}
}

void
mlx5e_refresh_sq_inline(struct mlx5e_priv *priv)
{
	int i;

	/* check if channels are closed */
	if (test_bit(MLX5E_STATE_OPENED, &priv->state) == 0)
		return;

	for (i = 0; i < priv->params.num_channels; i++)
		mlx5e_refresh_sq_inline_sub(priv, &priv->channel[i]);
}

static int
mlx5e_create_sq(struct mlx5e_channel *c,
    int tc,
    struct mlx5e_sq_param *param,
    struct mlx5e_sq *sq)
{
	struct mlx5e_priv *priv = c->priv;
	struct mlx5_core_dev *mdev = priv->mdev;
	char buffer[16];
	void *sqc = param->sqc;
	void *sqc_wq = MLX5_ADDR_OF(sqc, sqc, wq);
	int err;

	/* Create DMA descriptor TAG */
	if ((err = -bus_dma_tag_create(
	    bus_get_dma_tag(mdev->pdev->dev.bsddev),
	    1,				/* any alignment */
	    0,				/* no boundary */
	    BUS_SPACE_MAXADDR,		/* lowaddr */
	    BUS_SPACE_MAXADDR,		/* highaddr */
	    NULL, NULL,			/* filter, filterarg */
	    MLX5E_MAX_TX_PAYLOAD_SIZE,	/* maxsize */
	    MLX5E_MAX_TX_MBUF_FRAGS,	/* nsegments */
	    MLX5E_MAX_TX_MBUF_SIZE,	/* maxsegsize */
	    0,				/* flags */
	    NULL, NULL,			/* lockfunc, lockfuncarg */
	    &sq->dma_tag)))
		goto done;

	err = mlx5_alloc_map_uar(mdev, &sq->uar);
	if (err)
		goto err_free_dma_tag;

	err = mlx5_wq_cyc_create(mdev, &param->wq, sqc_wq, &sq->wq,
	    &sq->wq_ctrl);
	if (err)
		goto err_unmap_free_uar;

	sq->wq.db = &sq->wq.db[MLX5_SND_DBR];
	sq->bf_buf_size = (1 << MLX5_CAP_GEN(mdev, log_bf_reg_size)) / 2;

	err = mlx5e_alloc_sq_db(sq);
	if (err)
		goto err_sq_wq_destroy;

	sq->mkey_be = c->mkey_be;
	sq->ifp = priv->ifp;
	sq->priv = priv;
	sq->tc = tc;

	mlx5e_update_sq_inline(sq);

	snprintf(buffer, sizeof(buffer), "txstat%dtc%d", c->ix, tc);
	mlx5e_create_stats(&sq->stats.ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet),
	    buffer, mlx5e_sq_stats_desc, MLX5E_SQ_STATS_NUM,
	    sq->stats.arg);

	return (0);

err_sq_wq_destroy:
	mlx5_wq_destroy(&sq->wq_ctrl);

err_unmap_free_uar:
	mlx5_unmap_free_uar(mdev, &sq->uar);

err_free_dma_tag:
	bus_dma_tag_destroy(sq->dma_tag);
done:
	return (err);
}
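/*
 * SQ lifecycle overview: mlx5e_create_sq() allocates the software
 * resources, mlx5e_enable_sq() creates the firmware object in the
 * RST state and mlx5e_modify_sq() moves it RST -> RDY; teardown runs
 * the same steps in reverse via drain/disable/destroy below.
 */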
static void
mlx5e_destroy_sq(struct mlx5e_sq *sq)
{
	/* destroy all sysctl nodes */
	sysctl_ctx_free(&sq->stats.ctx);

	mlx5e_free_sq_db(sq);
	mlx5_wq_destroy(&sq->wq_ctrl);
	mlx5_unmap_free_uar(sq->priv->mdev, &sq->uar);
	bus_dma_tag_destroy(sq->dma_tag);
}

int
mlx5e_enable_sq(struct mlx5e_sq *sq, struct mlx5e_sq_param *param,
    int tis_num)
{
	void *in;
	void *sqc;
	void *wq;
	int inlen;
	int err;

	inlen = MLX5_ST_SZ_BYTES(create_sq_in) +
	    sizeof(u64) * sq->wq_ctrl.buf.npages;
	in = mlx5_vzalloc(inlen);
	if (in == NULL)
		return (-ENOMEM);

	sqc = MLX5_ADDR_OF(create_sq_in, in, ctx);
	wq = MLX5_ADDR_OF(sqc, sqc, wq);

	memcpy(sqc, param->sqc, sizeof(param->sqc));

	MLX5_SET(sqc, sqc, tis_num_0, tis_num);
	MLX5_SET(sqc, sqc, cqn, sq->cq.mcq.cqn);
	MLX5_SET(sqc, sqc, state, MLX5_SQC_STATE_RST);
	MLX5_SET(sqc, sqc, tis_lst_sz, 1);
	MLX5_SET(sqc, sqc, flush_in_error_en, 1);

	MLX5_SET(wq, wq, wq_type, MLX5_WQ_TYPE_CYCLIC);
	MLX5_SET(wq, wq, uar_page, sq->uar.index);
	MLX5_SET(wq, wq, log_wq_pg_sz, sq->wq_ctrl.buf.page_shift -
	    PAGE_SHIFT);
	MLX5_SET64(wq, wq, dbr_addr, sq->wq_ctrl.db.dma);

	mlx5_fill_page_array(&sq->wq_ctrl.buf,
	    (__be64 *) MLX5_ADDR_OF(wq, wq, pas));

	err = mlx5_core_create_sq(sq->priv->mdev, in, inlen, &sq->sqn);

	kvfree(in);

	return (err);
}

int
mlx5e_modify_sq(struct mlx5e_sq *sq, int curr_state, int next_state)
{
	void *in;
	void *sqc;
	int inlen;
	int err;

	inlen = MLX5_ST_SZ_BYTES(modify_sq_in);
	in = mlx5_vzalloc(inlen);
	if (in == NULL)
		return (-ENOMEM);

	sqc = MLX5_ADDR_OF(modify_sq_in, in, ctx);

	MLX5_SET(modify_sq_in, in, sqn, sq->sqn);
	MLX5_SET(modify_sq_in, in, sq_state, curr_state);
	MLX5_SET(sqc, sqc, state, next_state);

	err = mlx5_core_modify_sq(sq->priv->mdev, in, inlen);

	kvfree(in);

	return (err);
}

void
mlx5e_disable_sq(struct mlx5e_sq *sq)
{

	mlx5_core_destroy_sq(sq->priv->mdev, sq->sqn);
}

static int
mlx5e_open_sq(struct mlx5e_channel *c,
    int tc,
    struct mlx5e_sq_param *param,
    struct mlx5e_sq *sq)
{
	int err;

	err = mlx5e_create_sq(c, tc, param, sq);
	if (err)
		return (err);

	err = mlx5e_enable_sq(sq, param, c->priv->tisn[tc]);
	if (err)
		goto err_destroy_sq;

	err = mlx5e_modify_sq(sq, MLX5_SQC_STATE_RST, MLX5_SQC_STATE_RDY);
	if (err)
		goto err_disable_sq;

	WRITE_ONCE(sq->running, 1);

	return (0);

err_disable_sq:
	mlx5e_disable_sq(sq);
err_destroy_sq:
	mlx5e_destroy_sq(sq);

	return (err);
}

static void
mlx5e_sq_send_nops_locked(struct mlx5e_sq *sq, int can_sleep)
{
	/* fill up remainder with NOPs */
	while (sq->cev_counter != 0) {
		while (!mlx5e_sq_has_room_for(sq, 1)) {
			if (can_sleep != 0) {
				mtx_unlock(&sq->lock);
				msleep(4);
				mtx_lock(&sq->lock);
			} else {
				goto done;
			}
		}
		/* send a single NOP */
		mlx5e_send_nop(sq, 1);
		atomic_thread_fence_rel();
	}
done:
	/* Check if we need to write the doorbell */
	if (likely(sq->doorbell.d64 != 0)) {
		mlx5e_tx_notify_hw(sq, sq->doorbell.d32, 0);
		sq->doorbell.d64 = 0;
	}
}
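/*
 * Completion-event moderation: regular WQEs only request a hardware
 * completion every "cev_factor" sends. The NOPs generated above and
 * by the timeout below pad the ring so a final completion event is
 * raised even when fewer than cev_factor packets were queued.
 */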
void
mlx5e_sq_cev_timeout(void *arg)
{
	struct mlx5e_sq *sq = arg;

	mtx_assert(&sq->lock, MA_OWNED);

	/* check next state */
	switch (sq->cev_next_state) {
	case MLX5E_CEV_STATE_SEND_NOPS:
		/* fill TX ring with NOPs, if any */
		mlx5e_sq_send_nops_locked(sq, 0);

		/* check if completed */
		if (sq->cev_counter == 0) {
			sq->cev_next_state = MLX5E_CEV_STATE_INITIAL;
			return;
		}
		break;
	default:
		/* send NOPs on next timeout */
		sq->cev_next_state = MLX5E_CEV_STATE_SEND_NOPS;
		break;
	}

	/* restart timer */
	callout_reset_curcpu(&sq->cev_callout, hz, mlx5e_sq_cev_timeout, sq);
}

void
mlx5e_drain_sq(struct mlx5e_sq *sq)
{
	int error;
	struct mlx5_core_dev *mdev = sq->priv->mdev;

	/*
	 * Check if already stopped.
	 *
	 * NOTE: Serialization of this function is managed by the
	 * caller ensuring the priv's state lock is locked or in case
	 * of rate limit support, a single thread manages drain and
	 * resume of SQs. The "running" variable can therefore safely
	 * be read without any locks.
	 */
	if (READ_ONCE(sq->running) == 0)
		return;

	/* don't put more packets into the SQ */
	WRITE_ONCE(sq->running, 0);

	/* serialize access to DMA rings */
	mtx_lock(&sq->lock);

	/* teardown event factor timer, if any */
	sq->cev_next_state = MLX5E_CEV_STATE_HOLD_NOPS;
	callout_stop(&sq->cev_callout);

	/* send dummy NOPs in order to flush the transmit ring */
	mlx5e_sq_send_nops_locked(sq, 1);
	mtx_unlock(&sq->lock);

	/* make sure it is safe to free the callout */
	callout_drain(&sq->cev_callout);

	/* wait till SQ is empty or link is down */
	mtx_lock(&sq->lock);
	while (sq->cc != sq->pc &&
	    (sq->priv->media_status_last & IFM_ACTIVE) != 0 &&
	    mdev->state != MLX5_DEVICE_STATE_INTERNAL_ERROR) {
		mtx_unlock(&sq->lock);
		msleep(1);
		sq->cq.mcq.comp(&sq->cq.mcq);
		mtx_lock(&sq->lock);
	}
	mtx_unlock(&sq->lock);

	/* error out remaining requests */
	error = mlx5e_modify_sq(sq, MLX5_SQC_STATE_RDY, MLX5_SQC_STATE_ERR);
	if (error != 0) {
		if_printf(sq->ifp,
		    "mlx5e_modify_sq() from RDY to ERR failed: %d\n", error);
	}

	/* wait till SQ is empty */
	mtx_lock(&sq->lock);
	while (sq->cc != sq->pc &&
	    mdev->state != MLX5_DEVICE_STATE_INTERNAL_ERROR) {
		mtx_unlock(&sq->lock);
		msleep(1);
		sq->cq.mcq.comp(&sq->cq.mcq);
		mtx_lock(&sq->lock);
	}
	mtx_unlock(&sq->lock);
}

static void
mlx5e_close_sq_wait(struct mlx5e_sq *sq)
{

	mlx5e_drain_sq(sq);
	mlx5e_disable_sq(sq);
	mlx5e_destroy_sq(sq);
}

static int
mlx5e_create_cq(struct mlx5e_priv *priv,
    struct mlx5e_cq_param *param,
    struct mlx5e_cq *cq,
    mlx5e_cq_comp_t *comp,
    int eq_ix)
{
	struct mlx5_core_dev *mdev = priv->mdev;
	struct mlx5_core_cq *mcq = &cq->mcq;
	int eqn_not_used;
	int irqn;
	int err;
	u32 i;

	param->wq.buf_numa_node = 0;
	param->wq.db_numa_node = 0;

	err = mlx5_vector2eqn(mdev, eq_ix, &eqn_not_used, &irqn);
	if (err)
		return (err);

	err = mlx5_cqwq_create(mdev, &param->wq, param->cqc, &cq->wq,
	    &cq->wq_ctrl);
	if (err)
		return (err);

	mcq->cqe_sz = 64;
	mcq->set_ci_db = cq->wq_ctrl.db.db;
	mcq->arm_db = cq->wq_ctrl.db.db + 1;
	*mcq->set_ci_db = 0;
	*mcq->arm_db = 0;
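	/*
	 * The CQ doorbell record is a pair of dwords: the first holds
	 * the consumer index, the second the arm command sequence.
	 */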
	mcq->vector = eq_ix;
	mcq->comp = comp;
	mcq->event = mlx5e_cq_error_event;
	mcq->irqn = irqn;
	mcq->uar = &priv->cq_uar;

	for (i = 0; i < mlx5_cqwq_get_size(&cq->wq); i++) {
		struct mlx5_cqe64 *cqe = mlx5_cqwq_get_wqe(&cq->wq, i);

		cqe->op_own = 0xf1;
	}

	cq->priv = priv;

	return (0);
}

static void
mlx5e_destroy_cq(struct mlx5e_cq *cq)
{
	mlx5_wq_destroy(&cq->wq_ctrl);
}

static int
mlx5e_enable_cq(struct mlx5e_cq *cq, struct mlx5e_cq_param *param, int eq_ix)
{
	struct mlx5_core_cq *mcq = &cq->mcq;
	void *in;
	void *cqc;
	int inlen;
	int irqn_not_used;
	int eqn;
	int err;

	inlen = MLX5_ST_SZ_BYTES(create_cq_in) +
	    sizeof(u64) * cq->wq_ctrl.buf.npages;
	in = mlx5_vzalloc(inlen);
	if (in == NULL)
		return (-ENOMEM);

	cqc = MLX5_ADDR_OF(create_cq_in, in, cq_context);

	memcpy(cqc, param->cqc, sizeof(param->cqc));

	mlx5_fill_page_array(&cq->wq_ctrl.buf,
	    (__be64 *) MLX5_ADDR_OF(create_cq_in, in, pas));

	mlx5_vector2eqn(cq->priv->mdev, eq_ix, &eqn, &irqn_not_used);

	MLX5_SET(cqc, cqc, c_eqn, eqn);
	MLX5_SET(cqc, cqc, uar_page, mcq->uar->index);
	MLX5_SET(cqc, cqc, log_page_size, cq->wq_ctrl.buf.page_shift -
	    PAGE_SHIFT);
	MLX5_SET64(cqc, cqc, dbr_addr, cq->wq_ctrl.db.dma);

	err = mlx5_core_create_cq(cq->priv->mdev, mcq, in, inlen);

	kvfree(in);

	if (err)
		return (err);

	mlx5e_cq_arm(cq, MLX5_GET_DOORBELL_LOCK(&cq->priv->doorbell_lock));

	return (0);
}

static void
mlx5e_disable_cq(struct mlx5e_cq *cq)
{

	mlx5_core_destroy_cq(cq->priv->mdev, &cq->mcq);
}

int
mlx5e_open_cq(struct mlx5e_priv *priv,
    struct mlx5e_cq_param *param,
    struct mlx5e_cq *cq,
    mlx5e_cq_comp_t *comp,
    int eq_ix)
{
	int err;

	err = mlx5e_create_cq(priv, param, cq, comp, eq_ix);
	if (err)
		return (err);

	err = mlx5e_enable_cq(cq, param, eq_ix);
	if (err)
		goto err_destroy_cq;

	return (0);

err_destroy_cq:
	mlx5e_destroy_cq(cq);

	return (err);
}

void
mlx5e_close_cq(struct mlx5e_cq *cq)
{
	mlx5e_disable_cq(cq);
	mlx5e_destroy_cq(cq);
}

static int
mlx5e_open_tx_cqs(struct mlx5e_channel *c,
    struct mlx5e_channel_param *cparam)
{
	int err;
	int tc;

	for (tc = 0; tc < c->num_tc; tc++) {
		/* open completion queue */
		err = mlx5e_open_cq(c->priv, &cparam->tx_cq, &c->sq[tc].cq,
		    &mlx5e_tx_cq_comp, c->ix);
		if (err)
			goto err_close_tx_cqs;
	}
	return (0);

err_close_tx_cqs:
	for (tc--; tc >= 0; tc--)
		mlx5e_close_cq(&c->sq[tc].cq);

	return (err);
}

static void
mlx5e_close_tx_cqs(struct mlx5e_channel *c)
{
	int tc;

	for (tc = 0; tc < c->num_tc; tc++)
		mlx5e_close_cq(&c->sq[tc].cq);
}

static int
mlx5e_open_sqs(struct mlx5e_channel *c,
    struct mlx5e_channel_param *cparam)
{
	int err;
	int tc;

	for (tc = 0; tc < c->num_tc; tc++) {
		err = mlx5e_open_sq(c, tc, &cparam->sq, &c->sq[tc]);
		if (err)
			goto err_close_sqs;
	}

	return (0);

err_close_sqs:
	for (tc--; tc >= 0; tc--)
		mlx5e_close_sq_wait(&c->sq[tc]);

	return (err);
}
static void
mlx5e_close_sqs_wait(struct mlx5e_channel *c)
{
	int tc;

	for (tc = 0; tc < c->num_tc; tc++)
		mlx5e_close_sq_wait(&c->sq[tc]);
}

static void
mlx5e_chan_mtx_init(struct mlx5e_channel *c)
{
	int tc;

	mtx_init(&c->rq.mtx, "mlx5rx", MTX_NETWORK_LOCK, MTX_DEF);

	callout_init_mtx(&c->rq.watchdog, &c->rq.mtx, 0);

	for (tc = 0; tc < c->num_tc; tc++) {
		struct mlx5e_sq *sq = c->sq + tc;

		mtx_init(&sq->lock, "mlx5tx",
		    MTX_NETWORK_LOCK " TX", MTX_DEF);
		mtx_init(&sq->comp_lock, "mlx5comp",
		    MTX_NETWORK_LOCK " TX", MTX_DEF);

		callout_init_mtx(&sq->cev_callout, &sq->lock, 0);

		sq->cev_factor = c->priv->params_ethtool.tx_completion_fact;

		/* ensure the TX completion event factor is not zero */
		if (sq->cev_factor == 0)
			sq->cev_factor = 1;
	}
}

static void
mlx5e_chan_mtx_destroy(struct mlx5e_channel *c)
{
	int tc;

	mtx_destroy(&c->rq.mtx);

	for (tc = 0; tc < c->num_tc; tc++) {
		mtx_destroy(&c->sq[tc].lock);
		mtx_destroy(&c->sq[tc].comp_lock);
	}
}

static int
mlx5e_open_channel(struct mlx5e_priv *priv, int ix,
    struct mlx5e_channel_param *cparam,
    struct mlx5e_channel *c)
{
	int err;

	memset(c, 0, sizeof(*c));

	c->priv = priv;
	c->ix = ix;
	c->ifp = priv->ifp;
	c->mkey_be = cpu_to_be32(priv->mr.key);
	c->num_tc = priv->num_tc;

	/* init mutexes */
	mlx5e_chan_mtx_init(c);

	/* open transmit completion queue */
	err = mlx5e_open_tx_cqs(c, cparam);
	if (err)
		goto err_free;

	/* open receive completion queue */
	err = mlx5e_open_cq(c->priv, &cparam->rx_cq, &c->rq.cq,
	    &mlx5e_rx_cq_comp, c->ix);
	if (err)
		goto err_close_tx_cqs;

	err = mlx5e_open_sqs(c, cparam);
	if (err)
		goto err_close_rx_cq;

	err = mlx5e_open_rq(c, &cparam->rq, &c->rq);
	if (err)
		goto err_close_sqs;

	/* poll receive queue initially */
	c->rq.cq.mcq.comp(&c->rq.cq.mcq);

	return (0);

err_close_sqs:
	mlx5e_close_sqs_wait(c);

err_close_rx_cq:
	mlx5e_close_cq(&c->rq.cq);

err_close_tx_cqs:
	mlx5e_close_tx_cqs(c);

err_free:
	/* destroy mutexes */
	mlx5e_chan_mtx_destroy(c);
	return (err);
}

static void
mlx5e_close_channel(struct mlx5e_channel *c)
{
	mlx5e_close_rq(&c->rq);
}

static void
mlx5e_close_channel_wait(struct mlx5e_channel *c)
{
	mlx5e_close_rq_wait(&c->rq);
	mlx5e_close_sqs_wait(c);
	mlx5e_close_tx_cqs(c);
	/* destroy mutexes */
	mlx5e_chan_mtx_destroy(c);
}

static int
mlx5e_get_wqe_sz(struct mlx5e_priv *priv, u32 *wqe_sz, u32 *nsegs)
{
	u32 r, n;

	r = priv->params.hw_lro_en ? priv->params.lro_wqe_sz :
	    MLX5E_SW2MB_MTU(priv->ifp->if_mtu);
	if (r > MJUM16BYTES)
		return (-ENOMEM);

	if (r > MJUM9BYTES)
		r = MJUM16BYTES;
	else if (r > MJUMPAGESIZE)
		r = MJUM9BYTES;
	else if (r > MCLBYTES)
		r = MJUMPAGESIZE;
	else
		r = MCLBYTES;

	/*
	 * n + 1 must be a power of two, because stride size must be.
	 * Stride size is 16 * (n + 1), as the first segment is
	 * control.
	 */
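	/*
	 * Example: if howmany(r, MLX5E_MAX_RX_BYTES) yields 5, the
	 * loop below advances n to 7 so that n + 1 = 8 is a power of
	 * two, giving a 16 * 8 = 128 byte stride (one control segment
	 * plus seven data segments).
	 */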
2128 */ 2129 for (n = howmany(r, MLX5E_MAX_RX_BYTES); !powerof2(n + 1); n++) 2130 ; 2131 2132 if (n > MLX5E_MAX_BUSDMA_RX_SEGS) 2133 return (-ENOMEM); 2134 2135 *wqe_sz = r; 2136 *nsegs = n; 2137 return (0); 2138} 2139 2140static void 2141mlx5e_build_rq_param(struct mlx5e_priv *priv, 2142 struct mlx5e_rq_param *param) 2143{ 2144 void *rqc = param->rqc; 2145 void *wq = MLX5_ADDR_OF(rqc, rqc, wq); 2146 u32 wqe_sz, nsegs; 2147 2148 mlx5e_get_wqe_sz(priv, &wqe_sz, &nsegs); 2149 MLX5_SET(wq, wq, wq_type, MLX5_WQ_TYPE_LINKED_LIST); 2150 MLX5_SET(wq, wq, end_padding_mode, MLX5_WQ_END_PAD_MODE_ALIGN); 2151 MLX5_SET(wq, wq, log_wq_stride, ilog2(sizeof(struct mlx5e_rx_wqe) + 2152 nsegs * sizeof(struct mlx5_wqe_data_seg))); 2153 MLX5_SET(wq, wq, log_wq_sz, priv->params.log_rq_size); 2154 MLX5_SET(wq, wq, pd, priv->pdn); 2155 2156 param->wq.buf_numa_node = 0; 2157 param->wq.db_numa_node = 0; 2158 param->wq.linear = 1; 2159} 2160 2161static void 2162mlx5e_build_sq_param(struct mlx5e_priv *priv, 2163 struct mlx5e_sq_param *param) 2164{ 2165 void *sqc = param->sqc; 2166 void *wq = MLX5_ADDR_OF(sqc, sqc, wq); 2167 2168 MLX5_SET(wq, wq, log_wq_sz, priv->params.log_sq_size); 2169 MLX5_SET(wq, wq, log_wq_stride, ilog2(MLX5_SEND_WQE_BB)); 2170 MLX5_SET(wq, wq, pd, priv->pdn); 2171 2172 param->wq.buf_numa_node = 0; 2173 param->wq.db_numa_node = 0; 2174 param->wq.linear = 1; 2175} 2176 2177static void 2178mlx5e_build_common_cq_param(struct mlx5e_priv *priv, 2179 struct mlx5e_cq_param *param) 2180{ 2181 void *cqc = param->cqc; 2182 2183 MLX5_SET(cqc, cqc, uar_page, priv->cq_uar.index); 2184} 2185 2186static void 2187mlx5e_get_default_profile(struct mlx5e_priv *priv, int mode, struct net_dim_cq_moder *ptr) 2188{ 2189 2190 *ptr = net_dim_get_profile(mode, MLX5E_DIM_DEFAULT_PROFILE); 2191 2192 /* apply LRO restrictions */ 2193 if (priv->params.hw_lro_en && 2194 ptr->pkts > MLX5E_DIM_MAX_RX_CQ_MODERATION_PKTS_WITH_LRO) { 2195 ptr->pkts = MLX5E_DIM_MAX_RX_CQ_MODERATION_PKTS_WITH_LRO; 2196 } 2197} 2198 2199static void 2200mlx5e_build_rx_cq_param(struct mlx5e_priv *priv, 2201 struct mlx5e_cq_param *param) 2202{ 2203 struct net_dim_cq_moder curr; 2204 void *cqc = param->cqc; 2205 2206 /* 2207 * We use MLX5_CQE_FORMAT_HASH because the RX hash mini CQE 2208 * format is more beneficial for FreeBSD use case. 2209 * 2210 * Adding support for MLX5_CQE_FORMAT_CSUM will require changes 2211 * in mlx5e_decompress_cqe. 
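 *
 * (Editorial note: with compression enabled, each mini CQE in the
 * HASH format carries the RSS hash result of its packet, which the
 * RX path consumes directly; the CSUM format would carry a checksum
 * result instead.)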
2212 */ 2213 if (priv->params.cqe_zipping_en) { 2214 MLX5_SET(cqc, cqc, mini_cqe_res_format, MLX5_CQE_FORMAT_HASH); 2215 MLX5_SET(cqc, cqc, cqe_compression_en, 1); 2216 } 2217 2218 MLX5_SET(cqc, cqc, log_cq_size, priv->params.log_rq_size); 2219 2220 switch (priv->params.rx_cq_moderation_mode) { 2221 case 0: 2222 MLX5_SET(cqc, cqc, cq_period, priv->params.rx_cq_moderation_usec); 2223 MLX5_SET(cqc, cqc, cq_max_count, priv->params.rx_cq_moderation_pkts); 2224 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_EQE); 2225 break; 2226 case 1: 2227 MLX5_SET(cqc, cqc, cq_period, priv->params.rx_cq_moderation_usec); 2228 MLX5_SET(cqc, cqc, cq_max_count, priv->params.rx_cq_moderation_pkts); 2229 if (MLX5_CAP_GEN(priv->mdev, cq_period_start_from_cqe)) 2230 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_CQE); 2231 else 2232 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_EQE); 2233 break; 2234 case 2: 2235 mlx5e_get_default_profile(priv, NET_DIM_CQ_PERIOD_MODE_START_FROM_EQE, &curr); 2236 MLX5_SET(cqc, cqc, cq_period, curr.usec); 2237 MLX5_SET(cqc, cqc, cq_max_count, curr.pkts); 2238 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_EQE); 2239 break; 2240 case 3: 2241 mlx5e_get_default_profile(priv, NET_DIM_CQ_PERIOD_MODE_START_FROM_CQE, &curr); 2242 MLX5_SET(cqc, cqc, cq_period, curr.usec); 2243 MLX5_SET(cqc, cqc, cq_max_count, curr.pkts); 2244 if (MLX5_CAP_GEN(priv->mdev, cq_period_start_from_cqe)) 2245 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_CQE); 2246 else 2247 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_EQE); 2248 break; 2249 default: 2250 break; 2251 } 2252 2253 mlx5e_dim_build_cq_param(priv, param); 2254 2255 mlx5e_build_common_cq_param(priv, param); 2256} 2257 2258static void 2259mlx5e_build_tx_cq_param(struct mlx5e_priv *priv, 2260 struct mlx5e_cq_param *param) 2261{ 2262 void *cqc = param->cqc; 2263 2264 MLX5_SET(cqc, cqc, log_cq_size, priv->params.log_sq_size); 2265 MLX5_SET(cqc, cqc, cq_period, priv->params.tx_cq_moderation_usec); 2266 MLX5_SET(cqc, cqc, cq_max_count, priv->params.tx_cq_moderation_pkts); 2267 2268 switch (priv->params.tx_cq_moderation_mode) { 2269 case 0: 2270 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_EQE); 2271 break; 2272 default: 2273 if (MLX5_CAP_GEN(priv->mdev, cq_period_start_from_cqe)) 2274 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_CQE); 2275 else 2276 MLX5_SET(cqc, cqc, cq_period_mode, MLX5_CQ_PERIOD_MODE_START_FROM_EQE); 2277 break; 2278 } 2279 2280 mlx5e_build_common_cq_param(priv, param); 2281} 2282 2283static void 2284mlx5e_build_channel_param(struct mlx5e_priv *priv, 2285 struct mlx5e_channel_param *cparam) 2286{ 2287 memset(cparam, 0, sizeof(*cparam)); 2288 2289 mlx5e_build_rq_param(priv, &cparam->rq); 2290 mlx5e_build_sq_param(priv, &cparam->sq); 2291 mlx5e_build_rx_cq_param(priv, &cparam->rx_cq); 2292 mlx5e_build_tx_cq_param(priv, &cparam->tx_cq); 2293} 2294 2295static int 2296mlx5e_open_channels(struct mlx5e_priv *priv) 2297{ 2298 struct mlx5e_channel_param cparam; 2299 int err; 2300 int i; 2301 int j; 2302 2303 mlx5e_build_channel_param(priv, &cparam); 2304 for (i = 0; i < priv->params.num_channels; i++) { 2305 err = mlx5e_open_channel(priv, i, &cparam, &priv->channel[i]); 2306 if (err) 2307 goto err_close_channels; 2308 } 2309 2310 for (j = 0; j < priv->params.num_channels; j++) { 2311 err = mlx5e_wait_for_min_rx_wqes(&priv->channel[j].rq); 2312 if (err) 2313 goto err_close_channels; 2314 } 
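	/*
	 * Editorial sketch (compiled out) of the unwind idiom this
	 * function relies on; open_one(), close_one() and n are
	 * hypothetical names. When an open fails, channels [0, i) are
	 * the ones already open and "while (i--)" closes exactly
	 * those. A failure in the wait loop above leaves i equal to
	 * num_channels, so that path tears down all channels as well.
	 */
#if 0
	for (i = 0; i != n; i++) {
		if ((err = open_one(i)) != 0)
			goto err_unwind;
	}
	return (0);
err_unwind:
	while (i--)
		close_one(i);
	return (err);
#endif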
2315 2316 return (0); 2317 2318err_close_channels: 2319 while (i--) { 2320 mlx5e_close_channel(&priv->channel[i]); 2321 mlx5e_close_channel_wait(&priv->channel[i]); 2322 } 2323 return (err); 2324} 2325 2326static void 2327mlx5e_close_channels(struct mlx5e_priv *priv) 2328{ 2329 int i; 2330 2331 for (i = 0; i < priv->params.num_channels; i++) 2332 mlx5e_close_channel(&priv->channel[i]); 2333 for (i = 0; i < priv->params.num_channels; i++) 2334 mlx5e_close_channel_wait(&priv->channel[i]); 2335} 2336 2337static int 2338mlx5e_refresh_sq_params(struct mlx5e_priv *priv, struct mlx5e_sq *sq) 2339{ 2340 2341 if (MLX5_CAP_GEN(priv->mdev, cq_period_mode_modify)) { 2342 uint8_t cq_mode; 2343 2344 switch (priv->params.tx_cq_moderation_mode) { 2345 case 0: 2346 case 2: 2347 cq_mode = MLX5_CQ_PERIOD_MODE_START_FROM_EQE; 2348 break; 2349 default: 2350 cq_mode = MLX5_CQ_PERIOD_MODE_START_FROM_CQE; 2351 break; 2352 } 2353 2354 return (mlx5_core_modify_cq_moderation_mode(priv->mdev, &sq->cq.mcq, 2355 priv->params.tx_cq_moderation_usec, 2356 priv->params.tx_cq_moderation_pkts, 2357 cq_mode)); 2358 } 2359 2360 return (mlx5_core_modify_cq_moderation(priv->mdev, &sq->cq.mcq, 2361 priv->params.tx_cq_moderation_usec, 2362 priv->params.tx_cq_moderation_pkts)); 2363} 2364 2365static int 2366mlx5e_refresh_rq_params(struct mlx5e_priv *priv, struct mlx5e_rq *rq) 2367{ 2368 2369 if (MLX5_CAP_GEN(priv->mdev, cq_period_mode_modify)) { 2370 uint8_t cq_mode; 2371 uint8_t dim_mode; 2372 int retval; 2373 2374 switch (priv->params.rx_cq_moderation_mode) { 2375 case 0: 2376 case 2: 2377 cq_mode = MLX5_CQ_PERIOD_MODE_START_FROM_EQE; 2378 dim_mode = NET_DIM_CQ_PERIOD_MODE_START_FROM_EQE; 2379 break; 2380 default: 2381 cq_mode = MLX5_CQ_PERIOD_MODE_START_FROM_CQE; 2382 dim_mode = NET_DIM_CQ_PERIOD_MODE_START_FROM_CQE; 2383 break; 2384 } 2385 2386 /* tear down dynamic interrupt moderation */ 2387 mtx_lock(&rq->mtx); 2388 rq->dim.mode = NET_DIM_CQ_PERIOD_MODE_DISABLED; 2389 mtx_unlock(&rq->mtx); 2390 2391 /* wait for dynamic interrupt moderation work task, if any */ 2392 cancel_work_sync(&rq->dim.work); 2393 2394 if (priv->params.rx_cq_moderation_mode >= 2) { 2395 struct net_dim_cq_moder curr; 2396 2397 mlx5e_get_default_profile(priv, dim_mode, &curr); 2398 2399 retval = mlx5_core_modify_cq_moderation_mode(priv->mdev, &rq->cq.mcq, 2400 curr.usec, curr.pkts, cq_mode); 2401 2402 /* set dynamic interrupt moderation mode and zero defaults */ 2403 mtx_lock(&rq->mtx); 2404 rq->dim.mode = dim_mode; 2405 rq->dim.state = 0; 2406 rq->dim.profile_ix = MLX5E_DIM_DEFAULT_PROFILE; 2407 mtx_unlock(&rq->mtx); 2408 } else { 2409 retval = mlx5_core_modify_cq_moderation_mode(priv->mdev, &rq->cq.mcq, 2410 priv->params.rx_cq_moderation_usec, 2411 priv->params.rx_cq_moderation_pkts, 2412 cq_mode); 2413 } 2414 return (retval); 2415 } 2416 2417 return (mlx5_core_modify_cq_moderation(priv->mdev, &rq->cq.mcq, 2418 priv->params.rx_cq_moderation_usec, 2419 priv->params.rx_cq_moderation_pkts)); 2420} 2421 2422static int 2423mlx5e_refresh_channel_params_sub(struct mlx5e_priv *priv, struct mlx5e_channel *c) 2424{ 2425 int err; 2426 int i; 2427 2428 err = mlx5e_refresh_rq_params(priv, &c->rq); 2429 if (err) 2430 goto done; 2431 2432 for (i = 0; i != c->num_tc; i++) { 2433 err = mlx5e_refresh_sq_params(priv, &c->sq[i]); 2434 if (err) 2435 goto done; 2436 } 2437done: 2438 return (err); 2439} 2440 2441int 2442mlx5e_refresh_channel_params(struct mlx5e_priv *priv) 2443{ 2444 int i; 2445 2446 /* check if channels are closed */ 2447 if (test_bit(MLX5E_STATE_OPENED, 
&priv->state) == 0) 2448 return (EINVAL); 2449 2450 for (i = 0; i < priv->params.num_channels; i++) { 2451 int err; 2452 2453 err = mlx5e_refresh_channel_params_sub(priv, &priv->channel[i]); 2454 if (err) 2455 return (err); 2456 } 2457 return (0); 2458} 2459 2460static int 2461mlx5e_open_tis(struct mlx5e_priv *priv, int tc) 2462{ 2463 struct mlx5_core_dev *mdev = priv->mdev; 2464 u32 in[MLX5_ST_SZ_DW(create_tis_in)]; 2465 void *tisc = MLX5_ADDR_OF(create_tis_in, in, ctx); 2466 2467 memset(in, 0, sizeof(in)); 2468 2469 MLX5_SET(tisc, tisc, prio, tc); 2470 MLX5_SET(tisc, tisc, transport_domain, priv->tdn); 2471 2472 return (mlx5_core_create_tis(mdev, in, sizeof(in), &priv->tisn[tc])); 2473} 2474 2475static void 2476mlx5e_close_tis(struct mlx5e_priv *priv, int tc) 2477{ 2478 mlx5_core_destroy_tis(priv->mdev, priv->tisn[tc]); 2479} 2480 2481static int 2482mlx5e_open_tises(struct mlx5e_priv *priv) 2483{ 2484 int num_tc = priv->num_tc; 2485 int err; 2486 int tc; 2487 2488 for (tc = 0; tc < num_tc; tc++) { 2489 err = mlx5e_open_tis(priv, tc); 2490 if (err) 2491 goto err_close_tises; 2492 } 2493 2494 return (0); 2495 2496err_close_tises: 2497 for (tc--; tc >= 0; tc--) 2498 mlx5e_close_tis(priv, tc); 2499 2500 return (err); 2501} 2502 2503static void 2504mlx5e_close_tises(struct mlx5e_priv *priv) 2505{ 2506 int num_tc = priv->num_tc; 2507 int tc; 2508 2509 for (tc = 0; tc < num_tc; tc++) 2510 mlx5e_close_tis(priv, tc); 2511} 2512 2513static int 2514mlx5e_open_rqt(struct mlx5e_priv *priv) 2515{ 2516 struct mlx5_core_dev *mdev = priv->mdev; 2517 u32 *in; 2518 u32 out[MLX5_ST_SZ_DW(create_rqt_out)] = {0}; 2519 void *rqtc; 2520 int inlen; 2521 int err; 2522 int sz; 2523 int i; 2524 2525 sz = 1 << priv->params.rx_hash_log_tbl_sz; 2526 2527 inlen = MLX5_ST_SZ_BYTES(create_rqt_in) + sizeof(u32) * sz; 2528 in = mlx5_vzalloc(inlen); 2529 if (in == NULL) 2530 return (-ENOMEM); 2531 rqtc = MLX5_ADDR_OF(create_rqt_in, in, rqt_context); 2532 2533 MLX5_SET(rqtc, rqtc, rqt_actual_size, sz); 2534 MLX5_SET(rqtc, rqtc, rqt_max_size, sz); 2535 2536 for (i = 0; i < sz; i++) { 2537 int ix = i; 2538#ifdef RSS 2539 ix = rss_get_indirection_to_bucket(ix); 2540#endif 2541 /* ensure we don't overflow */ 2542 ix %= priv->params.num_channels; 2543 2544 /* apply receive side scaling stride, if any */ 2545 ix -= ix % (int)priv->params.channels_rsss; 2546 2547 MLX5_SET(rqtc, rqtc, rq_num[i], priv->channel[ix].rq.rqn); 2548 } 2549 2550 MLX5_SET(create_rqt_in, in, opcode, MLX5_CMD_OP_CREATE_RQT); 2551 2552 err = mlx5_cmd_exec(mdev, in, inlen, out, sizeof(out)); 2553 if (!err) 2554 priv->rqtn = MLX5_GET(create_rqt_out, out, rqtn); 2555 2556 kvfree(in); 2557 2558 return (err); 2559} 2560 2561static void 2562mlx5e_close_rqt(struct mlx5e_priv *priv) 2563{ 2564 u32 in[MLX5_ST_SZ_DW(destroy_rqt_in)] = {0}; 2565 u32 out[MLX5_ST_SZ_DW(destroy_rqt_out)] = {0}; 2566 2567 MLX5_SET(destroy_rqt_in, in, opcode, MLX5_CMD_OP_DESTROY_RQT); 2568 MLX5_SET(destroy_rqt_in, in, rqtn, priv->rqtn); 2569 2570 mlx5_cmd_exec(priv->mdev, in, sizeof(in), out, sizeof(out)); 2571} 2572 2573static void 2574mlx5e_build_tir_ctx(struct mlx5e_priv *priv, u32 * tirc, int tt) 2575{ 2576 void *hfso = MLX5_ADDR_OF(tirc, tirc, rx_hash_field_selector_outer); 2577 __be32 *hkey; 2578 2579 MLX5_SET(tirc, tirc, transport_domain, priv->tdn); 2580 2581#define ROUGH_MAX_L2_L3_HDR_SZ 256 2582 2583#define MLX5_HASH_IP (MLX5_HASH_FIELD_SEL_SRC_IP |\ 2584 MLX5_HASH_FIELD_SEL_DST_IP) 2585 2586#define MLX5_HASH_ALL (MLX5_HASH_FIELD_SEL_SRC_IP |\ 2587 MLX5_HASH_FIELD_SEL_DST_IP |\ 2588 
MLX5_HASH_FIELD_SEL_L4_SPORT |\ 2589 MLX5_HASH_FIELD_SEL_L4_DPORT) 2590 2591#define MLX5_HASH_IP_IPSEC_SPI (MLX5_HASH_FIELD_SEL_SRC_IP |\ 2592 MLX5_HASH_FIELD_SEL_DST_IP |\ 2593 MLX5_HASH_FIELD_SEL_IPSEC_SPI) 2594 2595 if (priv->params.hw_lro_en) { 2596 MLX5_SET(tirc, tirc, lro_enable_mask, 2597 MLX5_TIRC_LRO_ENABLE_MASK_IPV4_LRO | 2598 MLX5_TIRC_LRO_ENABLE_MASK_IPV6_LRO); 2599 MLX5_SET(tirc, tirc, lro_max_msg_sz, 2600 (priv->params.lro_wqe_sz - 2601 ROUGH_MAX_L2_L3_HDR_SZ) >> 8); 2602 /* TODO: add the option to choose timer value dynamically */ 2603 MLX5_SET(tirc, tirc, lro_timeout_period_usecs, 2604 MLX5_CAP_ETH(priv->mdev, 2605 lro_timer_supported_periods[2])); 2606 } 2607 2608 /* setup parameters for hashing TIR type, if any */ 2609 switch (tt) { 2610 case MLX5E_TT_ANY: 2611 MLX5_SET(tirc, tirc, disp_type, 2612 MLX5_TIRC_DISP_TYPE_DIRECT); 2613 MLX5_SET(tirc, tirc, inline_rqn, 2614 priv->channel[0].rq.rqn); 2615 break; 2616 default: 2617 MLX5_SET(tirc, tirc, disp_type, 2618 MLX5_TIRC_DISP_TYPE_INDIRECT); 2619 MLX5_SET(tirc, tirc, indirect_table, 2620 priv->rqtn); 2621 MLX5_SET(tirc, tirc, rx_hash_fn, 2622 MLX5_TIRC_RX_HASH_FN_HASH_TOEPLITZ); 2623 hkey = (__be32 *) MLX5_ADDR_OF(tirc, tirc, rx_hash_toeplitz_key); 2624#ifdef RSS 2625 /* 2626 * The FreeBSD RSS implementation does currently not 2627 * support symmetric Toeplitz hashes: 2628 */ 2629 MLX5_SET(tirc, tirc, rx_hash_symmetric, 0); 2630 rss_getkey((uint8_t *)hkey); 2631#else 2632 MLX5_SET(tirc, tirc, rx_hash_symmetric, 1); 2633 hkey[0] = cpu_to_be32(0xD181C62C); 2634 hkey[1] = cpu_to_be32(0xF7F4DB5B); 2635 hkey[2] = cpu_to_be32(0x1983A2FC); 2636 hkey[3] = cpu_to_be32(0x943E1ADB); 2637 hkey[4] = cpu_to_be32(0xD9389E6B); 2638 hkey[5] = cpu_to_be32(0xD1039C2C); 2639 hkey[6] = cpu_to_be32(0xA74499AD); 2640 hkey[7] = cpu_to_be32(0x593D56D9); 2641 hkey[8] = cpu_to_be32(0xF3253C06); 2642 hkey[9] = cpu_to_be32(0x2ADC1FFC); 2643#endif 2644 break; 2645 } 2646 2647 switch (tt) { 2648 case MLX5E_TT_IPV4_TCP: 2649 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2650 MLX5_L3_PROT_TYPE_IPV4); 2651 MLX5_SET(rx_hash_field_select, hfso, l4_prot_type, 2652 MLX5_L4_PROT_TYPE_TCP); 2653#ifdef RSS 2654 if (!(rss_gethashconfig() & RSS_HASHTYPE_RSS_TCP_IPV4)) { 2655 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2656 MLX5_HASH_IP); 2657 } else 2658#endif 2659 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2660 MLX5_HASH_ALL); 2661 break; 2662 2663 case MLX5E_TT_IPV6_TCP: 2664 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2665 MLX5_L3_PROT_TYPE_IPV6); 2666 MLX5_SET(rx_hash_field_select, hfso, l4_prot_type, 2667 MLX5_L4_PROT_TYPE_TCP); 2668#ifdef RSS 2669 if (!(rss_gethashconfig() & RSS_HASHTYPE_RSS_TCP_IPV6)) { 2670 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2671 MLX5_HASH_IP); 2672 } else 2673#endif 2674 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2675 MLX5_HASH_ALL); 2676 break; 2677 2678 case MLX5E_TT_IPV4_UDP: 2679 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2680 MLX5_L3_PROT_TYPE_IPV4); 2681 MLX5_SET(rx_hash_field_select, hfso, l4_prot_type, 2682 MLX5_L4_PROT_TYPE_UDP); 2683#ifdef RSS 2684 if (!(rss_gethashconfig() & RSS_HASHTYPE_RSS_UDP_IPV4)) { 2685 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2686 MLX5_HASH_IP); 2687 } else 2688#endif 2689 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2690 MLX5_HASH_ALL); 2691 break; 2692 2693 case MLX5E_TT_IPV6_UDP: 2694 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2695 MLX5_L3_PROT_TYPE_IPV6); 2696 MLX5_SET(rx_hash_field_select, hfso, 
l4_prot_type, 2697 MLX5_L4_PROT_TYPE_UDP); 2698#ifdef RSS 2699 if (!(rss_gethashconfig() & RSS_HASHTYPE_RSS_UDP_IPV6)) { 2700 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2701 MLX5_HASH_IP); 2702 } else 2703#endif 2704 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2705 MLX5_HASH_ALL); 2706 break; 2707 2708 case MLX5E_TT_IPV4_IPSEC_AH: 2709 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2710 MLX5_L3_PROT_TYPE_IPV4); 2711 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2712 MLX5_HASH_IP_IPSEC_SPI); 2713 break; 2714 2715 case MLX5E_TT_IPV6_IPSEC_AH: 2716 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2717 MLX5_L3_PROT_TYPE_IPV6); 2718 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2719 MLX5_HASH_IP_IPSEC_SPI); 2720 break; 2721 2722 case MLX5E_TT_IPV4_IPSEC_ESP: 2723 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2724 MLX5_L3_PROT_TYPE_IPV4); 2725 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2726 MLX5_HASH_IP_IPSEC_SPI); 2727 break; 2728 2729 case MLX5E_TT_IPV6_IPSEC_ESP: 2730 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2731 MLX5_L3_PROT_TYPE_IPV6); 2732 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2733 MLX5_HASH_IP_IPSEC_SPI); 2734 break; 2735 2736 case MLX5E_TT_IPV4: 2737 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2738 MLX5_L3_PROT_TYPE_IPV4); 2739 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2740 MLX5_HASH_IP); 2741 break; 2742 2743 case MLX5E_TT_IPV6: 2744 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type, 2745 MLX5_L3_PROT_TYPE_IPV6); 2746 MLX5_SET(rx_hash_field_select, hfso, selected_fields, 2747 MLX5_HASH_IP); 2748 break; 2749 2750 default: 2751 break; 2752 } 2753} 2754 2755static int 2756mlx5e_open_tir(struct mlx5e_priv *priv, int tt) 2757{ 2758 struct mlx5_core_dev *mdev = priv->mdev; 2759 u32 *in; 2760 void *tirc; 2761 int inlen; 2762 int err; 2763 2764 inlen = MLX5_ST_SZ_BYTES(create_tir_in); 2765 in = mlx5_vzalloc(inlen); 2766 if (in == NULL) 2767 return (-ENOMEM); 2768 tirc = MLX5_ADDR_OF(create_tir_in, in, tir_context); 2769 2770 mlx5e_build_tir_ctx(priv, tirc, tt); 2771 2772 err = mlx5_core_create_tir(mdev, in, inlen, &priv->tirn[tt]); 2773 2774 kvfree(in); 2775 2776 return (err); 2777} 2778 2779static void 2780mlx5e_close_tir(struct mlx5e_priv *priv, int tt) 2781{ 2782 mlx5_core_destroy_tir(priv->mdev, priv->tirn[tt]); 2783} 2784 2785static int 2786mlx5e_open_tirs(struct mlx5e_priv *priv) 2787{ 2788 int err; 2789 int i; 2790 2791 for (i = 0; i < MLX5E_NUM_TT; i++) { 2792 err = mlx5e_open_tir(priv, i); 2793 if (err) 2794 goto err_close_tirs; 2795 } 2796 2797 return (0); 2798 2799err_close_tirs: 2800 for (i--; i >= 0; i--) 2801 mlx5e_close_tir(priv, i); 2802 2803 return (err); 2804} 2805 2806static void 2807mlx5e_close_tirs(struct mlx5e_priv *priv) 2808{ 2809 int i; 2810 2811 for (i = 0; i < MLX5E_NUM_TT; i++) 2812 mlx5e_close_tir(priv, i); 2813} 2814 2815/* 2816 * SW MTU does not include headers, 2817 * HW MTU includes all headers and checksums. 
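 *
 * Editorial example (assuming MLX5E_SW2HW_MTU adds ETHER_HDR_LEN +
 * ETHER_VLAN_ENCAP_LEN + ETHER_CRC_LEN): a SW MTU of 1500 maps to a
 * HW MTU of 1500 + 14 + 4 + 4 = 1522 bytes.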
2818 */
2819 static int
2820 mlx5e_set_dev_port_mtu(struct ifnet *ifp, int sw_mtu)
2821 {
2822 	struct mlx5e_priv *priv = ifp->if_softc;
2823 	struct mlx5_core_dev *mdev = priv->mdev;
2824 	int hw_mtu;
2825 	int err;
2826 
2827 	hw_mtu = MLX5E_SW2HW_MTU(sw_mtu);
2828 
2829 	err = mlx5_set_port_mtu(mdev, hw_mtu);
2830 	if (err) {
2831 		if_printf(ifp, "%s: mlx5_set_port_mtu failed setting %d, err=%d\n",
2832 		    __func__, sw_mtu, err);
2833 		return (err);
2834 	}
2835 
2836 	/* Update vport context MTU */
2837 	err = mlx5_set_vport_mtu(mdev, hw_mtu);
2838 	if (err) {
2839 		if_printf(ifp, "%s: Failed updating vport context with MTU size, err=%d\n",
2840 		    __func__, err);
2841 	}
2842 
2843 	ifp->if_mtu = sw_mtu;
2844 
2845 	err = mlx5_query_vport_mtu(mdev, &hw_mtu);
2846 	if (err || !hw_mtu) {
2847 		/* fallback to port oper mtu */
2848 		err = mlx5_query_port_oper_mtu(mdev, &hw_mtu);
2849 	}
2850 	if (err) {
2851 		if_printf(ifp, "Query port MTU, after setting new "
2852 		    "MTU value, failed\n");
2853 		return (err);
2854 	} else if (MLX5E_HW2SW_MTU(hw_mtu) < sw_mtu) {
2855 		err = -E2BIG;
2856 		if_printf(ifp, "Port MTU %d is smaller than "
2857 		    "ifp mtu %d\n", hw_mtu, sw_mtu);
2858 	} else if (MLX5E_HW2SW_MTU(hw_mtu) > sw_mtu) {
2859 		err = -EINVAL;
2860 		if_printf(ifp, "Port MTU %d is bigger than "
2861 		    "ifp mtu %d\n", hw_mtu, sw_mtu);
2862 	}
2863 	priv->params_ethtool.hw_mtu = hw_mtu;
2864 
2865 	return (err);
2866 }
2867 
2868 int
2869 mlx5e_open_locked(struct ifnet *ifp)
2870 {
2871 	struct mlx5e_priv *priv = ifp->if_softc;
2872 	int err;
2873 	u16 set_id;
2874 
2875 	/* check if already opened */
2876 	if (test_bit(MLX5E_STATE_OPENED, &priv->state) != 0)
2877 		return (0);
2878 
2879 #ifdef RSS
2880 	if (rss_getnumbuckets() > priv->params.num_channels) {
2881 		if_printf(ifp, "NOTE: There are more RSS buckets(%u) than "
2882 		    "channels(%u) available\n", rss_getnumbuckets(),
2883 		    priv->params.num_channels);
2884 	}
2885 #endif
2886 	err = mlx5e_open_tises(priv);
2887 	if (err) {
2888 		if_printf(ifp, "%s: mlx5e_open_tises failed, %d\n",
2889 		    __func__, err);
2890 		return (err);
2891 	}
2892 	err = mlx5_vport_alloc_q_counter(priv->mdev,
2893 	    MLX5_INTERFACE_PROTOCOL_ETH, &set_id);
2894 	if (err) {
2895 		if_printf(priv->ifp,
2896 		    "%s: mlx5_vport_alloc_q_counter failed: %d\n",
2897 		    __func__, err);
2898 		goto err_close_tises;
2899 	}
2900 	/* store counter set ID */
2901 	priv->counter_set_id = set_id;
2902 
2903 	err = mlx5e_open_channels(priv);
2904 	if (err) {
2905 		if_printf(ifp, "%s: mlx5e_open_channels failed, %d\n",
2906 		    __func__, err);
2907 		goto err_dalloc_q_counter;
2908 	}
2909 	err = mlx5e_open_rqt(priv);
2910 	if (err) {
2911 		if_printf(ifp, "%s: mlx5e_open_rqt failed, %d\n",
2912 		    __func__, err);
2913 		goto err_close_channels;
2914 	}
2915 	err = mlx5e_open_tirs(priv);
2916 	if (err) {
2917 		if_printf(ifp, "%s: mlx5e_open_tir failed, %d\n",
2918 		    __func__, err);
2919 		goto err_close_rqls;
2920 	}
2921 	err = mlx5e_open_flow_table(priv);
2922 	if (err) {
2923 		if_printf(ifp, "%s: mlx5e_open_flow_table failed, %d\n",
2924 		    __func__, err);
2925 		goto err_close_tirs;
2926 	}
2927 	err = mlx5e_add_all_vlan_rules(priv);
2928 	if (err) {
2929 		if_printf(ifp, "%s: mlx5e_add_all_vlan_rules failed, %d\n",
2930 		    __func__, err);
2931 		goto err_close_flow_table;
2932 	}
2933 	set_bit(MLX5E_STATE_OPENED, &priv->state);
2934 
2935 	mlx5e_update_carrier(priv);
2936 	mlx5e_set_rx_mode_core(priv);
2937 
2938 	return (0);
2939 
2940 err_close_flow_table:
2941 	mlx5e_close_flow_table(priv);
2942 
2943 err_close_tirs:
2944 	mlx5e_close_tirs(priv);
2945 
2946 err_close_rqls:
2947 	mlx5e_close_rqt(priv);
2948 
2949err_close_channels: 2950 mlx5e_close_channels(priv); 2951 2952err_dalloc_q_counter: 2953 mlx5_vport_dealloc_q_counter(priv->mdev, 2954 MLX5_INTERFACE_PROTOCOL_ETH, priv->counter_set_id); 2955 2956err_close_tises: 2957 mlx5e_close_tises(priv); 2958 2959 return (err); 2960} 2961 2962static void 2963mlx5e_open(void *arg) 2964{ 2965 struct mlx5e_priv *priv = arg; 2966 2967 PRIV_LOCK(priv); 2968 if (mlx5_set_port_status(priv->mdev, MLX5_PORT_UP)) 2969 if_printf(priv->ifp, 2970 "%s: Setting port status to up failed\n", 2971 __func__); 2972 2973 mlx5e_open_locked(priv->ifp); 2974 priv->ifp->if_drv_flags |= IFF_DRV_RUNNING; 2975 PRIV_UNLOCK(priv); 2976} 2977 2978int 2979mlx5e_close_locked(struct ifnet *ifp) 2980{ 2981 struct mlx5e_priv *priv = ifp->if_softc; 2982 2983 /* check if already closed */ 2984 if (test_bit(MLX5E_STATE_OPENED, &priv->state) == 0) 2985 return (0); 2986 2987 clear_bit(MLX5E_STATE_OPENED, &priv->state); 2988 2989 mlx5e_set_rx_mode_core(priv); 2990 mlx5e_del_all_vlan_rules(priv); 2991 if_link_state_change(priv->ifp, LINK_STATE_DOWN); 2992 mlx5e_close_flow_table(priv); 2993 mlx5e_close_tirs(priv); 2994 mlx5e_close_rqt(priv); 2995 mlx5e_close_channels(priv); 2996 mlx5_vport_dealloc_q_counter(priv->mdev, 2997 MLX5_INTERFACE_PROTOCOL_ETH, priv->counter_set_id); 2998 mlx5e_close_tises(priv); 2999 3000 return (0); 3001} 3002 3003#if (__FreeBSD_version >= 1100000) 3004static uint64_t 3005mlx5e_get_counter(struct ifnet *ifp, ift_counter cnt) 3006{ 3007 struct mlx5e_priv *priv = ifp->if_softc; 3008 u64 retval; 3009 3010 /* PRIV_LOCK(priv); XXX not allowed */ 3011 switch (cnt) { 3012 case IFCOUNTER_IPACKETS: 3013 retval = priv->stats.vport.rx_packets; 3014 break; 3015 case IFCOUNTER_IERRORS: 3016 retval = priv->stats.pport.in_range_len_errors + 3017 priv->stats.pport.out_of_range_len + 3018 priv->stats.pport.too_long_errors + 3019 priv->stats.pport.check_seq_err + 3020 priv->stats.pport.alignment_err; 3021 break; 3022 case IFCOUNTER_IQDROPS: 3023 retval = priv->stats.vport.rx_out_of_buffer; 3024 break; 3025 case IFCOUNTER_OPACKETS: 3026 retval = priv->stats.vport.tx_packets; 3027 break; 3028 case IFCOUNTER_OERRORS: 3029 retval = priv->stats.port_stats_debug.out_discards; 3030 break; 3031 case IFCOUNTER_IBYTES: 3032 retval = priv->stats.vport.rx_bytes; 3033 break; 3034 case IFCOUNTER_OBYTES: 3035 retval = priv->stats.vport.tx_bytes; 3036 break; 3037 case IFCOUNTER_IMCASTS: 3038 retval = priv->stats.vport.rx_multicast_packets; 3039 break; 3040 case IFCOUNTER_OMCASTS: 3041 retval = priv->stats.vport.tx_multicast_packets; 3042 break; 3043 case IFCOUNTER_OQDROPS: 3044 retval = priv->stats.vport.tx_queue_dropped; 3045 break; 3046 case IFCOUNTER_COLLISIONS: 3047 retval = priv->stats.pport.collisions; 3048 break; 3049 default: 3050 retval = if_get_counter_default(ifp, cnt); 3051 break; 3052 } 3053 /* PRIV_UNLOCK(priv); XXX not allowed */ 3054 return (retval); 3055} 3056#endif 3057 3058static void 3059mlx5e_set_rx_mode(struct ifnet *ifp) 3060{ 3061 struct mlx5e_priv *priv = ifp->if_softc; 3062 3063 queue_work(priv->wq, &priv->set_rx_mode_work); 3064} 3065 3066static int 3067mlx5e_ioctl(struct ifnet *ifp, u_long command, caddr_t data) 3068{ 3069 struct mlx5e_priv *priv; 3070 struct ifreq *ifr; 3071 struct ifi2creq i2c; 3072 int error = 0; 3073 int mask = 0; 3074 int size_read = 0; 3075 int module_status; 3076 int module_num; 3077 int max_mtu; 3078 uint8_t read_addr; 3079 3080 priv = ifp->if_softc; 3081 3082 /* check if detaching */ 3083 if (priv == NULL || priv->gone != 0) 3084 return 
(ENXIO); 3085 3086 switch (command) { 3087 case SIOCSIFMTU: 3088 ifr = (struct ifreq *)data; 3089 3090 PRIV_LOCK(priv); 3091 mlx5_query_port_max_mtu(priv->mdev, &max_mtu); 3092 3093 if (ifr->ifr_mtu >= MLX5E_MTU_MIN && 3094 ifr->ifr_mtu <= MIN(MLX5E_MTU_MAX, max_mtu)) { 3095 int was_opened; 3096 3097 was_opened = test_bit(MLX5E_STATE_OPENED, &priv->state); 3098 if (was_opened) 3099 mlx5e_close_locked(ifp); 3100 3101 /* set new MTU */ 3102 mlx5e_set_dev_port_mtu(ifp, ifr->ifr_mtu); 3103 3104 if (was_opened) 3105 mlx5e_open_locked(ifp); 3106 } else { 3107 error = EINVAL; 3108 if_printf(ifp, "Invalid MTU value. Min val: %d, Max val: %d\n", 3109 MLX5E_MTU_MIN, MIN(MLX5E_MTU_MAX, max_mtu)); 3110 } 3111 PRIV_UNLOCK(priv); 3112 break; 3113 case SIOCSIFFLAGS: 3114 if ((ifp->if_flags & IFF_UP) && 3115 (ifp->if_drv_flags & IFF_DRV_RUNNING)) { 3116 mlx5e_set_rx_mode(ifp); 3117 break; 3118 } 3119 PRIV_LOCK(priv); 3120 if (ifp->if_flags & IFF_UP) { 3121 if ((ifp->if_drv_flags & IFF_DRV_RUNNING) == 0) { 3122 if (test_bit(MLX5E_STATE_OPENED, &priv->state) == 0) 3123 mlx5e_open_locked(ifp); 3124 ifp->if_drv_flags |= IFF_DRV_RUNNING; 3125 mlx5_set_port_status(priv->mdev, MLX5_PORT_UP); 3126 } 3127 } else { 3128 if (ifp->if_drv_flags & IFF_DRV_RUNNING) { 3129 mlx5_set_port_status(priv->mdev, 3130 MLX5_PORT_DOWN); 3131 if (test_bit(MLX5E_STATE_OPENED, &priv->state) != 0) 3132 mlx5e_close_locked(ifp); 3133 mlx5e_update_carrier(priv); 3134 ifp->if_drv_flags &= ~IFF_DRV_RUNNING; 3135 } 3136 } 3137 PRIV_UNLOCK(priv); 3138 break; 3139 case SIOCADDMULTI: 3140 case SIOCDELMULTI: 3141 mlx5e_set_rx_mode(ifp); 3142 break; 3143 case SIOCSIFMEDIA: 3144 case SIOCGIFMEDIA: 3145 case SIOCGIFXMEDIA: 3146 ifr = (struct ifreq *)data; 3147 error = ifmedia_ioctl(ifp, ifr, &priv->media, command); 3148 break; 3149 case SIOCSIFCAP: 3150 ifr = (struct ifreq *)data; 3151 PRIV_LOCK(priv); 3152 mask = ifr->ifr_reqcap ^ ifp->if_capenable; 3153 3154 if (mask & IFCAP_TXCSUM) { 3155 ifp->if_capenable ^= IFCAP_TXCSUM; 3156 ifp->if_hwassist ^= (CSUM_TCP | CSUM_UDP | CSUM_IP); 3157 3158 if (IFCAP_TSO4 & ifp->if_capenable && 3159 !(IFCAP_TXCSUM & ifp->if_capenable)) { 3160 ifp->if_capenable &= ~IFCAP_TSO4; 3161 ifp->if_hwassist &= ~CSUM_IP_TSO; 3162 if_printf(ifp, 3163 "tso4 disabled due to -txcsum.\n"); 3164 } 3165 } 3166 if (mask & IFCAP_TXCSUM_IPV6) { 3167 ifp->if_capenable ^= IFCAP_TXCSUM_IPV6; 3168 ifp->if_hwassist ^= (CSUM_UDP_IPV6 | CSUM_TCP_IPV6); 3169 3170 if (IFCAP_TSO6 & ifp->if_capenable && 3171 !(IFCAP_TXCSUM_IPV6 & ifp->if_capenable)) { 3172 ifp->if_capenable &= ~IFCAP_TSO6; 3173 ifp->if_hwassist &= ~CSUM_IP6_TSO; 3174 if_printf(ifp, 3175 "tso6 disabled due to -txcsum6.\n"); 3176 } 3177 } 3178 if (mask & IFCAP_RXCSUM) 3179 ifp->if_capenable ^= IFCAP_RXCSUM; 3180 if (mask & IFCAP_RXCSUM_IPV6) 3181 ifp->if_capenable ^= IFCAP_RXCSUM_IPV6; 3182 if (mask & IFCAP_TSO4) { 3183 if (!(IFCAP_TSO4 & ifp->if_capenable) && 3184 !(IFCAP_TXCSUM & ifp->if_capenable)) { 3185 if_printf(ifp, "enable txcsum first.\n"); 3186 error = EAGAIN; 3187 goto out; 3188 } 3189 ifp->if_capenable ^= IFCAP_TSO4; 3190 ifp->if_hwassist ^= CSUM_IP_TSO; 3191 } 3192 if (mask & IFCAP_TSO6) { 3193 if (!(IFCAP_TSO6 & ifp->if_capenable) && 3194 !(IFCAP_TXCSUM_IPV6 & ifp->if_capenable)) { 3195 if_printf(ifp, "enable txcsum6 first.\n"); 3196 error = EAGAIN; 3197 goto out; 3198 } 3199 ifp->if_capenable ^= IFCAP_TSO6; 3200 ifp->if_hwassist ^= CSUM_IP6_TSO; 3201 } 3202 if (mask & IFCAP_VLAN_HWFILTER) { 3203 if (ifp->if_capenable & IFCAP_VLAN_HWFILTER) 3204 
				mlx5e_disable_vlan_filter(priv);
3205 			else
3206 				mlx5e_enable_vlan_filter(priv);
3207 
3208 			ifp->if_capenable ^= IFCAP_VLAN_HWFILTER;
3209 		}
3210 		if (mask & IFCAP_VLAN_HWTAGGING)
3211 			ifp->if_capenable ^= IFCAP_VLAN_HWTAGGING;
3212 		if (mask & IFCAP_WOL_MAGIC)
3213 			ifp->if_capenable ^= IFCAP_WOL_MAGIC;
3214 
3215 		VLAN_CAPABILITIES(ifp);
3216 		/* turning off LRO also turns off HW LRO, if it is enabled */
3217 		if (mask & IFCAP_LRO) {
3218 			int was_opened = test_bit(MLX5E_STATE_OPENED, &priv->state);
3219 			bool need_restart = false;
3220 
3221 			ifp->if_capenable ^= IFCAP_LRO;
3222 
3223 			/* figure out if updating HW LRO is needed */
3224 			if (!(ifp->if_capenable & IFCAP_LRO)) {
3225 				if (priv->params.hw_lro_en) {
3226 					priv->params.hw_lro_en = false;
3227 					need_restart = true;
3228 				}
3229 			} else {
3230 				if (priv->params.hw_lro_en == false &&
3231 				    priv->params_ethtool.hw_lro != 0) {
3232 					priv->params.hw_lro_en = true;
3233 					need_restart = true;
3234 				}
3235 			}
3236 			if (was_opened && need_restart) {
3237 				mlx5e_close_locked(ifp);
3238 				mlx5e_open_locked(ifp);
3239 			}
3240 		}
3241 out:
3242 		PRIV_UNLOCK(priv);
3243 		break;
3244 
3245 	case SIOCGI2C:
3246 		ifr = (struct ifreq *)data;
3247 
3248 		/*
3249 		 * Copy from the user-space address ifr_data to the
3250 		 * kernel-space address i2c.
3251 		 */
3252 		error = copyin(ifr_data_get_ptr(ifr), &i2c, sizeof(i2c));
3253 		if (error)
3254 			break;
3255 
3256 		if (i2c.len > sizeof(i2c.data)) {
3257 			error = EINVAL;
3258 			break;
3259 		}
3260 
3261 		PRIV_LOCK(priv);
3262 		/* Get module_num, which is required for the EEPROM query */
3263 		error = mlx5_query_module_num(priv->mdev, &module_num);
3264 		if (error) {
3265 			if_printf(ifp, "Query module num failed, eeprom "
3266 			    "reading is not supported\n");
3267 			error = EINVAL;
3268 			goto err_i2c;
3269 		}
3270 		/* Check if module is present before doing an access */
3271 		module_status = mlx5_query_module_status(priv->mdev, module_num);
3272 		if (module_status != MLX5_MODULE_STATUS_PLUGGED_ENABLED &&
3273 		    module_status != MLX5_MODULE_STATUS_PLUGGED_DISABLED) {
3274 			error = EINVAL;
3275 			goto err_i2c;
3276 		}
3277 		/*
3278 		 * Currently 0xA0 and 0xA2 are the only addresses permitted.
3279 * The internal conversion is as follows: 3280 */ 3281 if (i2c.dev_addr == 0xA0) 3282 read_addr = MLX5E_I2C_ADDR_LOW; 3283 else if (i2c.dev_addr == 0xA2) 3284 read_addr = MLX5E_I2C_ADDR_HIGH; 3285 else { 3286 if_printf(ifp, "Query eeprom failed, " 3287 "Invalid Address: %X\n", i2c.dev_addr); 3288 error = EINVAL; 3289 goto err_i2c; 3290 } 3291 error = mlx5_query_eeprom(priv->mdev, 3292 read_addr, MLX5E_EEPROM_LOW_PAGE, 3293 (uint32_t)i2c.offset, (uint32_t)i2c.len, module_num, 3294 (uint32_t *)i2c.data, &size_read); 3295 if (error) { 3296 if_printf(ifp, "Query eeprom failed, eeprom " 3297 "reading is not supported\n"); 3298 error = EINVAL; 3299 goto err_i2c; 3300 } 3301 3302 if (i2c.len > MLX5_EEPROM_MAX_BYTES) { 3303 error = mlx5_query_eeprom(priv->mdev, 3304 read_addr, MLX5E_EEPROM_LOW_PAGE, 3305 (uint32_t)(i2c.offset + size_read), 3306 (uint32_t)(i2c.len - size_read), module_num, 3307 (uint32_t *)(i2c.data + size_read), &size_read); 3308 } 3309 if (error) { 3310 if_printf(ifp, "Query eeprom failed, eeprom " 3311 "reading is not supported\n"); 3312 error = EINVAL; 3313 goto err_i2c; 3314 } 3315 3316 error = copyout(&i2c, ifr_data_get_ptr(ifr), sizeof(i2c)); 3317err_i2c: 3318 PRIV_UNLOCK(priv); 3319 break; 3320 3321 default: 3322 error = ether_ioctl(ifp, command, data); 3323 break; 3324 } 3325 return (error); 3326} 3327 3328static int 3329mlx5e_check_required_hca_cap(struct mlx5_core_dev *mdev) 3330{ 3331 /* 3332 * TODO: uncoment once FW really sets all these bits if 3333 * (!mdev->caps.eth.rss_ind_tbl_cap || !mdev->caps.eth.csum_cap || 3334 * !mdev->caps.eth.max_lso_cap || !mdev->caps.eth.vlan_cap || 3335 * !(mdev->caps.gen.flags & MLX5_DEV_CAP_FLAG_SCQE_BRK_MOD)) return 3336 * -ENOTSUPP; 3337 */ 3338 3339 /* TODO: add more must-to-have features */ 3340 3341 if (MLX5_CAP_GEN(mdev, port_type) != MLX5_CAP_PORT_TYPE_ETH) 3342 return (-ENODEV); 3343 3344 return (0); 3345} 3346 3347static u16 3348mlx5e_get_max_inline_cap(struct mlx5_core_dev *mdev) 3349{ 3350 uint32_t bf_buf_size = (1U << MLX5_CAP_GEN(mdev, log_bf_reg_size)) / 2U; 3351 3352 bf_buf_size -= sizeof(struct mlx5e_tx_wqe) - 2; 3353 3354 /* verify against driver hardware limit */ 3355 if (bf_buf_size > MLX5E_MAX_TX_INLINE) 3356 bf_buf_size = MLX5E_MAX_TX_INLINE; 3357 3358 return (bf_buf_size); 3359} 3360 3361static int 3362mlx5e_build_ifp_priv(struct mlx5_core_dev *mdev, 3363 struct mlx5e_priv *priv, 3364 int num_comp_vectors) 3365{ 3366 int err; 3367 3368 /* 3369 * TODO: Consider link speed for setting "log_sq_size", 3370 * "log_rq_size" and "cq_moderation_xxx": 3371 */ 3372 priv->params.log_sq_size = 3373 MLX5E_PARAMS_DEFAULT_LOG_SQ_SIZE; 3374 priv->params.log_rq_size = 3375 MLX5E_PARAMS_DEFAULT_LOG_RQ_SIZE; 3376 priv->params.rx_cq_moderation_usec = 3377 MLX5_CAP_GEN(mdev, cq_period_start_from_cqe) ? 3378 MLX5E_PARAMS_DEFAULT_RX_CQ_MODERATION_USEC_FROM_CQE : 3379 MLX5E_PARAMS_DEFAULT_RX_CQ_MODERATION_USEC; 3380 priv->params.rx_cq_moderation_mode = 3381 MLX5_CAP_GEN(mdev, cq_period_start_from_cqe) ? 1 : 0; 3382 priv->params.rx_cq_moderation_pkts = 3383 MLX5E_PARAMS_DEFAULT_RX_CQ_MODERATION_PKTS; 3384 priv->params.tx_cq_moderation_usec = 3385 MLX5E_PARAMS_DEFAULT_TX_CQ_MODERATION_USEC; 3386 priv->params.tx_cq_moderation_pkts = 3387 MLX5E_PARAMS_DEFAULT_TX_CQ_MODERATION_PKTS; 3388 priv->params.min_rx_wqes = 3389 MLX5E_PARAMS_DEFAULT_MIN_RX_WQES; 3390 priv->params.rx_hash_log_tbl_sz = 3391 (order_base_2(num_comp_vectors) > 3392 MLX5E_PARAMS_DEFAULT_RX_HASH_LOG_TBL_SZ) ? 
3393 	    order_base_2(num_comp_vectors) :
3394 	    MLX5E_PARAMS_DEFAULT_RX_HASH_LOG_TBL_SZ;
3395 	priv->params.num_tc = 1;
3396 	priv->params.default_vlan_prio = 0;
3397 	priv->counter_set_id = -1;
3398 	priv->params.tx_max_inline = mlx5e_get_max_inline_cap(mdev);
3399 
3400 	err = mlx5_query_min_inline(mdev, &priv->params.tx_min_inline_mode);
3401 	if (err)
3402 		return (err);
3403 
3404 	/*
3405 	 * HW LRO currently defaults to off. Once that changes, the HW
3406 	 * capability "!!MLX5_CAP_ETH(mdev, lro_cap)" should be taken
3407 	 * into account here.
3408 	 */
3409 	priv->params.hw_lro_en = false;
3410 	priv->params.lro_wqe_sz = MLX5E_PARAMS_DEFAULT_LRO_WQE_SZ;
3411 
3412 	/*
3413 	 * CQE zipping currently defaults to off. Once that changes,
3414 	 * the HW capability "!!MLX5_CAP_GEN(mdev, cqe_compression)"
3415 	 * should be taken into account here.
3416 	 */
3417 	priv->params.cqe_zipping_en = false;
3418 
3419 	priv->mdev = mdev;
3420 	priv->params.num_channels = num_comp_vectors;
3421 	priv->params.channels_rsss = 1;
3422 	priv->order_base_2_num_channels = order_base_2(num_comp_vectors);
3423 	priv->queue_mapping_channel_mask =
3424 	    roundup_pow_of_two(num_comp_vectors) - 1;
3425 	priv->num_tc = priv->params.num_tc;
3426 	priv->default_vlan_prio = priv->params.default_vlan_prio;
3427 
3428 	INIT_WORK(&priv->update_stats_work, mlx5e_update_stats_work);
3429 	INIT_WORK(&priv->update_carrier_work, mlx5e_update_carrier_work);
3430 	INIT_WORK(&priv->set_rx_mode_work, mlx5e_set_rx_mode_work);
3431 
3432 	return (0);
3433 }
3434 
3435 static int
3436 mlx5e_create_mkey(struct mlx5e_priv *priv, u32 pdn,
3437     struct mlx5_core_mr *mkey)
3438 {
3439 	struct ifnet *ifp = priv->ifp;
3440 	struct mlx5_core_dev *mdev = priv->mdev;
3441 	int inlen = MLX5_ST_SZ_BYTES(create_mkey_in);
3442 	void *mkc;
3443 	u32 *in;
3444 	int err;
3445 
3446 	in = mlx5_vzalloc(inlen);
3447 	if (in == NULL) {
3448 		if_printf(ifp, "%s: failed to allocate inbox\n", __func__);
3449 		return (-ENOMEM);
3450 	}
3451 
3452 	mkc = MLX5_ADDR_OF(create_mkey_in, in, memory_key_mkey_entry);
3453 	MLX5_SET(mkc, mkc, access_mode, MLX5_ACCESS_MODE_PA);
3454 	MLX5_SET(mkc, mkc, lw, 1);
3455 	MLX5_SET(mkc, mkc, lr, 1);
3456 
3457 	MLX5_SET(mkc, mkc, pd, pdn);
3458 	MLX5_SET(mkc, mkc, length64, 1);
3459 	MLX5_SET(mkc, mkc, qpn, 0xffffff);
3460 
3461 	err = mlx5_core_create_mkey(mdev, mkey, in, inlen);
3462 	if (err)
3463 		if_printf(ifp, "%s: mlx5_core_create_mkey failed, %d\n",
3464 		    __func__, err);
3465 
3466 	kvfree(in);
3467 	return (err);
3468 }
3469 
3470 static const char *mlx5e_vport_stats_desc[] = {
3471 	MLX5E_VPORT_STATS(MLX5E_STATS_DESC)
3472 };
3473 
3474 static const char *mlx5e_pport_stats_desc[] = {
3475 	MLX5E_PPORT_STATS(MLX5E_STATS_DESC)
3476 };
3477 
3478 static void
3479 mlx5e_priv_mtx_init(struct mlx5e_priv *priv)
3480 {
3481 	mtx_init(&priv->async_events_mtx, "mlx5async", MTX_NETWORK_LOCK, MTX_DEF);
3482 	sx_init(&priv->state_lock, "mlx5state");
3483 	callout_init_mtx(&priv->watchdog, &priv->async_events_mtx, 0);
3484 	MLX5_INIT_DOORBELL_LOCK(&priv->doorbell_lock);
3485 }
3486 
3487 static void
3488 mlx5e_priv_mtx_destroy(struct mlx5e_priv *priv)
3489 {
3490 	mtx_destroy(&priv->async_events_mtx);
3491 	sx_destroy(&priv->state_lock);
3492 }
3493 
3494 static int
3495 sysctl_firmware(SYSCTL_HANDLER_ARGS)
3496 {
3497 	/*
3498 	 * "%d.%d.%d" is the format string.
3499 	 * fw_rev_{maj,min,sub} return u16; 2^16 = 65536, so at most
3500 	 * 5 chars are needed to store each component.
3501 	 * Together with the two "." separators and the terminating
	 * NUL, that means we need at most 18 (5*3 + 3) chars.
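	 * For example, the worst case "65535.65535.65535" occupies 17
	 * characters plus the terminating NUL.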
3502 	 */
3503 	char fw[18];
3504 	struct mlx5e_priv *priv = arg1;
3505 	int error;
3506 
3507 	snprintf(fw, sizeof(fw), "%d.%d.%d", fw_rev_maj(priv->mdev), fw_rev_min(priv->mdev),
3508 	    fw_rev_sub(priv->mdev));
3509 	error = sysctl_handle_string(oidp, fw, sizeof(fw), req);
3510 	return (error);
3511 }
3512 
3513 static void
3514 mlx5e_disable_tx_dma(struct mlx5e_channel *ch)
3515 {
3516 	int i;
3517 
3518 	for (i = 0; i < ch->num_tc; i++)
3519 		mlx5e_drain_sq(&ch->sq[i]);
3520 }
3521 
3522 static void
3523 mlx5e_reset_sq_doorbell_record(struct mlx5e_sq *sq)
3524 {
3525 
3526 	sq->doorbell.d32[0] = cpu_to_be32(MLX5_OPCODE_NOP);
3527 	sq->doorbell.d32[1] = cpu_to_be32(sq->sqn << 8);
3528 	mlx5e_tx_notify_hw(sq, sq->doorbell.d32, 0);
3529 	sq->doorbell.d64 = 0;
3530 }
3531 
3532 void
3533 mlx5e_resume_sq(struct mlx5e_sq *sq)
3534 {
3535 	int err;
3536 
3537 	/* check if already enabled */
3538 	if (READ_ONCE(sq->running) != 0)
3539 		return;
3540 
3541 	err = mlx5e_modify_sq(sq, MLX5_SQC_STATE_ERR,
3542 	    MLX5_SQC_STATE_RST);
3543 	if (err != 0) {
3544 		if_printf(sq->ifp,
3545 		    "mlx5e_modify_sq() from ERR to RST failed: %d\n", err);
3546 	}
3547 
3548 	sq->cc = 0;
3549 	sq->pc = 0;
3550 
3551 	/* reset doorbell prior to moving from RST to RDY */
3552 	mlx5e_reset_sq_doorbell_record(sq);
3553 
3554 	err = mlx5e_modify_sq(sq, MLX5_SQC_STATE_RST,
3555 	    MLX5_SQC_STATE_RDY);
3556 	if (err != 0) {
3557 		if_printf(sq->ifp,
3558 		    "mlx5e_modify_sq() from RST to RDY failed: %d\n", err);
3559 	}
3560 
3561 	sq->cev_next_state = MLX5E_CEV_STATE_INITIAL;
3562 	WRITE_ONCE(sq->running, 1);
3563 }
3564 
3565 static void
3566 mlx5e_enable_tx_dma(struct mlx5e_channel *ch)
3567 {
3568 	int i;
3569 
3570 	for (i = 0; i < ch->num_tc; i++)
3571 		mlx5e_resume_sq(&ch->sq[i]);
3572 }
3573 
3574 static void
3575 mlx5e_disable_rx_dma(struct mlx5e_channel *ch)
3576 {
3577 	struct mlx5e_rq *rq = &ch->rq;
3578 	int err;
3579 
3580 	mtx_lock(&rq->mtx);
3581 	rq->enabled = 0;
3582 	callout_stop(&rq->watchdog);
3583 	mtx_unlock(&rq->mtx);
3584 
3585 	callout_drain(&rq->watchdog);
3586 
3587 	err = mlx5e_modify_rq(rq, MLX5_RQC_STATE_RDY, MLX5_RQC_STATE_ERR);
3588 	if (err != 0) {
3589 		if_printf(rq->ifp,
3590 		    "mlx5e_modify_rq() from RDY to ERR failed: %d\n", err);
3591 	}
3592 
3593 	while (!mlx5_wq_ll_is_empty(&rq->wq)) {
3594 		msleep(1);
3595 		rq->cq.mcq.comp(&rq->cq.mcq);
3596 	}
3597 
3598 	/*
3599 	 * Transitioning into RST state will allow the FW to track fewer
3600 	 * ERR-state queues, thus reducing the receive queue flushing time.
3601 	 */
3602 	err = mlx5e_modify_rq(rq, MLX5_RQC_STATE_ERR, MLX5_RQC_STATE_RST);
3603 	if (err != 0) {
3604 		if_printf(rq->ifp,
3605 		    "mlx5e_modify_rq() from ERR to RST failed: %d\n", err);
3606 	}
3607 }
3608 
3609 static void
3610 mlx5e_enable_rx_dma(struct mlx5e_channel *ch)
3611 {
3612 	struct mlx5e_rq *rq = &ch->rq;
3613 	int err;
3614 
3615 	rq->wq.wqe_ctr = 0;
3616 	mlx5_wq_ll_update_db_record(&rq->wq);
3617 	err = mlx5e_modify_rq(rq, MLX5_RQC_STATE_RST, MLX5_RQC_STATE_RDY);
3618 	if (err != 0) {
3619 		if_printf(rq->ifp,
3620 		    "mlx5e_modify_rq() from RST to RDY failed: %d\n", err);
3621 	}
3622 
3623 	rq->enabled = 1;
3624 
3625 	rq->cq.mcq.comp(&rq->cq.mcq);
3626 }
3627 
3628 void
3629 mlx5e_modify_tx_dma(struct mlx5e_priv *priv, uint8_t value)
3630 {
3631 	int i;
3632 
3633 	if (test_bit(MLX5E_STATE_OPENED, &priv->state) == 0)
3634 		return;
3635 
3636 	for (i = 0; i < priv->params.num_channels; i++) {
3637 		if (value)
3638 			mlx5e_disable_tx_dma(&priv->channel[i]);
3639 		else
3640 			mlx5e_enable_tx_dma(&priv->channel[i]);
3641 	}
3642 }
3643 
3644 void
3645 mlx5e_modify_rx_dma(struct mlx5e_priv *priv, uint8_t value)
3646 {
3647 	int
i; 3648 3649 if (test_bit(MLX5E_STATE_OPENED, &priv->state) == 0) 3650 return; 3651 3652 for (i = 0; i < priv->params.num_channels; i++) { 3653 if (value) 3654 mlx5e_disable_rx_dma(&priv->channel[i]); 3655 else 3656 mlx5e_enable_rx_dma(&priv->channel[i]); 3657 } 3658} 3659 3660static void 3661mlx5e_add_hw_stats(struct mlx5e_priv *priv) 3662{ 3663 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(priv->sysctl_hw), 3664 OID_AUTO, "fw_version", CTLTYPE_STRING | CTLFLAG_RD, priv, 0, 3665 sysctl_firmware, "A", "HCA firmware version"); 3666 3667 SYSCTL_ADD_STRING(&priv->sysctl_ctx, SYSCTL_CHILDREN(priv->sysctl_hw), 3668 OID_AUTO, "board_id", CTLFLAG_RD, priv->mdev->board_id, 0, 3669 "Board ID"); 3670} 3671 3672static int 3673mlx5e_sysctl_tx_priority_flow_control(SYSCTL_HANDLER_ARGS) 3674{ 3675 struct mlx5e_priv *priv = arg1; 3676 uint8_t temp[MLX5E_MAX_PRIORITY]; 3677 uint32_t tx_pfc; 3678 int err; 3679 int i; 3680 3681 PRIV_LOCK(priv); 3682 3683 tx_pfc = priv->params.tx_priority_flow_control; 3684 3685 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) 3686 temp[i] = (tx_pfc >> i) & 1; 3687 3688 err = SYSCTL_OUT(req, temp, MLX5E_MAX_PRIORITY); 3689 if (err || !req->newptr) 3690 goto done; 3691 err = SYSCTL_IN(req, temp, MLX5E_MAX_PRIORITY); 3692 if (err) 3693 goto done; 3694 3695 priv->params.tx_priority_flow_control = 0; 3696 3697 /* range check input value */ 3698 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) { 3699 if (temp[i] > 1) { 3700 err = ERANGE; 3701 goto done; 3702 } 3703 priv->params.tx_priority_flow_control |= (temp[i] << i); 3704 } 3705 3706 /* check if update is required */ 3707 if (tx_pfc != priv->params.tx_priority_flow_control) 3708 err = -mlx5e_set_port_pfc(priv); 3709done: 3710 if (err != 0) 3711 priv->params.tx_priority_flow_control= tx_pfc; 3712 PRIV_UNLOCK(priv); 3713 3714 return (err); 3715} 3716 3717static int 3718mlx5e_sysctl_rx_priority_flow_control(SYSCTL_HANDLER_ARGS) 3719{ 3720 struct mlx5e_priv *priv = arg1; 3721 uint8_t temp[MLX5E_MAX_PRIORITY]; 3722 uint32_t rx_pfc; 3723 int err; 3724 int i; 3725 3726 PRIV_LOCK(priv); 3727 3728 rx_pfc = priv->params.rx_priority_flow_control; 3729 3730 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) 3731 temp[i] = (rx_pfc >> i) & 1; 3732 3733 err = SYSCTL_OUT(req, temp, MLX5E_MAX_PRIORITY); 3734 if (err || !req->newptr) 3735 goto done; 3736 err = SYSCTL_IN(req, temp, MLX5E_MAX_PRIORITY); 3737 if (err) 3738 goto done; 3739 3740 priv->params.rx_priority_flow_control = 0; 3741 3742 /* range check input value */ 3743 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) { 3744 if (temp[i] > 1) { 3745 err = ERANGE; 3746 goto done; 3747 } 3748 priv->params.rx_priority_flow_control |= (temp[i] << i); 3749 } 3750 3751 /* check if update is required */ 3752 if (rx_pfc != priv->params.rx_priority_flow_control) 3753 err = -mlx5e_set_port_pfc(priv); 3754done: 3755 if (err != 0) 3756 priv->params.rx_priority_flow_control= rx_pfc; 3757 PRIV_UNLOCK(priv); 3758 3759 return (err); 3760} 3761 3762static void 3763mlx5e_setup_pauseframes(struct mlx5e_priv *priv) 3764{ 3765#if (__FreeBSD_version < 1100000) 3766 char path[96]; 3767#endif 3768 int error; 3769 3770 /* enable pauseframes by default */ 3771 priv->params.tx_pauseframe_control = 1; 3772 priv->params.rx_pauseframe_control = 1; 3773 3774 /* disable ports flow control, PFC, by default */ 3775 priv->params.tx_priority_flow_control = 0; 3776 priv->params.rx_priority_flow_control = 0; 3777 3778#if (__FreeBSD_version < 1100000) 3779 /* compute path for sysctl */ 3780 snprintf(path, sizeof(path), 
"dev.mce.%d.tx_pauseframe_control", 3781 device_get_unit(priv->mdev->pdev->dev.bsddev)); 3782 3783 /* try to fetch tunable, if any */ 3784 TUNABLE_INT_FETCH(path, &priv->params.tx_pauseframe_control); 3785 3786 /* compute path for sysctl */ 3787 snprintf(path, sizeof(path), "dev.mce.%d.rx_pauseframe_control", 3788 device_get_unit(priv->mdev->pdev->dev.bsddev)); 3789 3790 /* try to fetch tunable, if any */ 3791 TUNABLE_INT_FETCH(path, &priv->params.rx_pauseframe_control); 3792#endif 3793 3794 /* register pauseframe SYSCTLs */ 3795 SYSCTL_ADD_INT(&priv->sysctl_ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet), 3796 OID_AUTO, "tx_pauseframe_control", CTLFLAG_RDTUN, 3797 &priv->params.tx_pauseframe_control, 0, 3798 "Set to enable TX pause frames. Clear to disable."); 3799 3800 SYSCTL_ADD_INT(&priv->sysctl_ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet), 3801 OID_AUTO, "rx_pauseframe_control", CTLFLAG_RDTUN, 3802 &priv->params.rx_pauseframe_control, 0, 3803 "Set to enable RX pause frames. Clear to disable."); 3804 3805 /* register priority flow control, PFC, SYSCTLs */ 3806 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet), 3807 OID_AUTO, "tx_priority_flow_control", CTLTYPE_U8 | CTLFLAG_RWTUN | 3808 CTLFLAG_MPSAFE, priv, 0, &mlx5e_sysctl_tx_priority_flow_control, "CU", 3809 "Set to enable TX ports flow control frames for priorities 0..7. Clear to disable."); 3810 3811 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet), 3812 OID_AUTO, "rx_priority_flow_control", CTLTYPE_U8 | CTLFLAG_RWTUN | 3813 CTLFLAG_MPSAFE, priv, 0, &mlx5e_sysctl_rx_priority_flow_control, "CU", 3814 "Set to enable RX ports flow control frames for priorities 0..7. Clear to disable."); 3815 3816 PRIV_LOCK(priv); 3817 3818 /* range check */ 3819 priv->params.tx_pauseframe_control = 3820 priv->params.tx_pauseframe_control ? 1 : 0; 3821 priv->params.rx_pauseframe_control = 3822 priv->params.rx_pauseframe_control ? 
1 : 0; 3823 3824 /* update firmware */ 3825 error = mlx5e_set_port_pause_and_pfc(priv); 3826 if (error == -EINVAL) { 3827 if_printf(priv->ifp, 3828 "Global pauseframes must be disabled before enabling PFC.\n"); 3829 priv->params.rx_priority_flow_control = 0; 3830 priv->params.tx_priority_flow_control = 0; 3831 3832 /* update firmware */ 3833 (void) mlx5e_set_port_pause_and_pfc(priv); 3834 } 3835 PRIV_UNLOCK(priv); 3836} 3837 3838static void * 3839mlx5e_create_ifp(struct mlx5_core_dev *mdev) 3840{ 3841 struct ifnet *ifp; 3842 struct mlx5e_priv *priv; 3843 u8 dev_addr[ETHER_ADDR_LEN] __aligned(4); 3844 u8 connector_type; 3845 struct sysctl_oid_list *child; 3846 int ncv = mdev->priv.eq_table.num_comp_vectors; 3847 char unit[16]; 3848 int err; 3849 int i,j; 3850 u32 eth_proto_cap; 3851 u32 out[MLX5_ST_SZ_DW(ptys_reg)]; 3852 bool ext = 0; 3853 u32 speeds_num; 3854 struct media media_entry = {}; 3855 3856 if (mlx5e_check_required_hca_cap(mdev)) { 3857 mlx5_core_dbg(mdev, "mlx5e_check_required_hca_cap() failed\n"); 3858 return (NULL); 3859 } 3860 /* 3861 * Try to allocate the priv and make room for worst-case 3862 * number of channel structures: 3863 */ 3864 priv = malloc(sizeof(*priv) + 3865 (sizeof(priv->channel[0]) * mdev->priv.eq_table.num_comp_vectors), 3866 M_MLX5EN, M_WAITOK | M_ZERO); 3867 mlx5e_priv_mtx_init(priv); 3868 3869 ifp = priv->ifp = if_alloc(IFT_ETHER); 3870 if (ifp == NULL) { 3871 mlx5_core_err(mdev, "if_alloc() failed\n"); 3872 goto err_free_priv; 3873 } 3874 ifp->if_softc = priv; 3875 if_initname(ifp, "mce", device_get_unit(mdev->pdev->dev.bsddev)); 3876 ifp->if_mtu = ETHERMTU; 3877 ifp->if_init = mlx5e_open; 3878 ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST; 3879 ifp->if_ioctl = mlx5e_ioctl; 3880 ifp->if_transmit = mlx5e_xmit; 3881 ifp->if_qflush = if_qflush; 3882#if (__FreeBSD_version >= 1100000) 3883 ifp->if_get_counter = mlx5e_get_counter; 3884#endif 3885 ifp->if_snd.ifq_maxlen = ifqmaxlen; 3886 /* 3887 * Set driver features 3888 */ 3889 ifp->if_capabilities |= IFCAP_HWCSUM | IFCAP_HWCSUM_IPV6; 3890 ifp->if_capabilities |= IFCAP_VLAN_MTU | IFCAP_VLAN_HWTAGGING; 3891 ifp->if_capabilities |= IFCAP_VLAN_HWCSUM | IFCAP_VLAN_HWFILTER; 3892 ifp->if_capabilities |= IFCAP_LINKSTATE | IFCAP_JUMBO_MTU; 3893 ifp->if_capabilities |= IFCAP_LRO; 3894 ifp->if_capabilities |= IFCAP_TSO | IFCAP_VLAN_HWTSO; 3895 ifp->if_capabilities |= IFCAP_HWSTATS; 3896 3897 /* set TSO limits so that we don't have to drop TX packets */ 3898 ifp->if_hw_tsomax = MLX5E_MAX_TX_PAYLOAD_SIZE - (ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN); 3899 ifp->if_hw_tsomaxsegcount = MLX5E_MAX_TX_MBUF_FRAGS - 1 /* hdr */; 3900 ifp->if_hw_tsomaxsegsize = MLX5E_MAX_TX_MBUF_SIZE; 3901 3902 ifp->if_capenable = ifp->if_capabilities; 3903 ifp->if_hwassist = 0; 3904 if (ifp->if_capenable & IFCAP_TSO) 3905 ifp->if_hwassist |= CSUM_TSO; 3906 if (ifp->if_capenable & IFCAP_TXCSUM) 3907 ifp->if_hwassist |= (CSUM_TCP | CSUM_UDP | CSUM_IP); 3908 if (ifp->if_capenable & IFCAP_TXCSUM_IPV6) 3909 ifp->if_hwassist |= (CSUM_UDP_IPV6 | CSUM_TCP_IPV6); 3910 3911 /* ifnet sysctl tree */ 3912 sysctl_ctx_init(&priv->sysctl_ctx); 3913 priv->sysctl_ifnet = SYSCTL_ADD_NODE(&priv->sysctl_ctx, SYSCTL_STATIC_CHILDREN(_dev), 3914 OID_AUTO, ifp->if_dname, CTLFLAG_RD, 0, "MLX5 ethernet - interface name"); 3915 if (priv->sysctl_ifnet == NULL) { 3916 mlx5_core_err(mdev, "SYSCTL_ADD_NODE() failed\n"); 3917 goto err_free_sysctl; 3918 } 3919 snprintf(unit, sizeof(unit), "%d", ifp->if_dunit); 3920 priv->sysctl_ifnet = SYSCTL_ADD_NODE(&priv->sysctl_ctx, 
	    SYSCTL_CHILDREN(priv->sysctl_ifnet),
3921 	    OID_AUTO, unit, CTLFLAG_RD, 0, "MLX5 ethernet - interface unit");
3922 	if (priv->sysctl_ifnet == NULL) {
3923 		mlx5_core_err(mdev, "SYSCTL_ADD_NODE() failed\n");
3924 		goto err_free_sysctl;
3925 	}
3926 
3927 	/* HW sysctl tree */
3928 	child = SYSCTL_CHILDREN(device_get_sysctl_tree(mdev->pdev->dev.bsddev));
3929 	priv->sysctl_hw = SYSCTL_ADD_NODE(&priv->sysctl_ctx, child,
3930 	    OID_AUTO, "hw", CTLFLAG_RD, 0, "MLX5 ethernet dev hw");
3931 	if (priv->sysctl_hw == NULL) {
3932 		mlx5_core_err(mdev, "SYSCTL_ADD_NODE() failed\n");
3933 		goto err_free_sysctl;
3934 	}
3935 
3936 	err = mlx5e_build_ifp_priv(mdev, priv, ncv);
3937 	if (err) {
3938 		mlx5_core_err(mdev, "mlx5e_build_ifp_priv() failed (%d)\n", err);
3939 		goto err_free_sysctl;
3940 	}
3941 
3942 	/* reuse mlx5core's watchdog workqueue */
3943 	priv->wq = mdev->priv.health.wq_watchdog;
3944 
3945 	err = mlx5_alloc_map_uar(mdev, &priv->cq_uar);
3946 	if (err) {
3947 		if_printf(ifp, "%s: mlx5_alloc_map_uar failed, %d\n",
3948 		    __func__, err);
3949 		goto err_free_wq;
3950 	}
3951 	err = mlx5_core_alloc_pd(mdev, &priv->pdn);
3952 	if (err) {
3953 		if_printf(ifp, "%s: mlx5_core_alloc_pd failed, %d\n",
3954 		    __func__, err);
3955 		goto err_unmap_free_uar;
3956 	}
3957 	err = mlx5_alloc_transport_domain(mdev, &priv->tdn);
3958 	if (err) {
3959 		if_printf(ifp, "%s: mlx5_alloc_transport_domain failed, %d\n",
3960 		    __func__, err);
3961 		goto err_dealloc_pd;
3962 	}
3963 	err = mlx5e_create_mkey(priv, priv->pdn, &priv->mr);
3964 	if (err) {
3965 		if_printf(ifp, "%s: mlx5e_create_mkey failed, %d\n",
3966 		    __func__, err);
3967 		goto err_dealloc_transport_domain;
3968 	}
3969 	mlx5_query_nic_vport_mac_address(priv->mdev, 0, dev_addr);
3970 
3971 	/* check if we should generate a random MAC address */
3972 	if (MLX5_CAP_GEN(priv->mdev, vport_group_manager) == 0 &&
3973 	    is_zero_ether_addr(dev_addr)) {
3974 		random_ether_addr(dev_addr);
3975 		if_printf(ifp, "Assigned random MAC address\n");
3976 	}
3977 
3978 	/* set default MTU */
3979 	mlx5e_set_dev_port_mtu(ifp, ifp->if_mtu);
3980 
3981 	/* Set default media status */
3982 	priv->media_status_last = IFM_AVALID;
3983 	priv->media_active_last = IFM_ETHER | IFM_AUTO |
3984 	    IFM_ETH_RXPAUSE | IFM_FDX;
3985 
3986 	/* setup default pauseframes configuration */
3987 	mlx5e_setup_pauseframes(priv);
3988 
3989 	/* Setup supported medias */
3990 	/* TODO: If the PTYS query fails, is it OK to proceed? */
3991 	err = mlx5_query_port_ptys(mdev, out, sizeof(out), MLX5_PTYS_EN, 1);
	if (err == 0) {
3992 		ext = MLX5_CAP_PCAM_FEATURE(mdev,
3993 		    ptys_extended_ethernet);
3994 		eth_proto_cap = MLX5_GET_ETH_PROTO(ptys_reg, out, ext,
3995 		    eth_proto_capability);
3996 		if (MLX5_CAP_PCAM_FEATURE(mdev, ptys_connector_type))
3997 			connector_type = MLX5_GET(ptys_reg, out,
3998 			    connector_type);
3999 	} else {
4000 		eth_proto_cap = 0;
4001 		if_printf(ifp, "%s: Query port media capability failed,"
4002 		    " %d\n", __func__, err);
4003 	}
4004 
4005 	ifmedia_init(&priv->media, IFM_IMASK | IFM_ETH_FMASK,
4006 	    mlx5e_media_change, mlx5e_media_status);
4007 
4008 	speeds_num = ext ? MLX5E_EXT_LINK_SPEEDS_NUMBER : MLX5E_LINK_SPEEDS_NUMBER;
4009 	for (i = 0; i != speeds_num; i++) {
4010 		for (j = 0; j < MLX5E_LINK_MODES_NUMBER; ++j) {
4011 			media_entry = ext ?
mlx5e_ext_mode_table[i][j] : 4012 mlx5e_mode_table[i][j]; 4013 if (media_entry.baudrate == 0) 4014 continue; 4015 if (MLX5E_PROT_MASK(i) & eth_proto_cap) { 4016 ifmedia_add(&priv->media, 4017 media_entry.subtype | 4018 IFM_ETHER, 0, NULL); 4019 ifmedia_add(&priv->media, 4020 media_entry.subtype | 4021 IFM_ETHER | IFM_FDX | 4022 IFM_ETH_RXPAUSE | IFM_ETH_TXPAUSE, 0, NULL); 4023 } 4024 } 4025 } 4026 4027 ifmedia_add(&priv->media, IFM_ETHER | IFM_AUTO, 0, NULL); 4028 ifmedia_add(&priv->media, IFM_ETHER | IFM_AUTO | IFM_FDX | 4029 IFM_ETH_RXPAUSE | IFM_ETH_TXPAUSE, 0, NULL); 4030 4031 /* Set autoselect by default */ 4032 ifmedia_set(&priv->media, IFM_ETHER | IFM_AUTO | IFM_FDX | 4033 IFM_ETH_RXPAUSE | IFM_ETH_TXPAUSE); 4034 ether_ifattach(ifp, dev_addr); 4035 4036 /* Register for VLAN events */ 4037 priv->vlan_attach = EVENTHANDLER_REGISTER(vlan_config, 4038 mlx5e_vlan_rx_add_vid, priv, EVENTHANDLER_PRI_FIRST); 4039 priv->vlan_detach = EVENTHANDLER_REGISTER(vlan_unconfig, 4040 mlx5e_vlan_rx_kill_vid, priv, EVENTHANDLER_PRI_FIRST); 4041 4042 /* Link is down by default */ 4043 if_link_state_change(ifp, LINK_STATE_DOWN); 4044 4045 mlx5e_enable_async_events(priv); 4046 4047 mlx5e_add_hw_stats(priv); 4048 4049 mlx5e_create_stats(&priv->stats.vport.ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet), 4050 "vstats", mlx5e_vport_stats_desc, MLX5E_VPORT_STATS_NUM, 4051 priv->stats.vport.arg); 4052 4053 mlx5e_create_stats(&priv->stats.pport.ctx, SYSCTL_CHILDREN(priv->sysctl_ifnet), 4054 "pstats", mlx5e_pport_stats_desc, MLX5E_PPORT_STATS_NUM, 4055 priv->stats.pport.arg); 4056 4057 mlx5e_create_ethtool(priv); 4058 4059 mtx_lock(&priv->async_events_mtx); 4060 mlx5e_update_stats(priv); 4061 mtx_unlock(&priv->async_events_mtx); 4062 4063 return (priv); 4064 4065err_dealloc_transport_domain: 4066 mlx5_dealloc_transport_domain(mdev, priv->tdn); 4067 4068err_dealloc_pd: 4069 mlx5_core_dealloc_pd(mdev, priv->pdn); 4070 4071err_unmap_free_uar: 4072 mlx5_unmap_free_uar(mdev, &priv->cq_uar); 4073 4074err_free_wq: 4075 flush_workqueue(priv->wq); 4076 4077err_free_sysctl: 4078 sysctl_ctx_free(&priv->sysctl_ctx); 4079 if (priv->sysctl_debug) 4080 sysctl_ctx_free(&priv->stats.port_stats_debug.ctx); 4081 if_free(ifp); 4082 4083err_free_priv: 4084 mlx5e_priv_mtx_destroy(priv); 4085 free(priv, M_MLX5EN); 4086 return (NULL); 4087} 4088 4089static void 4090mlx5e_destroy_ifp(struct mlx5_core_dev *mdev, void *vpriv) 4091{ 4092 struct mlx5e_priv *priv = vpriv; 4093 struct ifnet *ifp = priv->ifp; 4094 4095 /* don't allow more IOCTLs */ 4096 priv->gone = 1; 4097 4098 /* XXX wait a bit to allow IOCTL handlers to complete */ 4099 pause("W", hz); 4100 4101 /* stop watchdog timer */ 4102 callout_drain(&priv->watchdog); 4103 4104 if (priv->vlan_attach != NULL) 4105 EVENTHANDLER_DEREGISTER(vlan_config, priv->vlan_attach); 4106 if (priv->vlan_detach != NULL) 4107 EVENTHANDLER_DEREGISTER(vlan_unconfig, priv->vlan_detach); 4108 4109 /* make sure device gets closed */ 4110 PRIV_LOCK(priv); 4111 mlx5e_close_locked(ifp); 4112 PRIV_UNLOCK(priv); 4113 4114 /* unregister device */ 4115 ifmedia_removeall(&priv->media); 4116 ether_ifdetach(ifp); 4117 if_free(ifp); 4118 4119 /* destroy all remaining sysctl nodes */ 4120 sysctl_ctx_free(&priv->stats.vport.ctx); 4121 sysctl_ctx_free(&priv->stats.pport.ctx); 4122 if (priv->sysctl_debug) 4123 sysctl_ctx_free(&priv->stats.port_stats_debug.ctx); 4124 sysctl_ctx_free(&priv->sysctl_ctx); 4125 4126 mlx5_core_destroy_mkey(priv->mdev, &priv->mr); 4127 mlx5_dealloc_transport_domain(priv->mdev, priv->tdn); 4128 
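	/*
	 * Editorial note: this teardown mirrors mlx5e_create_ifp() in
	 * reverse order; the mkey and transport domain released above
	 * are followed by the PD and the UAR mapping below.
	 */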
mlx5_core_dealloc_pd(priv->mdev, priv->pdn); 4129 mlx5_unmap_free_uar(priv->mdev, &priv->cq_uar); 4130 mlx5e_disable_async_events(priv); 4131 flush_workqueue(priv->wq); 4132 mlx5e_priv_mtx_destroy(priv); 4133 free(priv, M_MLX5EN); 4134} 4135 4136static void * 4137mlx5e_get_ifp(void *vpriv) 4138{ 4139 struct mlx5e_priv *priv = vpriv; 4140 4141 return (priv->ifp); 4142} 4143 4144static struct mlx5_interface mlx5e_interface = { 4145 .add = mlx5e_create_ifp, 4146 .remove = mlx5e_destroy_ifp, 4147 .event = mlx5e_async_event, 4148 .protocol = MLX5_INTERFACE_PROTOCOL_ETH, 4149 .get_dev = mlx5e_get_ifp, 4150}; 4151 4152void 4153mlx5e_init(void) 4154{ 4155 mlx5_register_interface(&mlx5e_interface); 4156} 4157 4158void 4159mlx5e_cleanup(void) 4160{ 4161 mlx5_unregister_interface(&mlx5e_interface); 4162} 4163 4164static void 4165mlx5e_show_version(void __unused *arg) 4166{ 4167 4168 printf("%s", mlx5e_version); 4169} 4170SYSINIT(mlx5e_show_version, SI_SUB_DRIVERS, SI_ORDER_ANY, mlx5e_show_version, NULL); 4171 4172module_init_order(mlx5e_init, SI_ORDER_THIRD); 4173module_exit_order(mlx5e_cleanup, SI_ORDER_THIRD); 4174 4175#if (__FreeBSD_version >= 1100000) 4176MODULE_DEPEND(mlx5en, linuxkpi, 1, 1, 1); 4177#endif 4178MODULE_DEPEND(mlx5en, mlx5, 1, 1, 1); 4179MODULE_VERSION(mlx5en, 1); 4180
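/*
 * Editorial example (not part of the driver, compiled out): a minimal
 * user-space exerciser for the SIOCGI2C handler implemented above. The
 * interface name "mce0" is an assumption for illustration. The handler
 * maps I2C address 0xA0 to MLX5E_I2C_ADDR_LOW and rejects requests
 * longer than sizeof(i2c.data), so a single request reads at most that
 * many bytes of the module EEPROM.
 */
#if 0
#include <sys/types.h>
#include <sys/ioctl.h>
#include <sys/socket.h>
#include <sys/sockio.h>
#include <net/if.h>
#include <stdio.h>
#include <string.h>
#include <unistd.h>

int
main(void)
{
	struct ifreq ifr;
	struct ifi2creq i2c;
	int s, i;

	s = socket(AF_LOCAL, SOCK_DGRAM, 0);
	if (s < 0)
		return (1);
	memset(&ifr, 0, sizeof(ifr));
	memset(&i2c, 0, sizeof(i2c));
	strlcpy(ifr.ifr_name, "mce0", sizeof(ifr.ifr_name));
	i2c.dev_addr = 0xA0;		/* mapped to MLX5E_I2C_ADDR_LOW */
	i2c.offset = 0;			/* start of the module ID page */
	i2c.len = sizeof(i2c.data);	/* stay within the request buffer */
	ifr.ifr_data = (caddr_t)&i2c;
	if (ioctl(s, SIOCGI2C, &ifr) == -1) {
		perror("SIOCGI2C");
		close(s);
		return (1);
	}
	for (i = 0; i < i2c.len; i++)
		printf("%02x ", i2c.data[i]);
	printf("\n");
	close(s);
	return (0);
}
#endif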