1/* 2 * Copyright (c) 2017, Mellanox Technologies. All rights reserved. 3 * 4 * This software is available to you under a choice of one of two 5 * licenses. You may choose to be licensed under the terms of the GNU 6 * General Public License (GPL) Version 2, available from the file 7 * COPYING in the main directory of this source tree, or the 8 * OpenIB.org BSD license below: 9 * 10 * Redistribution and use in source and binary forms, with or 11 * without modification, are permitted provided that the following 12 * conditions are met: 13 * 14 * - Redistributions of source code must retain the above 15 * copyright notice, this list of conditions and the following 16 * disclaimer. 17 * 18 * - Redistributions in binary form must reproduce the above 19 * copyright notice, this list of conditions and the following 20 * disclaimer in the documentation and/or other materials 21 * provided with the distribution. 22 * 23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 30 * SOFTWARE. 31 */ 32 33#include <rdma/ib_verbs.h> 34#include <linux/mlx5/fs.h> 35#include "en.h" 36#include "en/params.h" 37#include "ipoib.h" 38#include "en/fs_ethtool.h" 39 40#define IB_DEFAULT_Q_KEY 0xb1b 41#define MLX5I_PARAMS_DEFAULT_LOG_RQ_SIZE 9 42 43static int mlx5i_open(struct net_device *netdev); 44static int mlx5i_close(struct net_device *netdev); 45static int mlx5i_change_mtu(struct net_device *netdev, int new_mtu); 46 47static const struct net_device_ops mlx5i_netdev_ops = { 48 .ndo_open = mlx5i_open, 49 .ndo_stop = mlx5i_close, 50 .ndo_get_stats64 = mlx5i_get_stats, 51 .ndo_init = mlx5i_dev_init, 52 .ndo_uninit = mlx5i_dev_cleanup, 53 .ndo_change_mtu = mlx5i_change_mtu, 54 .ndo_eth_ioctl = mlx5i_ioctl, 55}; 56 57/* IPoIB mlx5 netdev profile */ 58static void mlx5i_build_nic_params(struct mlx5_core_dev *mdev, 59 struct mlx5e_params *params) 60{ 61 /* Override RQ params as IPoIB supports only LINKED LIST RQ for now */ 62 MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_STRIDING_RQ, false); 63 mlx5e_set_rq_type(mdev, params); 64 mlx5e_init_rq_type_params(mdev, params); 65 66 /* RQ size in ipoib by default is 512 */ 67 params->log_rq_mtu_frames = is_kdump_kernel() ? 68 MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE : 69 MLX5I_PARAMS_DEFAULT_LOG_RQ_SIZE; 70 71 params->packet_merge.type = MLX5E_PACKET_MERGE_NONE; 72 params->hard_mtu = MLX5_IB_GRH_BYTES + MLX5_IPOIB_HARD_LEN; 73 74 /* CQE compression is not supported for IPoIB */ 75 params->rx_cqe_compress_def = false; 76 MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_CQE_COMPRESS, params->rx_cqe_compress_def); 77} 78 79/* Called directly after IPoIB netdevice was created to initialize SW structs */ 80int mlx5i_init(struct mlx5_core_dev *mdev, struct net_device *netdev) 81{ 82 struct mlx5e_priv *priv = mlx5i_epriv(netdev); 83 84 netif_carrier_off(netdev); 85 mlx5e_set_netdev_mtu_boundaries(priv); 86 netdev->mtu = netdev->max_mtu; 87 88 mlx5e_build_nic_params(priv, NULL, netdev->mtu); 89 mlx5i_build_nic_params(mdev, &priv->channels.params); 90 91 mlx5e_timestamp_init(priv); 92 93 /* netdev init */ 94 netdev->hw_features |= NETIF_F_SG; 95 netdev->hw_features |= NETIF_F_IP_CSUM; 96 netdev->hw_features |= NETIF_F_IPV6_CSUM; 97 netdev->hw_features |= NETIF_F_GRO; 98 netdev->hw_features |= NETIF_F_TSO; 99 netdev->hw_features |= NETIF_F_TSO6; 100 netdev->hw_features |= NETIF_F_RXCSUM; 101 netdev->hw_features |= NETIF_F_RXHASH; 102 103 netdev->netdev_ops = &mlx5i_netdev_ops; 104 netdev->ethtool_ops = &mlx5i_ethtool_ops; 105 106 return 0; 107} 108 109/* Called directly before IPoIB netdevice is destroyed to cleanup SW structs */ 110void mlx5i_cleanup(struct mlx5e_priv *priv) 111{ 112 mlx5e_priv_cleanup(priv); 113} 114 115static void mlx5i_grp_sw_update_stats(struct mlx5e_priv *priv) 116{ 117 struct rtnl_link_stats64 s = {}; 118 int i, j; 119 120 for (i = 0; i < priv->stats_nch; i++) { 121 struct mlx5e_channel_stats *channel_stats; 122 struct mlx5e_rq_stats *rq_stats; 123 124 channel_stats = priv->channel_stats[i]; 125 rq_stats = &channel_stats->rq; 126 127 s.rx_packets += rq_stats->packets; 128 s.rx_bytes += rq_stats->bytes; 129 130 for (j = 0; j < priv->max_opened_tc; j++) { 131 struct mlx5e_sq_stats *sq_stats = &channel_stats->sq[j]; 132 133 s.tx_packets += sq_stats->packets; 134 s.tx_bytes += sq_stats->bytes; 135 s.tx_dropped += sq_stats->dropped; 136 } 137 } 138 139 memset(&priv->stats.sw, 0, sizeof(s)); 140 141 priv->stats.sw.rx_packets = s.rx_packets; 142 priv->stats.sw.rx_bytes = s.rx_bytes; 143 priv->stats.sw.tx_packets = s.tx_packets; 144 priv->stats.sw.tx_bytes = s.tx_bytes; 145 priv->stats.sw.tx_queue_dropped = s.tx_dropped; 146} 147 148void mlx5i_get_stats(struct net_device *dev, struct rtnl_link_stats64 *stats) 149{ 150 struct mlx5e_priv *priv = mlx5i_epriv(dev); 151 struct mlx5e_sw_stats *sstats = &priv->stats.sw; 152 153 mlx5i_grp_sw_update_stats(priv); 154 155 stats->rx_packets = sstats->rx_packets; 156 stats->rx_bytes = sstats->rx_bytes; 157 stats->tx_packets = sstats->tx_packets; 158 stats->tx_bytes = sstats->tx_bytes; 159 stats->tx_dropped = sstats->tx_queue_dropped; 160} 161 162struct net_device *mlx5i_parent_get(struct net_device *netdev) 163{ 164 struct mlx5e_priv *priv = mlx5i_epriv(netdev); 165 struct mlx5i_priv *ipriv, *parent_ipriv; 166 struct net_device *parent_dev; 167 int parent_ifindex; 168 169 ipriv = priv->ppriv; 170 171 parent_ifindex = netdev->netdev_ops->ndo_get_iflink(netdev); 172 parent_dev = dev_get_by_index(dev_net(netdev), parent_ifindex); 173 if (!parent_dev) 174 return NULL; 175 176 parent_ipriv = netdev_priv(parent_dev); 177 178 ASSERT_RTNL(); 179 parent_ipriv->num_sub_interfaces++; 180 181 ipriv->parent_dev = parent_dev; 182 183 return parent_dev; 184} 185 186void mlx5i_parent_put(struct net_device *netdev) 187{ 188 struct mlx5e_priv *priv = mlx5i_epriv(netdev); 189 struct mlx5i_priv *ipriv, *parent_ipriv; 190 191 ipriv = priv->ppriv; 192 parent_ipriv = netdev_priv(ipriv->parent_dev); 193 194 ASSERT_RTNL(); 195 parent_ipriv->num_sub_interfaces--; 196 197 dev_put(ipriv->parent_dev); 198} 199 200int mlx5i_init_underlay_qp(struct mlx5e_priv *priv) 201{ 202 struct mlx5_core_dev *mdev = priv->mdev; 203 struct mlx5i_priv *ipriv = priv->ppriv; 204 int ret; 205 206 { 207 u32 in[MLX5_ST_SZ_DW(rst2init_qp_in)] = {}; 208 u32 *qpc; 209 210 qpc = MLX5_ADDR_OF(rst2init_qp_in, in, qpc); 211 212 MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED); 213 MLX5_SET(qpc, qpc, primary_address_path.pkey_index, 214 ipriv->pkey_index); 215 MLX5_SET(qpc, qpc, primary_address_path.vhca_port_num, 1); 216 MLX5_SET(qpc, qpc, q_key, IB_DEFAULT_Q_KEY); 217 218 MLX5_SET(rst2init_qp_in, in, opcode, MLX5_CMD_OP_RST2INIT_QP); 219 MLX5_SET(rst2init_qp_in, in, qpn, ipriv->qpn); 220 ret = mlx5_cmd_exec_in(mdev, rst2init_qp, in); 221 if (ret) 222 goto err_qp_modify_to_err; 223 } 224 { 225 u32 in[MLX5_ST_SZ_DW(init2rtr_qp_in)] = {}; 226 227 MLX5_SET(init2rtr_qp_in, in, opcode, MLX5_CMD_OP_INIT2RTR_QP); 228 MLX5_SET(init2rtr_qp_in, in, qpn, ipriv->qpn); 229 ret = mlx5_cmd_exec_in(mdev, init2rtr_qp, in); 230 if (ret) 231 goto err_qp_modify_to_err; 232 } 233 { 234 u32 in[MLX5_ST_SZ_DW(rtr2rts_qp_in)] = {}; 235 236 MLX5_SET(rtr2rts_qp_in, in, opcode, MLX5_CMD_OP_RTR2RTS_QP); 237 MLX5_SET(rtr2rts_qp_in, in, qpn, ipriv->qpn); 238 ret = mlx5_cmd_exec_in(mdev, rtr2rts_qp, in); 239 if (ret) 240 goto err_qp_modify_to_err; 241 } 242 return 0; 243 244err_qp_modify_to_err: 245 { 246 u32 in[MLX5_ST_SZ_DW(qp_2err_in)] = {}; 247 248 MLX5_SET(qp_2err_in, in, opcode, MLX5_CMD_OP_2ERR_QP); 249 MLX5_SET(qp_2err_in, in, qpn, ipriv->qpn); 250 mlx5_cmd_exec_in(mdev, qp_2err, in); 251 } 252 return ret; 253} 254 255void mlx5i_uninit_underlay_qp(struct mlx5e_priv *priv) 256{ 257 struct mlx5i_priv *ipriv = priv->ppriv; 258 struct mlx5_core_dev *mdev = priv->mdev; 259 u32 in[MLX5_ST_SZ_DW(qp_2rst_in)] = {}; 260 261 MLX5_SET(qp_2rst_in, in, opcode, MLX5_CMD_OP_2RST_QP); 262 MLX5_SET(qp_2rst_in, in, qpn, ipriv->qpn); 263 mlx5_cmd_exec_in(mdev, qp_2rst, in); 264} 265 266#define MLX5_QP_ENHANCED_ULP_STATELESS_MODE 2 267 268int mlx5i_create_underlay_qp(struct mlx5e_priv *priv) 269{ 270 const unsigned char *dev_addr = priv->netdev->dev_addr; 271 u32 out[MLX5_ST_SZ_DW(create_qp_out)] = {}; 272 u32 in[MLX5_ST_SZ_DW(create_qp_in)] = {}; 273 struct mlx5i_priv *ipriv = priv->ppriv; 274 void *addr_path; 275 int qpn = 0; 276 int ret = 0; 277 void *qpc; 278 279 if (MLX5_CAP_GEN(priv->mdev, mkey_by_name)) { 280 qpn = (dev_addr[1] << 16) + (dev_addr[2] << 8) + dev_addr[3]; 281 MLX5_SET(create_qp_in, in, input_qpn, qpn); 282 } 283 284 qpc = MLX5_ADDR_OF(create_qp_in, in, qpc); 285 MLX5_SET(qpc, qpc, ts_format, mlx5_get_qp_default_ts(priv->mdev)); 286 MLX5_SET(qpc, qpc, st, MLX5_QP_ST_UD); 287 MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED); 288 MLX5_SET(qpc, qpc, ulp_stateless_offload_mode, 289 MLX5_QP_ENHANCED_ULP_STATELESS_MODE); 290 291 addr_path = MLX5_ADDR_OF(qpc, qpc, primary_address_path); 292 MLX5_SET(ads, addr_path, vhca_port_num, 1); 293 MLX5_SET(ads, addr_path, grh, 1); 294 295 MLX5_SET(create_qp_in, in, opcode, MLX5_CMD_OP_CREATE_QP); 296 ret = mlx5_cmd_exec_inout(priv->mdev, create_qp, in, out); 297 if (ret) 298 return ret; 299 300 ipriv->qpn = MLX5_GET(create_qp_out, out, qpn); 301 302 return 0; 303} 304 305void mlx5i_destroy_underlay_qp(struct mlx5_core_dev *mdev, u32 qpn) 306{ 307 u32 in[MLX5_ST_SZ_DW(destroy_qp_in)] = {}; 308 309 MLX5_SET(destroy_qp_in, in, opcode, MLX5_CMD_OP_DESTROY_QP); 310 MLX5_SET(destroy_qp_in, in, qpn, qpn); 311 mlx5_cmd_exec_in(mdev, destroy_qp, in); 312} 313 314int mlx5i_update_nic_rx(struct mlx5e_priv *priv) 315{ 316 return mlx5e_refresh_tirs(priv, true, true); 317} 318 319int mlx5i_create_tis(struct mlx5_core_dev *mdev, u32 underlay_qpn, u32 *tisn) 320{ 321 u32 in[MLX5_ST_SZ_DW(create_tis_in)] = {}; 322 void *tisc; 323 324 tisc = MLX5_ADDR_OF(create_tis_in, in, ctx); 325 326 MLX5_SET(tisc, tisc, underlay_qpn, underlay_qpn); 327 328 return mlx5e_create_tis(mdev, in, tisn); 329} 330 331static int mlx5i_init_tx(struct mlx5e_priv *priv) 332{ 333 struct mlx5i_priv *ipriv = priv->ppriv; 334 int err; 335 336 err = mlx5i_create_underlay_qp(priv); 337 if (err) { 338 mlx5_core_warn(priv->mdev, "create underlay QP failed, %d\n", err); 339 return err; 340 } 341 342 err = mlx5i_create_tis(priv->mdev, ipriv->qpn, &ipriv->tisn); 343 if (err) { 344 mlx5_core_warn(priv->mdev, "create tis failed, %d\n", err); 345 goto err_destroy_underlay_qp; 346 } 347 348 return 0; 349 350err_destroy_underlay_qp: 351 mlx5i_destroy_underlay_qp(priv->mdev, ipriv->qpn); 352 return err; 353} 354 355static void mlx5i_cleanup_tx(struct mlx5e_priv *priv) 356{ 357 struct mlx5i_priv *ipriv = priv->ppriv; 358 359 mlx5e_destroy_tis(priv->mdev, ipriv->tisn); 360 mlx5i_destroy_underlay_qp(priv->mdev, ipriv->qpn); 361} 362 363static int mlx5i_create_flow_steering(struct mlx5e_priv *priv) 364{ 365 struct mlx5_flow_namespace *ns = 366 mlx5_get_flow_namespace(priv->mdev, MLX5_FLOW_NAMESPACE_KERNEL); 367 int err; 368 369 370 if (!ns) 371 return -EINVAL; 372 373 mlx5e_fs_set_ns(priv->fs, ns, false); 374 err = mlx5e_arfs_create_tables(priv->fs, priv->rx_res, 375 !!(priv->netdev->hw_features & NETIF_F_NTUPLE)); 376 if (err) { 377 netdev_err(priv->netdev, "Failed to create arfs tables, err=%d\n", 378 err); 379 priv->netdev->hw_features &= ~NETIF_F_NTUPLE; 380 } 381 382 err = mlx5e_create_ttc_table(priv->fs, priv->rx_res); 383 if (err) { 384 netdev_err(priv->netdev, "Failed to create ttc table, err=%d\n", 385 err); 386 goto err_destroy_arfs_tables; 387 } 388 389 mlx5e_ethtool_init_steering(priv->fs); 390 391 return 0; 392 393err_destroy_arfs_tables: 394 mlx5e_arfs_destroy_tables(priv->fs, 395 !!(priv->netdev->hw_features & NETIF_F_NTUPLE)); 396 397 return err; 398} 399 400static void mlx5i_destroy_flow_steering(struct mlx5e_priv *priv) 401{ 402 mlx5e_destroy_ttc_table(priv->fs); 403 mlx5e_arfs_destroy_tables(priv->fs, 404 !!(priv->netdev->hw_features & NETIF_F_NTUPLE)); 405 mlx5e_ethtool_cleanup_steering(priv->fs); 406} 407 408static int mlx5i_init_rx(struct mlx5e_priv *priv) 409{ 410 struct mlx5_core_dev *mdev = priv->mdev; 411 int err; 412 413 priv->fs = mlx5e_fs_init(priv->profile, mdev, 414 !test_bit(MLX5E_STATE_DESTROYING, &priv->state), 415 priv->dfs_root); 416 if (!priv->fs) { 417 netdev_err(priv->netdev, "FS allocation failed\n"); 418 return -ENOMEM; 419 } 420 421 mlx5e_create_q_counters(priv); 422 423 err = mlx5e_open_drop_rq(priv, &priv->drop_rq); 424 if (err) { 425 mlx5_core_err(mdev, "open drop rq failed, %d\n", err); 426 goto err_destroy_q_counters; 427 } 428 429 priv->rx_res = mlx5e_rx_res_create(priv->mdev, 0, priv->max_nch, priv->drop_rq.rqn, 430 &priv->channels.params.packet_merge, 431 priv->channels.params.num_channels); 432 if (IS_ERR(priv->rx_res)) { 433 err = PTR_ERR(priv->rx_res); 434 goto err_close_drop_rq; 435 } 436 437 err = mlx5i_create_flow_steering(priv); 438 if (err) 439 goto err_destroy_rx_res; 440 441 return 0; 442 443err_destroy_rx_res: 444 mlx5e_rx_res_destroy(priv->rx_res); 445 priv->rx_res = ERR_PTR(-EINVAL); 446err_close_drop_rq: 447 mlx5e_close_drop_rq(&priv->drop_rq); 448err_destroy_q_counters: 449 mlx5e_destroy_q_counters(priv); 450 mlx5e_fs_cleanup(priv->fs); 451 return err; 452} 453 454static void mlx5i_cleanup_rx(struct mlx5e_priv *priv) 455{ 456 mlx5i_destroy_flow_steering(priv); 457 mlx5e_rx_res_destroy(priv->rx_res); 458 priv->rx_res = ERR_PTR(-EINVAL); 459 mlx5e_close_drop_rq(&priv->drop_rq); 460 mlx5e_destroy_q_counters(priv); 461 mlx5e_fs_cleanup(priv->fs); 462} 463 464/* The stats groups order is opposite to the update_stats() order calls */ 465static mlx5e_stats_grp_t mlx5i_stats_grps[] = { 466 &MLX5E_STATS_GRP(sw), 467 &MLX5E_STATS_GRP(qcnt), 468 &MLX5E_STATS_GRP(vnic_env), 469 &MLX5E_STATS_GRP(vport), 470 &MLX5E_STATS_GRP(802_3), 471 &MLX5E_STATS_GRP(2863), 472 &MLX5E_STATS_GRP(2819), 473 &MLX5E_STATS_GRP(phy), 474 &MLX5E_STATS_GRP(pcie), 475 &MLX5E_STATS_GRP(per_prio), 476 &MLX5E_STATS_GRP(pme), 477 &MLX5E_STATS_GRP(channels), 478 &MLX5E_STATS_GRP(per_port_buff_congest), 479}; 480 481static unsigned int mlx5i_stats_grps_num(struct mlx5e_priv *priv) 482{ 483 return ARRAY_SIZE(mlx5i_stats_grps); 484} 485 486u32 mlx5i_get_tisn(struct mlx5_core_dev *mdev, struct mlx5e_priv *priv, u8 lag_port, u8 tc) 487{ 488 struct mlx5i_priv *ipriv = priv->ppriv; 489 490 if (WARN(lag_port || tc, 491 "IPoIB unexpected non-zero value: lag_port (%u), tc (%u)\n", 492 lag_port, tc)) 493 return 0; 494 495 return ipriv->tisn; 496} 497 498static const struct mlx5e_profile mlx5i_nic_profile = { 499 .init = mlx5i_init, 500 .cleanup = mlx5i_cleanup, 501 .init_tx = mlx5i_init_tx, 502 .cleanup_tx = mlx5i_cleanup_tx, 503 .init_rx = mlx5i_init_rx, 504 .cleanup_rx = mlx5i_cleanup_rx, 505 .enable = NULL, /* mlx5i_enable */ 506 .disable = NULL, /* mlx5i_disable */ 507 .update_rx = mlx5i_update_nic_rx, 508 .update_stats = NULL, /* mlx5i_update_stats */ 509 .update_carrier = NULL, /* no HW update in IB link */ 510 .rx_handlers = &mlx5i_rx_handlers, 511 .max_tc = MLX5I_MAX_NUM_TC, 512 .stats_grps = mlx5i_stats_grps, 513 .stats_grps_num = mlx5i_stats_grps_num, 514 .get_tisn = mlx5i_get_tisn, 515}; 516 517/* mlx5i netdev NDos */ 518 519static int mlx5i_change_mtu(struct net_device *netdev, int new_mtu) 520{ 521 struct mlx5e_priv *priv = mlx5i_epriv(netdev); 522 struct mlx5e_params new_params; 523 int err = 0; 524 525 mutex_lock(&priv->state_lock); 526 527 new_params = priv->channels.params; 528 new_params.sw_mtu = new_mtu; 529 530 err = mlx5e_safe_switch_params(priv, &new_params, NULL, NULL, true); 531 if (err) 532 goto out; 533 534 netdev->mtu = new_params.sw_mtu; 535 536out: 537 mutex_unlock(&priv->state_lock); 538 return err; 539} 540 541int mlx5i_dev_init(struct net_device *dev) 542{ 543 struct mlx5e_priv *priv = mlx5i_epriv(dev); 544 struct mlx5i_priv *ipriv = priv->ppriv; 545 u8 addr_mod[3]; 546 547 /* Set dev address using underlay QP */ 548 addr_mod[0] = (ipriv->qpn >> 16) & 0xff; 549 addr_mod[1] = (ipriv->qpn >> 8) & 0xff; 550 addr_mod[2] = (ipriv->qpn) & 0xff; 551 dev_addr_mod(dev, 1, addr_mod, sizeof(addr_mod)); 552 553 /* Add QPN to net-device mapping to HT */ 554 mlx5i_pkey_add_qpn(dev, ipriv->qpn); 555 556 return 0; 557} 558 559int mlx5i_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd) 560{ 561 struct mlx5e_priv *priv = mlx5i_epriv(dev); 562 563 switch (cmd) { 564 case SIOCSHWTSTAMP: 565 return mlx5e_hwstamp_set(priv, ifr); 566 case SIOCGHWTSTAMP: 567 return mlx5e_hwstamp_get(priv, ifr); 568 default: 569 return -EOPNOTSUPP; 570 } 571} 572 573void mlx5i_dev_cleanup(struct net_device *dev) 574{ 575 struct mlx5e_priv *priv = mlx5i_epriv(dev); 576 struct mlx5i_priv *ipriv = priv->ppriv; 577 578 mlx5i_uninit_underlay_qp(priv); 579 580 /* Delete QPN to net-device mapping from HT */ 581 mlx5i_pkey_del_qpn(dev, ipriv->qpn); 582} 583 584static int mlx5i_open(struct net_device *netdev) 585{ 586 struct mlx5e_priv *epriv = mlx5i_epriv(netdev); 587 struct mlx5i_priv *ipriv = epriv->ppriv; 588 struct mlx5_core_dev *mdev = epriv->mdev; 589 int err; 590 591 mutex_lock(&epriv->state_lock); 592 593 set_bit(MLX5E_STATE_OPENED, &epriv->state); 594 595 err = mlx5i_init_underlay_qp(epriv); 596 if (err) { 597 mlx5_core_warn(mdev, "prepare underlay qp state failed, %d\n", err); 598 goto err_clear_state_opened_flag; 599 } 600 601 err = mlx5_fs_add_rx_underlay_qpn(mdev, ipriv->qpn); 602 if (err) { 603 mlx5_core_warn(mdev, "attach underlay qp to ft failed, %d\n", err); 604 goto err_reset_qp; 605 } 606 607 err = mlx5e_open_channels(epriv, &epriv->channels); 608 if (err) 609 goto err_remove_fs_underlay_qp; 610 611 err = epriv->profile->update_rx(epriv); 612 if (err) 613 goto err_close_channels; 614 615 mlx5e_activate_priv_channels(epriv); 616 617 mutex_unlock(&epriv->state_lock); 618 return 0; 619 620err_close_channels: 621 mlx5e_close_channels(&epriv->channels); 622err_remove_fs_underlay_qp: 623 mlx5_fs_remove_rx_underlay_qpn(mdev, ipriv->qpn); 624err_reset_qp: 625 mlx5i_uninit_underlay_qp(epriv); 626err_clear_state_opened_flag: 627 clear_bit(MLX5E_STATE_OPENED, &epriv->state); 628 mutex_unlock(&epriv->state_lock); 629 return err; 630} 631 632static int mlx5i_close(struct net_device *netdev) 633{ 634 struct mlx5e_priv *epriv = mlx5i_epriv(netdev); 635 struct mlx5i_priv *ipriv = epriv->ppriv; 636 struct mlx5_core_dev *mdev = epriv->mdev; 637 638 /* May already be CLOSED in case a previous configuration operation 639 * (e.g RX/TX queue size change) that involves close&open failed. 640 */ 641 mutex_lock(&epriv->state_lock); 642 643 if (!test_bit(MLX5E_STATE_OPENED, &epriv->state)) 644 goto unlock; 645 646 clear_bit(MLX5E_STATE_OPENED, &epriv->state); 647 648 netif_carrier_off(epriv->netdev); 649 mlx5_fs_remove_rx_underlay_qpn(mdev, ipriv->qpn); 650 mlx5e_deactivate_priv_channels(epriv); 651 mlx5e_close_channels(&epriv->channels); 652 mlx5i_uninit_underlay_qp(epriv); 653unlock: 654 mutex_unlock(&epriv->state_lock); 655 return 0; 656} 657 658/* IPoIB RDMA netdev callbacks */ 659static int mlx5i_attach_mcast(struct net_device *netdev, struct ib_device *hca, 660 union ib_gid *gid, u16 lid, int set_qkey, 661 u32 qkey) 662{ 663 struct mlx5e_priv *epriv = mlx5i_epriv(netdev); 664 struct mlx5_core_dev *mdev = epriv->mdev; 665 struct mlx5i_priv *ipriv = epriv->ppriv; 666 int err; 667 668 mlx5_core_dbg(mdev, "attaching QPN 0x%x, MGID %pI6\n", ipriv->qpn, 669 gid->raw); 670 err = mlx5_core_attach_mcg(mdev, gid, ipriv->qpn); 671 if (err) 672 mlx5_core_warn(mdev, "failed attaching QPN 0x%x, MGID %pI6\n", 673 ipriv->qpn, gid->raw); 674 675 if (set_qkey) { 676 mlx5_core_dbg(mdev, "%s setting qkey 0x%x\n", 677 netdev->name, qkey); 678 ipriv->qkey = qkey; 679 } 680 681 return err; 682} 683 684static int mlx5i_detach_mcast(struct net_device *netdev, struct ib_device *hca, 685 union ib_gid *gid, u16 lid) 686{ 687 struct mlx5e_priv *epriv = mlx5i_epriv(netdev); 688 struct mlx5_core_dev *mdev = epriv->mdev; 689 struct mlx5i_priv *ipriv = epriv->ppriv; 690 int err; 691 692 mlx5_core_dbg(mdev, "detaching QPN 0x%x, MGID %pI6\n", ipriv->qpn, 693 gid->raw); 694 695 err = mlx5_core_detach_mcg(mdev, gid, ipriv->qpn); 696 if (err) 697 mlx5_core_dbg(mdev, "failed detaching QPN 0x%x, MGID %pI6\n", 698 ipriv->qpn, gid->raw); 699 700 return err; 701} 702 703static int mlx5i_xmit(struct net_device *dev, struct sk_buff *skb, 704 struct ib_ah *address, u32 dqpn) 705{ 706 struct mlx5e_priv *epriv = mlx5i_epriv(dev); 707 struct mlx5e_txqsq *sq = epriv->txq2sq[skb_get_queue_mapping(skb)]; 708 struct mlx5_ib_ah *mah = to_mah(address); 709 struct mlx5i_priv *ipriv = epriv->ppriv; 710 711 mlx5i_sq_xmit(sq, skb, &mah->av, dqpn, ipriv->qkey, netdev_xmit_more()); 712 713 return NETDEV_TX_OK; 714} 715 716static void mlx5i_set_pkey_index(struct net_device *netdev, int id) 717{ 718 struct mlx5i_priv *ipriv = netdev_priv(netdev); 719 720 ipriv->pkey_index = (u16)id; 721} 722 723static int mlx5i_check_required_hca_cap(struct mlx5_core_dev *mdev) 724{ 725 if (MLX5_CAP_GEN(mdev, port_type) != MLX5_CAP_PORT_TYPE_IB) 726 return -EOPNOTSUPP; 727 728 if (!MLX5_CAP_GEN(mdev, ipoib_enhanced_offloads)) { 729 mlx5_core_warn(mdev, "IPoIB enhanced offloads are not supported\n"); 730 return -EOPNOTSUPP; 731 } 732 733 return 0; 734} 735 736static void mlx5_rdma_netdev_free(struct net_device *netdev) 737{ 738 struct mlx5e_priv *priv = mlx5i_epriv(netdev); 739 struct mlx5_core_dev *mdev = priv->mdev; 740 struct mlx5i_priv *ipriv = priv->ppriv; 741 const struct mlx5e_profile *profile = priv->profile; 742 743 mlx5e_detach_netdev(priv); 744 profile->cleanup(priv); 745 746 if (!ipriv->sub_interface) { 747 mlx5i_pkey_qpn_ht_cleanup(netdev); 748 mlx5e_destroy_mdev_resources(mdev); 749 } 750} 751 752static bool mlx5_is_sub_interface(struct mlx5_core_dev *mdev) 753{ 754 return mdev->mlx5e_res.hw_objs.pdn != 0; 755} 756 757static const struct mlx5e_profile *mlx5_get_profile(struct mlx5_core_dev *mdev) 758{ 759 if (mlx5_is_sub_interface(mdev)) 760 return mlx5i_pkey_get_profile(); 761 return &mlx5i_nic_profile; 762} 763 764static int mlx5_rdma_setup_rn(struct ib_device *ibdev, u32 port_num, 765 struct net_device *netdev, void *param) 766{ 767 struct mlx5_core_dev *mdev = (struct mlx5_core_dev *)param; 768 const struct mlx5e_profile *prof = mlx5_get_profile(mdev); 769 struct mlx5i_priv *ipriv; 770 struct mlx5e_priv *epriv; 771 struct rdma_netdev *rn; 772 int err; 773 774 ipriv = netdev_priv(netdev); 775 epriv = mlx5i_epriv(netdev); 776 777 ipriv->sub_interface = mlx5_is_sub_interface(mdev); 778 if (!ipriv->sub_interface) { 779 err = mlx5i_pkey_qpn_ht_init(netdev); 780 if (err) { 781 mlx5_core_warn(mdev, "allocate qpn_to_netdev ht failed\n"); 782 return err; 783 } 784 785 /* This should only be called once per mdev */ 786 err = mlx5e_create_mdev_resources(mdev, false); 787 if (err) 788 goto destroy_ht; 789 } 790 791 err = mlx5e_priv_init(epriv, prof, netdev, mdev); 792 if (err) 793 goto destroy_mdev_resources; 794 795 epriv->profile = prof; 796 epriv->ppriv = ipriv; 797 798 prof->init(mdev, netdev); 799 800 err = mlx5e_attach_netdev(epriv); 801 if (err) 802 goto detach; 803 netif_carrier_off(netdev); 804 805 /* set rdma_netdev func pointers */ 806 rn = &ipriv->rn; 807 rn->hca = ibdev; 808 rn->send = mlx5i_xmit; 809 rn->attach_mcast = mlx5i_attach_mcast; 810 rn->detach_mcast = mlx5i_detach_mcast; 811 rn->set_id = mlx5i_set_pkey_index; 812 813 netdev->priv_destructor = mlx5_rdma_netdev_free; 814 netdev->needs_free_netdev = 1; 815 816 return 0; 817 818detach: 819 prof->cleanup(epriv); 820 if (ipriv->sub_interface) 821 return err; 822destroy_mdev_resources: 823 mlx5e_destroy_mdev_resources(mdev); 824destroy_ht: 825 mlx5i_pkey_qpn_ht_cleanup(netdev); 826 return err; 827} 828 829int mlx5_rdma_rn_get_params(struct mlx5_core_dev *mdev, 830 struct ib_device *device, 831 struct rdma_netdev_alloc_params *params) 832{ 833 int nch; 834 int rc; 835 836 rc = mlx5i_check_required_hca_cap(mdev); 837 if (rc) 838 return rc; 839 840 nch = mlx5e_get_max_num_channels(mdev); 841 842 *params = (struct rdma_netdev_alloc_params){ 843 .sizeof_priv = sizeof(struct mlx5i_priv) + 844 sizeof(struct mlx5e_priv), 845 .txqs = nch * MLX5_MAX_NUM_TC, 846 .rxqs = nch, 847 .param = mdev, 848 .initialize_rdma_netdev = mlx5_rdma_setup_rn, 849 }; 850 851 return 0; 852} 853EXPORT_SYMBOL(mlx5_rdma_rn_get_params); 854