1/* 2 * Copyright (c) 2014, Mellanox Technologies inc. All rights reserved. 3 * 4 * This software is available to you under a choice of one of two 5 * licenses. You may choose to be licensed under the terms of the GNU 6 * General Public License (GPL) Version 2, available from the file 7 * COPYING in the main directory of this source tree, or the 8 * OpenIB.org BSD license below: 9 * 10 * Redistribution and use in source and binary forms, with or 11 * without modification, are permitted provided that the following 12 * conditions are met: 13 * 14 * - Redistributions of source code must retain the above 15 * copyright notice, this list of conditions and the following 16 * disclaimer. 17 * 18 * - Redistributions in binary form must reproduce the above 19 * copyright notice, this list of conditions and the following 20 * disclaimer in the documentation and/or other materials 21 * provided with the distribution. 22 * 23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 30 * SOFTWARE. 31 */ 32 33#include <linux/pci.h> 34#include <linux/mlx5/driver.h> 35#include <linux/mlx5/vport.h> 36#include "mlx5_core.h" 37#include "mlx5_irq.h" 38#include "eswitch.h" 39 40static int sriov_restore_guids(struct mlx5_core_dev *dev, int vf, u16 func_id) 41{ 42 struct mlx5_core_sriov *sriov = &dev->priv.sriov; 43 struct mlx5_hca_vport_context *in; 44 int err = 0; 45 46 /* Restore sriov guid and policy settings */ 47 if (sriov->vfs_ctx[vf].node_guid || 48 sriov->vfs_ctx[vf].port_guid || 49 sriov->vfs_ctx[vf].policy != MLX5_POLICY_INVALID) { 50 in = kzalloc(sizeof(*in), GFP_KERNEL); 51 if (!in) 52 return -ENOMEM; 53 54 in->node_guid = sriov->vfs_ctx[vf].node_guid; 55 in->port_guid = sriov->vfs_ctx[vf].port_guid; 56 in->policy = sriov->vfs_ctx[vf].policy; 57 in->field_select = 58 !!(in->port_guid) * MLX5_HCA_VPORT_SEL_PORT_GUID | 59 !!(in->node_guid) * MLX5_HCA_VPORT_SEL_NODE_GUID | 60 !!(in->policy) * MLX5_HCA_VPORT_SEL_STATE_POLICY; 61 62 err = mlx5_core_modify_hca_vport_context(dev, 1, 1, func_id, in); 63 if (err) 64 mlx5_core_warn(dev, "modify vport context failed, unable to restore VF %d settings\n", vf); 65 66 kfree(in); 67 } 68 69 return err; 70} 71 72static int mlx5_device_enable_sriov(struct mlx5_core_dev *dev, int num_vfs) 73{ 74 struct mlx5_core_sriov *sriov = &dev->priv.sriov; 75 int err, vf, num_msix_count; 76 int vport_num; 77 78 err = mlx5_eswitch_enable(dev->priv.eswitch, num_vfs); 79 if (err) { 80 mlx5_core_warn(dev, 81 "failed to enable eswitch SRIOV (%d)\n", err); 82 return err; 83 } 84 85 num_msix_count = mlx5_get_default_msix_vec_count(dev, num_vfs); 86 for (vf = 0; vf < num_vfs; vf++) { 87 /* Notify the VF before its enablement to let it set 88 * some stuff. 89 */ 90 blocking_notifier_call_chain(&sriov->vfs_ctx[vf].notifier, 91 MLX5_PF_NOTIFY_ENABLE_VF, dev); 92 err = mlx5_core_enable_hca(dev, vf + 1); 93 if (err) { 94 mlx5_core_warn(dev, "failed to enable VF %d (%d)\n", vf, err); 95 continue; 96 } 97 98 err = mlx5_set_msix_vec_count(dev, vf + 1, num_msix_count); 99 if (err) { 100 mlx5_core_warn(dev, 101 "failed to set MSI-X vector counts VF %d, err %d\n", 102 vf, err); 103 continue; 104 } 105 106 sriov->vfs_ctx[vf].enabled = 1; 107 if (MLX5_CAP_GEN(dev, port_type) == MLX5_CAP_PORT_TYPE_IB) { 108 vport_num = mlx5_core_ec_sriov_enabled(dev) ? 109 mlx5_core_ec_vf_vport_base(dev) + vf 110 : vf + 1; 111 err = sriov_restore_guids(dev, vf, vport_num); 112 if (err) { 113 mlx5_core_warn(dev, 114 "failed to restore VF %d settings, err %d\n", 115 vf, err); 116 continue; 117 } 118 } 119 mlx5_core_dbg(dev, "successfully enabled VF* %d\n", vf); 120 } 121 122 return 0; 123} 124 125static void 126mlx5_device_disable_sriov(struct mlx5_core_dev *dev, int num_vfs, bool clear_vf, bool num_vf_change) 127{ 128 struct mlx5_core_sriov *sriov = &dev->priv.sriov; 129 bool wait_for_ec_vf_pages = true; 130 bool wait_for_vf_pages = true; 131 int err; 132 int vf; 133 134 for (vf = num_vfs - 1; vf >= 0; vf--) { 135 if (!sriov->vfs_ctx[vf].enabled) 136 continue; 137 /* Notify the VF before its disablement to let it clean 138 * some resources. 139 */ 140 blocking_notifier_call_chain(&sriov->vfs_ctx[vf].notifier, 141 MLX5_PF_NOTIFY_DISABLE_VF, dev); 142 err = mlx5_core_disable_hca(dev, vf + 1); 143 if (err) { 144 mlx5_core_warn(dev, "failed to disable VF %d\n", vf); 145 continue; 146 } 147 sriov->vfs_ctx[vf].enabled = 0; 148 } 149 150 mlx5_eswitch_disable_sriov(dev->priv.eswitch, clear_vf); 151 152 /* There are a number of scenarios when SRIOV is being disabled: 153 * 1. VFs or ECVFs had been created, and now set back to 0 (num_vf_change == true). 154 * - If EC SRIOV is enabled then this flow is happening on the 155 * embedded platform, wait for only EC VF pages. 156 * - If EC SRIOV is not enabled this flow is happening on non-embedded 157 * platform, wait for the VF pages. 158 * 159 * 2. The driver is being unloaded. In this case wait for all pages. 160 */ 161 if (num_vf_change) { 162 if (mlx5_core_ec_sriov_enabled(dev)) 163 wait_for_vf_pages = false; 164 else 165 wait_for_ec_vf_pages = false; 166 } 167 168 if (wait_for_ec_vf_pages && mlx5_wait_for_pages(dev, &dev->priv.page_counters[MLX5_EC_VF])) 169 mlx5_core_warn(dev, "timeout reclaiming EC VFs pages\n"); 170 171 /* For ECPFs, skip waiting for host VF pages until ECPF is destroyed */ 172 if (mlx5_core_is_ecpf(dev)) 173 return; 174 175 if (wait_for_vf_pages && mlx5_wait_for_pages(dev, &dev->priv.page_counters[MLX5_VF])) 176 mlx5_core_warn(dev, "timeout reclaiming VFs pages\n"); 177} 178 179static int mlx5_sriov_enable(struct pci_dev *pdev, int num_vfs) 180{ 181 struct mlx5_core_dev *dev = pci_get_drvdata(pdev); 182 struct devlink *devlink = priv_to_devlink(dev); 183 int err; 184 185 devl_lock(devlink); 186 err = mlx5_device_enable_sriov(dev, num_vfs); 187 devl_unlock(devlink); 188 if (err) { 189 mlx5_core_warn(dev, "mlx5_device_enable_sriov failed : %d\n", err); 190 return err; 191 } 192 193 err = pci_enable_sriov(pdev, num_vfs); 194 if (err) { 195 mlx5_core_warn(dev, "pci_enable_sriov failed : %d\n", err); 196 mlx5_device_disable_sriov(dev, num_vfs, true, true); 197 } 198 return err; 199} 200 201void mlx5_sriov_disable(struct pci_dev *pdev, bool num_vf_change) 202{ 203 struct mlx5_core_dev *dev = pci_get_drvdata(pdev); 204 struct devlink *devlink = priv_to_devlink(dev); 205 int num_vfs = pci_num_vf(dev->pdev); 206 207 pci_disable_sriov(pdev); 208 devl_lock(devlink); 209 mlx5_device_disable_sriov(dev, num_vfs, true, num_vf_change); 210 devl_unlock(devlink); 211} 212 213int mlx5_core_sriov_configure(struct pci_dev *pdev, int num_vfs) 214{ 215 struct mlx5_core_dev *dev = pci_get_drvdata(pdev); 216 struct mlx5_core_sriov *sriov = &dev->priv.sriov; 217 int err = 0; 218 219 mlx5_core_dbg(dev, "requested num_vfs %d\n", num_vfs); 220 221 if (num_vfs) 222 err = mlx5_sriov_enable(pdev, num_vfs); 223 else 224 mlx5_sriov_disable(pdev, true); 225 226 if (!err) 227 sriov->num_vfs = num_vfs; 228 return err ? err : num_vfs; 229} 230 231int mlx5_core_sriov_set_msix_vec_count(struct pci_dev *vf, int msix_vec_count) 232{ 233 struct pci_dev *pf = pci_physfn(vf); 234 struct mlx5_core_sriov *sriov; 235 struct mlx5_core_dev *dev; 236 int num_vf_msix, id; 237 238 dev = pci_get_drvdata(pf); 239 num_vf_msix = MLX5_CAP_GEN_MAX(dev, num_total_dynamic_vf_msix); 240 if (!num_vf_msix) 241 return -EOPNOTSUPP; 242 243 if (!msix_vec_count) 244 msix_vec_count = 245 mlx5_get_default_msix_vec_count(dev, pci_num_vf(pf)); 246 247 sriov = &dev->priv.sriov; 248 id = pci_iov_vf_id(vf); 249 if (id < 0 || !sriov->vfs_ctx[id].enabled) 250 return -EINVAL; 251 252 return mlx5_set_msix_vec_count(dev, id + 1, msix_vec_count); 253} 254 255int mlx5_sriov_attach(struct mlx5_core_dev *dev) 256{ 257 if (!mlx5_core_is_pf(dev) || !pci_num_vf(dev->pdev)) 258 return 0; 259 260 /* If sriov VFs exist in PCI level, enable them in device level */ 261 return mlx5_device_enable_sriov(dev, pci_num_vf(dev->pdev)); 262} 263 264void mlx5_sriov_detach(struct mlx5_core_dev *dev) 265{ 266 if (!mlx5_core_is_pf(dev)) 267 return; 268 269 mlx5_device_disable_sriov(dev, pci_num_vf(dev->pdev), false, false); 270} 271 272static u16 mlx5_get_max_vfs(struct mlx5_core_dev *dev) 273{ 274 u16 host_total_vfs; 275 const u32 *out; 276 277 if (mlx5_core_is_ecpf_esw_manager(dev)) { 278 out = mlx5_esw_query_functions(dev); 279 280 /* Old FW doesn't support getting total_vfs from esw func 281 * but supports getting it from pci_sriov. 282 */ 283 if (IS_ERR(out)) 284 goto done; 285 host_total_vfs = MLX5_GET(query_esw_functions_out, out, 286 host_params_context.host_total_vfs); 287 kvfree(out); 288 return host_total_vfs; 289 } 290 291done: 292 return pci_sriov_get_totalvfs(dev->pdev); 293} 294 295int mlx5_sriov_init(struct mlx5_core_dev *dev) 296{ 297 struct mlx5_core_sriov *sriov = &dev->priv.sriov; 298 struct pci_dev *pdev = dev->pdev; 299 int total_vfs, i; 300 301 if (!mlx5_core_is_pf(dev)) 302 return 0; 303 304 total_vfs = pci_sriov_get_totalvfs(pdev); 305 sriov->max_vfs = mlx5_get_max_vfs(dev); 306 sriov->num_vfs = pci_num_vf(pdev); 307 sriov->max_ec_vfs = mlx5_core_ec_sriov_enabled(dev) ? pci_sriov_get_totalvfs(dev->pdev) : 0; 308 sriov->vfs_ctx = kcalloc(total_vfs, sizeof(*sriov->vfs_ctx), GFP_KERNEL); 309 if (!sriov->vfs_ctx) 310 return -ENOMEM; 311 312 for (i = 0; i < total_vfs; i++) 313 BLOCKING_INIT_NOTIFIER_HEAD(&sriov->vfs_ctx[i].notifier); 314 315 return 0; 316} 317 318void mlx5_sriov_cleanup(struct mlx5_core_dev *dev) 319{ 320 struct mlx5_core_sriov *sriov = &dev->priv.sriov; 321 322 if (!mlx5_core_is_pf(dev)) 323 return; 324 325 kfree(sriov->vfs_ctx); 326} 327 328/** 329 * mlx5_sriov_blocking_notifier_unregister - Unregister a VF from 330 * a notification block chain. 331 * 332 * @mdev: The mlx5 core device. 333 * @vf_id: The VF id. 334 * @nb: The notifier block to be unregistered. 335 */ 336void mlx5_sriov_blocking_notifier_unregister(struct mlx5_core_dev *mdev, 337 int vf_id, 338 struct notifier_block *nb) 339{ 340 struct mlx5_vf_context *vfs_ctx; 341 struct mlx5_core_sriov *sriov; 342 343 sriov = &mdev->priv.sriov; 344 if (WARN_ON(vf_id < 0 || vf_id >= sriov->num_vfs)) 345 return; 346 347 vfs_ctx = &sriov->vfs_ctx[vf_id]; 348 blocking_notifier_chain_unregister(&vfs_ctx->notifier, nb); 349} 350EXPORT_SYMBOL(mlx5_sriov_blocking_notifier_unregister); 351 352/** 353 * mlx5_sriov_blocking_notifier_register - Register a VF notification 354 * block chain. 355 * 356 * @mdev: The mlx5 core device. 357 * @vf_id: The VF id. 358 * @nb: The notifier block to be called upon the VF events. 359 * 360 * Returns 0 on success or an error code. 361 */ 362int mlx5_sriov_blocking_notifier_register(struct mlx5_core_dev *mdev, 363 int vf_id, 364 struct notifier_block *nb) 365{ 366 struct mlx5_vf_context *vfs_ctx; 367 struct mlx5_core_sriov *sriov; 368 369 sriov = &mdev->priv.sriov; 370 if (vf_id < 0 || vf_id >= sriov->num_vfs) 371 return -EINVAL; 372 373 vfs_ctx = &sriov->vfs_ctx[vf_id]; 374 return blocking_notifier_chain_register(&vfs_ctx->notifier, nb); 375} 376EXPORT_SYMBOL(mlx5_sriov_blocking_notifier_register); 377