/* * Copyright (c) 2014, Mellanox Technologies inc. All rights reserved. * * This software is available to you under a choice of one of two * licenses. You may choose to be licensed under the terms of the GNU * General Public License (GPL) Version 2, available from the file * COPYING in the main directory of this source tree, or the * OpenIB.org BSD license below: * * Redistribution and use in source and binary forms, with or * without modification, are permitted provided that the following * conditions are met: * * - Redistributions of source code must retain the above * copyright notice, this list of conditions and the following * disclaimer. * * - Redistributions in binary form must reproduce the above * copyright notice, this list of conditions and the following * disclaimer in the documentation and/or other materials * provided with the distribution. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE * SOFTWARE. */ #include #include #include #include "mlx5_core.h" #include "mlx5_irq.h" #include "eswitch.h" static int sriov_restore_guids(struct mlx5_core_dev *dev, int vf, u16 func_id) { struct mlx5_core_sriov *sriov = &dev->priv.sriov; struct mlx5_hca_vport_context *in; int err = 0; /* Restore sriov guid and policy settings */ if (sriov->vfs_ctx[vf].node_guid || sriov->vfs_ctx[vf].port_guid || sriov->vfs_ctx[vf].policy != MLX5_POLICY_INVALID) { in = kzalloc(sizeof(*in), GFP_KERNEL); if (!in) return -ENOMEM; in->node_guid = sriov->vfs_ctx[vf].node_guid; in->port_guid = sriov->vfs_ctx[vf].port_guid; in->policy = sriov->vfs_ctx[vf].policy; in->field_select = !!(in->port_guid) * MLX5_HCA_VPORT_SEL_PORT_GUID | !!(in->node_guid) * MLX5_HCA_VPORT_SEL_NODE_GUID | !!(in->policy) * MLX5_HCA_VPORT_SEL_STATE_POLICY; err = mlx5_core_modify_hca_vport_context(dev, 1, 1, func_id, in); if (err) mlx5_core_warn(dev, "modify vport context failed, unable to restore VF %d settings\n", vf); kfree(in); } return err; } static int mlx5_device_enable_sriov(struct mlx5_core_dev *dev, int num_vfs) { struct mlx5_core_sriov *sriov = &dev->priv.sriov; int err, vf, num_msix_count; int vport_num; err = mlx5_eswitch_enable(dev->priv.eswitch, num_vfs); if (err) { mlx5_core_warn(dev, "failed to enable eswitch SRIOV (%d)\n", err); return err; } num_msix_count = mlx5_get_default_msix_vec_count(dev, num_vfs); for (vf = 0; vf < num_vfs; vf++) { /* Notify the VF before its enablement to let it set * some stuff. */ blocking_notifier_call_chain(&sriov->vfs_ctx[vf].notifier, MLX5_PF_NOTIFY_ENABLE_VF, dev); err = mlx5_core_enable_hca(dev, vf + 1); if (err) { mlx5_core_warn(dev, "failed to enable VF %d (%d)\n", vf, err); continue; } err = mlx5_set_msix_vec_count(dev, vf + 1, num_msix_count); if (err) { mlx5_core_warn(dev, "failed to set MSI-X vector counts VF %d, err %d\n", vf, err); continue; } sriov->vfs_ctx[vf].enabled = 1; if (MLX5_CAP_GEN(dev, port_type) == MLX5_CAP_PORT_TYPE_IB) { vport_num = mlx5_core_ec_sriov_enabled(dev) ? mlx5_core_ec_vf_vport_base(dev) + vf : vf + 1; err = sriov_restore_guids(dev, vf, vport_num); if (err) { mlx5_core_warn(dev, "failed to restore VF %d settings, err %d\n", vf, err); continue; } } mlx5_core_dbg(dev, "successfully enabled VF* %d\n", vf); } return 0; } static void mlx5_device_disable_sriov(struct mlx5_core_dev *dev, int num_vfs, bool clear_vf, bool num_vf_change) { struct mlx5_core_sriov *sriov = &dev->priv.sriov; bool wait_for_ec_vf_pages = true; bool wait_for_vf_pages = true; int err; int vf; for (vf = num_vfs - 1; vf >= 0; vf--) { if (!sriov->vfs_ctx[vf].enabled) continue; /* Notify the VF before its disablement to let it clean * some resources. */ blocking_notifier_call_chain(&sriov->vfs_ctx[vf].notifier, MLX5_PF_NOTIFY_DISABLE_VF, dev); err = mlx5_core_disable_hca(dev, vf + 1); if (err) { mlx5_core_warn(dev, "failed to disable VF %d\n", vf); continue; } sriov->vfs_ctx[vf].enabled = 0; } mlx5_eswitch_disable_sriov(dev->priv.eswitch, clear_vf); /* There are a number of scenarios when SRIOV is being disabled: * 1. VFs or ECVFs had been created, and now set back to 0 (num_vf_change == true). * - If EC SRIOV is enabled then this flow is happening on the * embedded platform, wait for only EC VF pages. * - If EC SRIOV is not enabled this flow is happening on non-embedded * platform, wait for the VF pages. * * 2. The driver is being unloaded. In this case wait for all pages. */ if (num_vf_change) { if (mlx5_core_ec_sriov_enabled(dev)) wait_for_vf_pages = false; else wait_for_ec_vf_pages = false; } if (wait_for_ec_vf_pages && mlx5_wait_for_pages(dev, &dev->priv.page_counters[MLX5_EC_VF])) mlx5_core_warn(dev, "timeout reclaiming EC VFs pages\n"); /* For ECPFs, skip waiting for host VF pages until ECPF is destroyed */ if (mlx5_core_is_ecpf(dev)) return; if (wait_for_vf_pages && mlx5_wait_for_pages(dev, &dev->priv.page_counters[MLX5_VF])) mlx5_core_warn(dev, "timeout reclaiming VFs pages\n"); } static int mlx5_sriov_enable(struct pci_dev *pdev, int num_vfs) { struct mlx5_core_dev *dev = pci_get_drvdata(pdev); struct devlink *devlink = priv_to_devlink(dev); int err; devl_lock(devlink); err = mlx5_device_enable_sriov(dev, num_vfs); devl_unlock(devlink); if (err) { mlx5_core_warn(dev, "mlx5_device_enable_sriov failed : %d\n", err); return err; } err = pci_enable_sriov(pdev, num_vfs); if (err) { mlx5_core_warn(dev, "pci_enable_sriov failed : %d\n", err); mlx5_device_disable_sriov(dev, num_vfs, true, true); } return err; } void mlx5_sriov_disable(struct pci_dev *pdev, bool num_vf_change) { struct mlx5_core_dev *dev = pci_get_drvdata(pdev); struct devlink *devlink = priv_to_devlink(dev); int num_vfs = pci_num_vf(dev->pdev); pci_disable_sriov(pdev); devl_lock(devlink); mlx5_device_disable_sriov(dev, num_vfs, true, num_vf_change); devl_unlock(devlink); } int mlx5_core_sriov_configure(struct pci_dev *pdev, int num_vfs) { struct mlx5_core_dev *dev = pci_get_drvdata(pdev); struct mlx5_core_sriov *sriov = &dev->priv.sriov; int err = 0; mlx5_core_dbg(dev, "requested num_vfs %d\n", num_vfs); if (num_vfs) err = mlx5_sriov_enable(pdev, num_vfs); else mlx5_sriov_disable(pdev, true); if (!err) sriov->num_vfs = num_vfs; return err ? err : num_vfs; } int mlx5_core_sriov_set_msix_vec_count(struct pci_dev *vf, int msix_vec_count) { struct pci_dev *pf = pci_physfn(vf); struct mlx5_core_sriov *sriov; struct mlx5_core_dev *dev; int num_vf_msix, id; dev = pci_get_drvdata(pf); num_vf_msix = MLX5_CAP_GEN_MAX(dev, num_total_dynamic_vf_msix); if (!num_vf_msix) return -EOPNOTSUPP; if (!msix_vec_count) msix_vec_count = mlx5_get_default_msix_vec_count(dev, pci_num_vf(pf)); sriov = &dev->priv.sriov; id = pci_iov_vf_id(vf); if (id < 0 || !sriov->vfs_ctx[id].enabled) return -EINVAL; return mlx5_set_msix_vec_count(dev, id + 1, msix_vec_count); } int mlx5_sriov_attach(struct mlx5_core_dev *dev) { if (!mlx5_core_is_pf(dev) || !pci_num_vf(dev->pdev)) return 0; /* If sriov VFs exist in PCI level, enable them in device level */ return mlx5_device_enable_sriov(dev, pci_num_vf(dev->pdev)); } void mlx5_sriov_detach(struct mlx5_core_dev *dev) { if (!mlx5_core_is_pf(dev)) return; mlx5_device_disable_sriov(dev, pci_num_vf(dev->pdev), false, false); } static u16 mlx5_get_max_vfs(struct mlx5_core_dev *dev) { u16 host_total_vfs; const u32 *out; if (mlx5_core_is_ecpf_esw_manager(dev)) { out = mlx5_esw_query_functions(dev); /* Old FW doesn't support getting total_vfs from esw func * but supports getting it from pci_sriov. */ if (IS_ERR(out)) goto done; host_total_vfs = MLX5_GET(query_esw_functions_out, out, host_params_context.host_total_vfs); kvfree(out); return host_total_vfs; } done: return pci_sriov_get_totalvfs(dev->pdev); } int mlx5_sriov_init(struct mlx5_core_dev *dev) { struct mlx5_core_sriov *sriov = &dev->priv.sriov; struct pci_dev *pdev = dev->pdev; int total_vfs, i; if (!mlx5_core_is_pf(dev)) return 0; total_vfs = pci_sriov_get_totalvfs(pdev); sriov->max_vfs = mlx5_get_max_vfs(dev); sriov->num_vfs = pci_num_vf(pdev); sriov->max_ec_vfs = mlx5_core_ec_sriov_enabled(dev) ? pci_sriov_get_totalvfs(dev->pdev) : 0; sriov->vfs_ctx = kcalloc(total_vfs, sizeof(*sriov->vfs_ctx), GFP_KERNEL); if (!sriov->vfs_ctx) return -ENOMEM; for (i = 0; i < total_vfs; i++) BLOCKING_INIT_NOTIFIER_HEAD(&sriov->vfs_ctx[i].notifier); return 0; } void mlx5_sriov_cleanup(struct mlx5_core_dev *dev) { struct mlx5_core_sriov *sriov = &dev->priv.sriov; if (!mlx5_core_is_pf(dev)) return; kfree(sriov->vfs_ctx); } /** * mlx5_sriov_blocking_notifier_unregister - Unregister a VF from * a notification block chain. * * @mdev: The mlx5 core device. * @vf_id: The VF id. * @nb: The notifier block to be unregistered. */ void mlx5_sriov_blocking_notifier_unregister(struct mlx5_core_dev *mdev, int vf_id, struct notifier_block *nb) { struct mlx5_vf_context *vfs_ctx; struct mlx5_core_sriov *sriov; sriov = &mdev->priv.sriov; if (WARN_ON(vf_id < 0 || vf_id >= sriov->num_vfs)) return; vfs_ctx = &sriov->vfs_ctx[vf_id]; blocking_notifier_chain_unregister(&vfs_ctx->notifier, nb); } EXPORT_SYMBOL(mlx5_sriov_blocking_notifier_unregister); /** * mlx5_sriov_blocking_notifier_register - Register a VF notification * block chain. * * @mdev: The mlx5 core device. * @vf_id: The VF id. * @nb: The notifier block to be called upon the VF events. * * Returns 0 on success or an error code. */ int mlx5_sriov_blocking_notifier_register(struct mlx5_core_dev *mdev, int vf_id, struct notifier_block *nb) { struct mlx5_vf_context *vfs_ctx; struct mlx5_core_sriov *sriov; sriov = &mdev->priv.sriov; if (vf_id < 0 || vf_id >= sriov->num_vfs) return -EINVAL; vfs_ctx = &sriov->vfs_ctx[vf_id]; return blocking_notifier_chain_register(&vfs_ctx->notifier, nb); } EXPORT_SYMBOL(mlx5_sriov_blocking_notifier_register);