123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256 |
- /*
- This file is provided under a dual BSD/GPLv2 license. When using or
- redistributing this file, you may do so under either license.
- GPL LICENSE SUMMARY
- Copyright(c) 2014 Intel Corporation.
- This program is free software; you can redistribute it and/or modify
- it under the terms of version 2 of the GNU General Public License as
- published by the Free Software Foundation.
- This program is distributed in the hope that it will be useful, but
- WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- General Public License for more details.
- Contact Information:
- qat-linux@intel.com
- BSD LICENSE
- Copyright(c) 2014 Intel Corporation.
- Redistribution and use in source and binary forms, with or without
- modification, are permitted provided that the following conditions
- are met:
- * Redistributions of source code must retain the above copyright
- notice, this list of conditions and the following disclaimer.
- * Redistributions in binary form must reproduce the above copyright
- notice, this list of conditions and the following disclaimer in
- the documentation and/or other materials provided with the
- distribution.
- * Neither the name of Intel Corporation nor the names of its
- contributors may be used to endorse or promote products derived
- from this software without specific prior written permission.
- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
- "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
- LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
- A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
- OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- */
- #include <linux/kernel.h>
- #include <linux/pci.h>
- #include <linux/aer.h>
- #include <linux/completion.h>
- #include <linux/workqueue.h>
- #include <linux/delay.h>
- #include "adf_accel_devices.h"
- #include "adf_common_drv.h"
- static struct workqueue_struct *device_reset_wq;
- static pci_ers_result_t adf_error_detected(struct pci_dev *pdev,
- pci_channel_state_t state)
- {
- struct adf_accel_dev *accel_dev = adf_devmgr_pci_to_accel_dev(pdev);
- dev_info(&pdev->dev, "Acceleration driver hardware error detected.\n");
- if (!accel_dev) {
- dev_err(&pdev->dev, "Can't find acceleration device\n");
- return PCI_ERS_RESULT_DISCONNECT;
- }
- if (state == pci_channel_io_perm_failure) {
- dev_err(&pdev->dev, "Can't recover from device error\n");
- return PCI_ERS_RESULT_DISCONNECT;
- }
- return PCI_ERS_RESULT_NEED_RESET;
- }
- /* reset dev data */
- struct adf_reset_dev_data {
- int mode;
- struct adf_accel_dev *accel_dev;
- struct completion compl;
- struct work_struct reset_work;
- };
- static void adf_dev_restore(struct adf_accel_dev *accel_dev)
- {
- struct pci_dev *pdev = accel_to_pci_dev(accel_dev);
- struct pci_dev *parent = pdev->bus->self;
- uint16_t bridge_ctl = 0;
- if (accel_dev->is_vf)
- return;
- dev_info(&GET_DEV(accel_dev), "Resetting device qat_dev%d\n",
- accel_dev->accel_id);
- if (!parent)
- parent = pdev;
- if (!pci_wait_for_pending_transaction(pdev))
- dev_info(&GET_DEV(accel_dev),
- "Transaction still in progress. Proceeding\n");
- pci_read_config_word(parent, PCI_BRIDGE_CONTROL, &bridge_ctl);
- bridge_ctl |= PCI_BRIDGE_CTL_BUS_RESET;
- pci_write_config_word(parent, PCI_BRIDGE_CONTROL, bridge_ctl);
- msleep(100);
- bridge_ctl &= ~PCI_BRIDGE_CTL_BUS_RESET;
- pci_write_config_word(parent, PCI_BRIDGE_CONTROL, bridge_ctl);
- msleep(100);
- pci_restore_state(pdev);
- pci_save_state(pdev);
- }
- static void adf_device_reset_worker(struct work_struct *work)
- {
- struct adf_reset_dev_data *reset_data =
- container_of(work, struct adf_reset_dev_data, reset_work);
- struct adf_accel_dev *accel_dev = reset_data->accel_dev;
- adf_dev_restarting_notify(accel_dev);
- adf_dev_stop(accel_dev);
- adf_dev_shutdown(accel_dev);
- adf_dev_restore(accel_dev);
- if (adf_dev_init(accel_dev) || adf_dev_start(accel_dev)) {
- /* The device hanged and we can't restart it so stop here */
- dev_err(&GET_DEV(accel_dev), "Restart device failed\n");
- kfree(reset_data);
- WARN(1, "QAT: device restart failed. Device is unusable\n");
- return;
- }
- adf_dev_restarted_notify(accel_dev);
- clear_bit(ADF_STATUS_RESTARTING, &accel_dev->status);
- /* The dev is back alive. Notify the caller if in sync mode */
- if (reset_data->mode == ADF_DEV_RESET_SYNC)
- complete(&reset_data->compl);
- else
- kfree(reset_data);
- }
- static int adf_dev_aer_schedule_reset(struct adf_accel_dev *accel_dev,
- enum adf_dev_reset_mode mode)
- {
- struct adf_reset_dev_data *reset_data;
- if (!adf_dev_started(accel_dev) ||
- test_bit(ADF_STATUS_RESTARTING, &accel_dev->status))
- return 0;
- set_bit(ADF_STATUS_RESTARTING, &accel_dev->status);
- reset_data = kzalloc(sizeof(*reset_data), GFP_ATOMIC);
- if (!reset_data)
- return -ENOMEM;
- reset_data->accel_dev = accel_dev;
- init_completion(&reset_data->compl);
- reset_data->mode = mode;
- INIT_WORK(&reset_data->reset_work, adf_device_reset_worker);
- queue_work(device_reset_wq, &reset_data->reset_work);
- /* If in sync mode wait for the result */
- if (mode == ADF_DEV_RESET_SYNC) {
- int ret = 0;
- /* Maximum device reset time is 10 seconds */
- unsigned long wait_jiffies = msecs_to_jiffies(10000);
- unsigned long timeout = wait_for_completion_timeout(
- &reset_data->compl, wait_jiffies);
- if (!timeout) {
- dev_err(&GET_DEV(accel_dev),
- "Reset device timeout expired\n");
- ret = -EFAULT;
- }
- kfree(reset_data);
- return ret;
- }
- return 0;
- }
- static pci_ers_result_t adf_slot_reset(struct pci_dev *pdev)
- {
- struct adf_accel_dev *accel_dev = adf_devmgr_pci_to_accel_dev(pdev);
- if (!accel_dev) {
- pr_err("QAT: Can't find acceleration device\n");
- return PCI_ERS_RESULT_DISCONNECT;
- }
- pci_cleanup_aer_uncorrect_error_status(pdev);
- if (adf_dev_aer_schedule_reset(accel_dev, ADF_DEV_RESET_SYNC))
- return PCI_ERS_RESULT_DISCONNECT;
- return PCI_ERS_RESULT_RECOVERED;
- }
- static void adf_resume(struct pci_dev *pdev)
- {
- dev_info(&pdev->dev, "Acceleration driver reset completed\n");
- dev_info(&pdev->dev, "Device is up and runnig\n");
- }
- static struct pci_error_handlers adf_err_handler = {
- .error_detected = adf_error_detected,
- .slot_reset = adf_slot_reset,
- .resume = adf_resume,
- };
- /**
- * adf_enable_aer() - Enable Advance Error Reporting for acceleration device
- * @accel_dev: Pointer to acceleration device.
- * @adf: PCI device driver owning the given acceleration device.
- *
- * Function enables PCI Advance Error Reporting for the
- * QAT acceleration device accel_dev.
- * To be used by QAT device specific drivers.
- *
- * Return: 0 on success, error code otherwise.
- */
- int adf_enable_aer(struct adf_accel_dev *accel_dev, struct pci_driver *adf)
- {
- struct pci_dev *pdev = accel_to_pci_dev(accel_dev);
- adf->err_handler = &adf_err_handler;
- pci_enable_pcie_error_reporting(pdev);
- return 0;
- }
- EXPORT_SYMBOL_GPL(adf_enable_aer);
- /**
- * adf_disable_aer() - Enable Advance Error Reporting for acceleration device
- * @accel_dev: Pointer to acceleration device.
- *
- * Function disables PCI Advance Error Reporting for the
- * QAT acceleration device accel_dev.
- * To be used by QAT device specific drivers.
- *
- * Return: void
- */
- void adf_disable_aer(struct adf_accel_dev *accel_dev)
- {
- struct pci_dev *pdev = accel_to_pci_dev(accel_dev);
- pci_disable_pcie_error_reporting(pdev);
- }
- EXPORT_SYMBOL_GPL(adf_disable_aer);
- int adf_init_aer(void)
- {
- device_reset_wq = create_workqueue("qat_device_reset_wq");
- return !device_reset_wq ? -EFAULT : 0;
- }
- void adf_exit_aer(void)
- {
- if (device_reset_wq)
- destroy_workqueue(device_reset_wq);
- device_reset_wq = NULL;
- }
|