[PATCH 6/7]: Revised [PATCH 31/42]: ethernet: add PCI error recovery to ixgb dev driver

From: linas (linas_at_austin.ibm.com)
Date: 11/07/05

  • Next message: Jean-Christian de Rivaz: "Re: NTP broken with 2.6.14"
    Date:	Mon, 7 Nov 2005 15:37:27 -0600
    To: Greg KH <greg@kroah.com>
    
    

    On Mon, Nov 07, 2005 at 01:57:27PM -0600, linas was heard to remark:
    > On Mon, Nov 07, 2005 at 10:27:27AM -0800, Greg KH was heard to remark:
    > > 3) realy strong typing that sparse can detect.

    Replace-Subject: PCI Error Recovery: ixgb network device driver

    Various PCI bus errors can be signaled by newer PCI controllers. This
    patch adds the PCI error recovery callbacks to the intel ten-gigabit
    ethernet ixgb device driver. The patch has been tested, and appears
    to work well.

    Signed-off-by: Linas Vepstas <linas@linas.org>

    --
    Index: linux-2.6.14-mm1/drivers/net/ixgb/ixgb_main.c
    ===================================================================
    --- linux-2.6.14-mm1.orig/drivers/net/ixgb/ixgb_main.c	2005-11-07 13:55:25.431278896 -0600
    +++ linux-2.6.14-mm1/drivers/net/ixgb/ixgb_main.c	2005-11-07 15:02:14.779406268 -0600
    @@ -132,6 +132,16 @@
     static void ixgb_netpoll(struct net_device *dev);
     #endif
     
    +static pers_result_t ixgb_io_error_detected (struct pci_dev *pdev, pci_channel_state_t state);
    +static pers_result_t ixgb_io_slot_reset (struct pci_dev *pdev);
    +static void ixgb_io_resume (struct pci_dev *pdev);
    +
    +static struct pci_error_handlers ixgb_err_handler = {
    +	.error_detected = ixgb_io_error_detected,
    +	.slot_reset = ixgb_io_slot_reset,
    +	.resume = ixgb_io_resume,
    +};
    +
     /* Exported from other modules */
     
     extern void ixgb_check_options(struct ixgb_adapter *adapter);
    @@ -141,6 +151,8 @@
     	.id_table = ixgb_pci_tbl,
     	.probe    = ixgb_probe,
     	.remove   = __devexit_p(ixgb_remove),
    +	.err_handler = &ixgb_err_handler,
    +
     };
     
     MODULE_AUTHOR("Intel Corporation, <linux.nics@intel.com>");
    @@ -1654,8 +1666,16 @@
     	unsigned int i;
     #endif
     
    +#ifdef XXX_CONFIG_IXGB_EEH_RECOVERY
    +	if(unlikely(icr==EEH_IO_ERROR_VALUE(4))) {
    +		if (eeh_slot_is_isolated (adapter->pdev))
    +		// disable_irq_nosync (adapter->pdev->irq);
    +		return IRQ_NONE;      /* Not our interrupt */
    +	}
    +#else
     	if(unlikely(!icr))
     		return IRQ_NONE;  /* Not our interrupt */
    +#endif /* CONFIG_IXGB_EEH_RECOVERY */
     
     	if(unlikely(icr & (IXGB_INT_RXSEQ | IXGB_INT_LSC))) {
     		mod_timer(&adapter->watchdog_timer, jiffies);
    @@ -2125,4 +2145,70 @@
     }
     #endif
     
    +/* -------------- PCI Error Recovery infrastructure ---------------- */
    +/** ixgb_io_error_detected() is called when PCI error is detected */
    +static pers_result_t ixgb_io_error_detected (struct pci_dev *pdev, pci_channel_state_t state)
    +{
    +	struct net_device *netdev = pci_get_drvdata(pdev);
    +	struct ixgb_adapter *adapter = netdev->priv;
    +
    +	if(netif_running(netdev))
    +		ixgb_down(adapter, TRUE);
    +
    +	/* Request a slot reset. */
    +	return PERS_RESULT_NEED_RESET;
    +}
    +
    +/** ixgb_io_slot_reset is called after the pci bus has been reset.
    + *  Restart the card from scratch.
    + *  Implementation resembles the first-half of the
    + *  ixgb_resume routine.
    + */
    +static pers_result_t ixgb_io_slot_reset (struct pci_dev *pdev)
    +{
    +	struct net_device *netdev = pci_get_drvdata(pdev);
    +	struct ixgb_adapter *adapter = netdev->priv;
    +
    +	if(pci_enable_device(pdev)) {
    +		printk(KERN_ERR "ixgb: Cannot re-enable PCI device after reset.\n");
    +		return PERS_RESULT_DISCONNECT;
    +	}
    +	pci_set_master(pdev);
    +
    +	/* Perform card reset only on one instance of the card */
    +	if (0 != PCI_FUNC (pdev->devfn))
    +		return PERS_RESULT_RECOVERED;
    +
    +	ixgb_reset(adapter);
    +
    +	return PERS_RESULT_RECOVERED;
    +}
    +
    +/** ixgb_io_resume is called when the error recovery driver
    + *  tells us that its OK to resume normal operation.
    + *  Implementation resembles the second-half of the
    + *  ixgb_resume routine.
    + */
    +static void ixgb_io_resume (struct pci_dev *pdev)
    +{
    +	struct net_device *netdev = pci_get_drvdata(pdev);
    +	struct ixgb_adapter *adapter = netdev->priv;
    +
    +	if(netif_running(netdev)) {
    +		if(ixgb_up(adapter)) {
    +			printk ("ixgb: can't bring device back up after reset\n");
    +			return;
    +		}
    +	}
    +
    +	netif_device_attach(netdev);
    +	if(netif_running(netdev))
    +		mod_timer(&adapter->watchdog_timer, jiffies);
    +
    +	/* Reading all-ff's from the adapter will completely hose
    +	 * the counts and statistics. So just clear them out */
    +	memset(&adapter->stats, 0, sizeof(struct ixgb_hw_stats));
    +	ixgb_update_stats(adapter);
    +}
    +
     /* ixgb_main.c */
    -
    To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
    the body of a message to majordomo@vger.kernel.org
    More majordomo info at  http://vger.kernel.org/majordomo-info.html
    Please read the FAQ at  http://www.tux.org/lkml/
    

  • Next message: Jean-Christian de Rivaz: "Re: NTP broken with 2.6.14"

    Relevant Pages