sfc: On MCDI timeout, issue an FLR (and mark MCDI to fail-fast) (e283546c) · Commits · 方亚芬 / linux

drivers/net/ethernet/sfc/ef10.c

+11 −1

Original line number	Diff line number	Diff line
		@@ -738,8 +738,11 @@ static int efx_ef10_reset(struct efx_nic *efx, enum reset_type reset_type)
		/* If it was a port reset, trigger reallocation of MC resources.
		* Note that on an MC reset nothing needs to be done now because we'll
		* detect the MC reset later and handle it then.
		* For an FLR, we never get an MC reset event, but the MC has reset all
		* resources assigned to us, so we have to trigger reallocation now.
		*/
		if (reset_type == RESET_TYPE_ALL && !rc)
		if ((reset_type == RESET_TYPE_ALL \|\|
		reset_type == RESET_TYPE_MCDI_TIMEOUT) && !rc)
		efx_ef10_reset_mc_allocations(efx);
		return rc;
		}
		@@ -2141,6 +2144,11 @@ static int efx_ef10_fini_dmaq(struct efx_nic *efx)
		return 0;
		}

		/* Prepare an EF10 NIC for a function-level reset (FLR).
		*
		* Forces the driver's count of active DMA queues (efx->active_queues) to
		* zero. This is installed as the .prepare_flr hook of efx_hunt_a0_nic_type,
		* and efx_reset_down() invokes that hook ahead of efx_stop_all() when the
		* reset method is RESET_TYPE_MCDI_TIMEOUT.
		*
		* NOTE(review): presumably the count is cleared up front because queue flush
		* completions cannot be relied on once MCDI has timed out, so the later
		* teardown would otherwise wait on a count that never drains - confirm
		* against efx_ef10_fini_dmaq().
		*/
		static void efx_ef10_prepare_flr(struct efx_nic *efx)
		{
		atomic_set(&efx->active_queues, 0);
		}

		static bool efx_ef10_filter_equal(const struct efx_filter_spec *left,
		const struct efx_filter_spec *right)
		{
		@@ -3603,6 +3611,8 @@ const struct efx_nic_type efx_hunt_a0_nic_type = {
		.probe_port = efx_mcdi_port_probe,
		.remove_port = efx_mcdi_port_remove,
		.fini_dmaq = efx_ef10_fini_dmaq,
		.prepare_flr = efx_ef10_prepare_flr,
		.finish_flr = efx_port_dummy_op_void,
		.describe_stats = efx_ef10_describe_stats,
		.update_stats = efx_ef10_update_stats,
		.start_stats = efx_mcdi_mac_start_stats,

drivers/net/ethernet/sfc/efx.c

+16 −3

Original line number	Diff line number	Diff line
		@@ -76,6 +76,7 @@ const char *const efx_reset_type_names[] = {
		[RESET_TYPE_RECOVER_OR_ALL] = "RECOVER_OR_ALL",
		[RESET_TYPE_WORLD] = "WORLD",
		[RESET_TYPE_RECOVER_OR_DISABLE] = "RECOVER_OR_DISABLE",
		[RESET_TYPE_MC_BIST] = "MC_BIST",
		[RESET_TYPE_DISABLE] = "DISABLE",
		[RESET_TYPE_TX_WATCHDOG] = "TX_WATCHDOG",
		[RESET_TYPE_INT_ERROR] = "INT_ERROR",
		@@ -83,7 +84,7 @@ const char *const efx_reset_type_names[] = {
		[RESET_TYPE_DMA_ERROR] = "DMA_ERROR",
		[RESET_TYPE_TX_SKIP] = "TX_SKIP",
		[RESET_TYPE_MC_FAILURE] = "MC_FAILURE",
		[RESET_TYPE_MC_BIST] = "MC_BIST",
		[RESET_TYPE_MCDI_TIMEOUT] = "MCDI_TIMEOUT (FLR)",
		};

		/* Reset workqueue. If any NIC has a hardware failure then a reset will be
		@@ -1739,7 +1740,8 @@ static void efx_start_all(struct efx_nic *efx)

		/* Check that it is appropriate to restart the interface. All
		* of these flags are safe to read under just the rtnl lock */
		if (efx->port_enabled \|\| !netif_running(efx->net_dev))
		if (efx->port_enabled \|\| !netif_running(efx->net_dev) \|\|
		efx->reset_pending)
		return;

		efx_start_port(efx);
		@@ -2334,6 +2336,9 @@ void efx_reset_down(struct efx_nic *efx, enum reset_type method)
		{
		EFX_ASSERT_RESET_SERIALISED(efx);

		if (method == RESET_TYPE_MCDI_TIMEOUT)
		efx->type->prepare_flr(efx);

		efx_stop_all(efx);
		efx_disable_interrupts(efx);

		@@ -2354,6 +2359,10 @@ int efx_reset_up(struct efx_nic *efx, enum reset_type method, bool ok)

		EFX_ASSERT_RESET_SERIALISED(efx);

		if (method == RESET_TYPE_MCDI_TIMEOUT)
		efx->type->finish_flr(efx);

		/* Ensure that SRAM is initialised even if we're disabling the device */
		rc = efx->type->init(efx);
		if (rc) {
		netif_err(efx, drv, efx->net_dev, "failed to initialise NIC\n");
		@@ -2417,7 +2426,10 @@ int efx_reset(struct efx_nic *efx, enum reset_type method)
		/* Clear flags for the scopes we covered. We assume the NIC and
		* driver are now quiescent so that there is no race here.
		*/
		if (method < RESET_TYPE_MAX_METHOD)
		efx->reset_pending &= -(1 << (method + 1));
		else /* it doesn't fit into the well-ordered scope hierarchy */
		__clear_bit(method, &efx->reset_pending);

		/* Reinitialise bus-mastering, which may have been turned off before
		* the reset was scheduled. This is still appropriate, even in the
		@@ -2546,6 +2558,7 @@ void efx_schedule_reset(struct efx_nic *efx, enum reset_type type)
		case RESET_TYPE_DISABLE:
		case RESET_TYPE_RECOVER_OR_DISABLE:
		case RESET_TYPE_MC_BIST:
		case RESET_TYPE_MCDI_TIMEOUT:
		method = type;
		netif_dbg(efx, drv, efx->net_dev, "scheduling %s reset\n",
		RESET_TYPE(method));

drivers/net/ethernet/sfc/enum.h

+16 −7

Original line number	Diff line number	Diff line
		@@ -143,6 +143,7 @@ enum efx_loopback_mode {
		* @RESET_TYPE_WORLD: Reset as much as possible
		* @RESET_TYPE_RECOVER_OR_DISABLE: Try to recover. Apply RESET_TYPE_DISABLE if
		* unsuccessful.
		* @RESET_TYPE_MC_BIST: MC entering BIST mode.
		* @RESET_TYPE_DISABLE: Reset datapath, MAC and PHY; leave NIC disabled
		* @RESET_TYPE_TX_WATCHDOG: reset due to TX watchdog
		* @RESET_TYPE_INT_ERROR: reset due to internal error
		@@ -150,14 +151,16 @@ enum efx_loopback_mode {
		* @RESET_TYPE_DMA_ERROR: DMA error
		* @RESET_TYPE_TX_SKIP: hardware completed empty tx descriptors
		* @RESET_TYPE_MC_FAILURE: MC reboot/assertion
		* @RESET_TYPE_MCDI_TIMEOUT: MCDI timeout.
		*/
		enum reset_type {
		RESET_TYPE_INVISIBLE = 0,
		RESET_TYPE_RECOVER_OR_ALL = 1,
		RESET_TYPE_ALL = 2,
		RESET_TYPE_WORLD = 3,
		RESET_TYPE_RECOVER_OR_DISABLE = 4,
		RESET_TYPE_DISABLE = 5,
		RESET_TYPE_INVISIBLE,
		RESET_TYPE_RECOVER_OR_ALL,
		RESET_TYPE_ALL,
		RESET_TYPE_WORLD,
		RESET_TYPE_RECOVER_OR_DISABLE,
		RESET_TYPE_MC_BIST,
		RESET_TYPE_DISABLE,
		RESET_TYPE_MAX_METHOD,
		RESET_TYPE_TX_WATCHDOG,
		RESET_TYPE_INT_ERROR,
		@@ -165,7 +168,13 @@ enum reset_type {
		RESET_TYPE_DMA_ERROR,
		RESET_TYPE_TX_SKIP,
		RESET_TYPE_MC_FAILURE,
		RESET_TYPE_MC_BIST,
		/* RESET_TYPE_MCDI_TIMEOUT is actually a method, not just a reason, but
		* it doesn't fit the scope hierarchy (not well-ordered by inclusion).
		* We encode this by having its enum value be greater than
		* RESET_TYPE_MAX_METHOD. This also prevents issuing it with
		* efx_ioctl_reset.
		*/
		RESET_TYPE_MCDI_TIMEOUT,
		RESET_TYPE_MAX,
		};

drivers/net/ethernet/sfc/falcon.c

+4 −0

Original line number	Diff line number	Diff line
		@@ -2696,6 +2696,8 @@ const struct efx_nic_type falcon_a1_nic_type = {
		.fini_dmaq = efx_farch_fini_dmaq,
		.prepare_flush = falcon_prepare_flush,
		.finish_flush = efx_port_dummy_op_void,
		.prepare_flr = efx_port_dummy_op_void,
		.finish_flr = efx_farch_finish_flr,
		.describe_stats = falcon_describe_nic_stats,
		.update_stats = falcon_update_nic_stats,
		.start_stats = falcon_start_nic_stats,
		@@ -2790,6 +2792,8 @@ const struct efx_nic_type falcon_b0_nic_type = {
		.fini_dmaq = efx_farch_fini_dmaq,
		.prepare_flush = falcon_prepare_flush,
		.finish_flush = efx_port_dummy_op_void,
		.prepare_flr = efx_port_dummy_op_void,
		.finish_flr = efx_farch_finish_flr,
		.describe_stats = falcon_describe_nic_stats,
		.update_stats = falcon_update_nic_stats,
		.start_stats = falcon_start_nic_stats,

drivers/net/ethernet/sfc/farch.c

+22 −0

Original line number	Diff line number	Diff line
		@@ -741,6 +741,28 @@ int efx_farch_fini_dmaq(struct efx_nic *efx)
		return rc;
		}

		/* Reset queue and flush accounting after FLR
		*
		* One possible cause of FLR recovery is that DMA may be failing (e.g. if bus
		* mastering was disabled), in which case we don't receive (RXQ) flush
		* completion events. This means that efx->rxq_flush_outstanding remained at 4
		* after the FLR; also, efx->active_queues was non-zero (as no flush completion
		* events were received, and we didn't go through efx_check_tx_flush_complete()).
		*
		* If we don't fix this up, on the next call to efx_realloc_channels() we won't
		* flush any RX queues because efx->rxq_flush_outstanding is at the limit of 4
		* for batched flush requests; and efx->active_queues gets messed up because
		* we keep incrementing it for the newly initialised queues, but it never went
		* to zero previously. Then we get a timeout every time we try to restart the
		* queues, as the count doesn't go back to zero when we should be flushing the
		* queues.
		*
		* This is the .finish_flr hook for the Falcon NIC types; efx_reset_up() calls
		* that hook before efx->type->init() when the reset method is
		* RESET_TYPE_MCDI_TIMEOUT.
		*/
		void efx_farch_finish_flr(struct efx_nic *efx)
		{
		/* Discard all stale flush/queue accounting left over from before the FLR */
		atomic_set(&efx->rxq_flush_pending, 0);
		atomic_set(&efx->rxq_flush_outstanding, 0);
		atomic_set(&efx->active_queues, 0);
		}


		/**************************************************************************
		*
		* Event queue processing