[dpdk-dev] [PATCH v4 4/8] ixgbe: implement device reset on VF

Ananyev, Konstantin konstantin.ananyev at intel.com
Tue Jun 7 12:03:04 CEST 2016



> -----Original Message-----
> From: Tao, Zhe
> Sent: Tuesday, June 07, 2016 7:53 AM
> To: dev at dpdk.org
> Cc: Lu, Wenzhuo; Tao, Zhe; Ananyev, Konstantin; Richardson, Bruce; Chen, Jing D; Liang, Cunming; Wu, Jingjing; Zhang, Helin
> Subject: [PATCH v4 4/8] ixgbe: implement device reset on VF
> 
> Implement the device reset function.
> 1, Add the fake RX/TX functions.
> 2, The reset function tries to stop RX/TX by replacing
>    the RX/TX functions with the fake ones and getting the
>    locks to make sure the regular RX/TX finished.
> 3, After the RX/TX stopped, reset the VF port, and then
>    release the locks and restore the RX/TX functions.
> 
> Signed-off-by: Wenzhuo Lu <wenzhuo.lu at intel.com>
> ---
>  doc/guides/rel_notes/release_16_07.rst |   9 +++
>  drivers/net/ixgbe/ixgbe_ethdev.c       | 108 ++++++++++++++++++++++++++++++++-
>  drivers/net/ixgbe/ixgbe_ethdev.h       |  12 +++-
>  drivers/net/ixgbe/ixgbe_rxtx.c         |  42 ++++++++++++-
>  4 files changed, 168 insertions(+), 3 deletions(-)
> 
> diff --git a/doc/guides/rel_notes/release_16_07.rst b/doc/guides/rel_notes/release_16_07.rst
> index a761e3c..d36c4b1 100644
> --- a/doc/guides/rel_notes/release_16_07.rst
> +++ b/doc/guides/rel_notes/release_16_07.rst
> @@ -53,6 +53,15 @@ New Features
>    VF. To handle this link up/down event, add the mailbox interruption
>    support to receive the message.
> 
> +* **Added device reset support for ixgbe VF.**
> +
> +  Added the device reset API. APP can call this API to reset the VF port
> +  when it's not working.
> +  Based on the mailbox interruption support, when VF reseives the control
> +  message from PF, it means the PF link state changes, VF uses the reset
> +  callback in the message handler to notice the APP. APP need call the device
> +  reset API to reset the VF port.
> +
> 
>  Resolved Issues
>  ---------------
> diff --git a/drivers/net/ixgbe/ixgbe_ethdev.c b/drivers/net/ixgbe/ixgbe_ethdev.c
> index fd2682f..1e3520b 100644
> --- a/drivers/net/ixgbe/ixgbe_ethdev.c
> +++ b/drivers/net/ixgbe/ixgbe_ethdev.c
> @@ -381,6 +381,8 @@ static int ixgbe_dev_udp_tunnel_port_add(struct rte_eth_dev *dev,
>  static int ixgbe_dev_udp_tunnel_port_del(struct rte_eth_dev *dev,
>  					 struct rte_eth_udp_tunnel *udp_tunnel);
> 
> +static int ixgbevf_dev_reset(struct rte_eth_dev *dev);
> +
>  /*
>   * Define VF Stats MACRO for Non "cleared on read" register
>   */
> @@ -586,6 +588,7 @@ static const struct eth_dev_ops ixgbevf_eth_dev_ops = {
>  	.reta_query           = ixgbe_dev_rss_reta_query,
>  	.rss_hash_update      = ixgbe_dev_rss_hash_update,
>  	.rss_hash_conf_get    = ixgbe_dev_rss_hash_conf_get,
> +	.dev_reset            = ixgbevf_dev_reset,
>  };
> 
>  /* store statistics names and its offset in stats structure */
> @@ -4060,7 +4063,8 @@ ixgbevf_dev_start(struct rte_eth_dev *dev)
>  		ETH_VLAN_EXTEND_MASK;
>  	ixgbevf_vlan_offload_set(dev, mask);
> 
> -	ixgbevf_dev_rxtx_start(dev);
> +	if (ixgbevf_dev_rxtx_start(dev))
> +		return -1;
> 
>  	/* check and configure queue intr-vector mapping */
>  	if (dev->data->dev_conf.intr_conf.rxq != 0) {
> @@ -7193,6 +7197,108 @@ static void ixgbevf_mbx_process(struct rte_eth_dev *dev)
>  }
> 
>  static int
> +ixgbevf_dev_reset(struct rte_eth_dev *dev)
> +{
> +	struct ixgbe_hw *hw = IXGBE_DEV_PRIVATE_TO_HW(dev->data->dev_private);
> +	struct ixgbe_adapter *adapter =
> +		(struct ixgbe_adapter *)dev->data->dev_private;
> +	int diag = 0;
> +	uint32_t vteiam;
> +	uint16_t i;
> +	struct ixgbe_rx_queue *rxq;
> +	struct ixgbe_tx_queue *txq;
> +
> +	/* Nothing needs to be done if the device is not started. */
> +	if (!dev->data->dev_started)
> +		return 0;
> +
> +	PMD_DRV_LOG(DEBUG, "Link up/down event detected.");
> +
> +	/**
> +	 * Stop RX/TX by fake functions and locks.
> +	 * Fake functions are used to make RX/TX lock easier.
> +	 */
> +	adapter->rx_backup = dev->rx_pkt_burst;
> +	adapter->tx_backup = dev->tx_pkt_burst;
> +	dev->rx_pkt_burst = ixgbevf_recv_pkts_fake;
> +	dev->tx_pkt_burst = ixgbevf_xmit_pkts_fake;

If you have locking over each queue underneath, why do you still need fake functions?

> +
> +	if (dev->data->rx_queues)
> +		for (i = 0; i < dev->data->nb_rx_queues; i++) {
> +			rxq = dev->data->rx_queues[i];
> +			rte_spinlock_lock(&rxq->rx_lock);
> +		}
> +
> +	if (dev->data->tx_queues)
> +		for (i = 0; i < dev->data->nb_tx_queues; i++) {
> +			txq = dev->data->tx_queues[i];
> +			rte_spinlock_lock(&txq->tx_lock);
> +		}

Probably worth to create a separate function for the lines above:
lock_all_queues(), unlock_all_queues.
But as I sadi in previous mail - I think that code better be in rte_ethdev.

> +
> +	/* Performance VF reset. */
> +	do {
> +		dev->data->dev_started = 0;
> +		ixgbevf_dev_stop(dev);
> +		if (dev->data->dev_conf.intr_conf.lsc == 0)
> +			diag = ixgbe_dev_link_update(dev, 0);
> +		if (diag) {
> +			PMD_INIT_LOG(INFO, "Ixgbe VF reset: "
> +				     "Failed to update link.");
> +		}
> +		rte_delay_ms(1000);
> +
> +		diag = ixgbevf_dev_start(dev);
> +		/*If fail to start the device, need to stop/start it again. */
> +		if (diag) {
> +			PMD_INIT_LOG(ERR, "Ixgbe VF reset: "
> +				     "Failed to start device.");
> +			continue;
> +		}
> +		dev->data->dev_started = 1;
> +		ixgbevf_dev_stats_reset(dev);
> +		if (dev->data->dev_conf.intr_conf.lsc == 0)
> +			diag = ixgbe_dev_link_update(dev, 0);
> +		if (diag) {
> +			PMD_INIT_LOG(INFO, "Ixgbe VF reset: "
> +				     "Failed to update link.");
> +			diag = 0;
> +		}
> +
> +		/**
> +		 * When the PF link is down, there has chance
> +		 * that VF cannot operate its registers. Will
> +		 * check if the registers is written
> +		 * successfully. If not, repeat stop/start until
> +		 * the PF link is up, in other words, until the
> +		 * registers can be written.
> +		 */
> +		vteiam = IXGBE_READ_REG(hw, IXGBE_VTEIAM);
> +	/* Reference ixgbevf_intr_enable when checking */
> +	} while (diag || vteiam != IXGBE_VF_IRQ_ENABLE_MASK);
> +
> +	/**
> +	 * Release the locks for queues.
> +	 * Restore the RX/TX functions.
> +	 */
> +	if (dev->data->rx_queues)
> +		for (i = 0; i < dev->data->nb_rx_queues; i++) {
> +			rxq = dev->data->rx_queues[i];
> +			rte_spinlock_unlock(&rxq->rx_lock);
> +		}
> +
> +	if (dev->data->tx_queues)
> +		for (i = 0; i < dev->data->nb_tx_queues; i++) {
> +			txq = dev->data->tx_queues[i];
> +			rte_spinlock_unlock(&txq->tx_lock);
> +		}
> +
> +	dev->rx_pkt_burst = adapter->rx_backup;
> +	dev->tx_pkt_burst = adapter->tx_backup;
> +
> +	return 0;
> +}
> +
> +static int
>  ixgbevf_dev_interrupt_get_status(struct rte_eth_dev *dev)
>  {
>  	uint32_t eicr;
> diff --git a/drivers/net/ixgbe/ixgbe_ethdev.h b/drivers/net/ixgbe/ixgbe_ethdev.h
> index 701107b..d50fad4 100644
> --- a/drivers/net/ixgbe/ixgbe_ethdev.h
> +++ b/drivers/net/ixgbe/ixgbe_ethdev.h
> @@ -289,6 +289,8 @@ struct ixgbe_adapter {
>  	struct rte_timecounter      systime_tc;
>  	struct rte_timecounter      rx_tstamp_tc;
>  	struct rte_timecounter      tx_tstamp_tc;
> +	eth_rx_burst_t              rx_backup;
> +	eth_tx_burst_t              tx_backup;
>  };
> 
>  #define IXGBE_DEV_PRIVATE_TO_HW(adapter)\
> @@ -377,7 +379,7 @@ int ixgbevf_dev_rx_init(struct rte_eth_dev *dev);
> 
>  void ixgbevf_dev_tx_init(struct rte_eth_dev *dev);
> 
> -void ixgbevf_dev_rxtx_start(struct rte_eth_dev *dev);
> +int ixgbevf_dev_rxtx_start(struct rte_eth_dev *dev);
> 
>  uint16_t ixgbe_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
>  		uint16_t nb_pkts);
> @@ -409,6 +411,14 @@ uint16_t ixgbe_xmit_pkts(void *tx_queue, struct rte_mbuf **tx_pkts,
>  uint16_t ixgbe_xmit_pkts_simple(void *tx_queue, struct rte_mbuf **tx_pkts,
>  		uint16_t nb_pkts);
> 
> +uint16_t ixgbevf_recv_pkts_fake(void *rx_queue,
> +				struct rte_mbuf **rx_pkts,
> +				uint16_t nb_pkts);
> +
> +uint16_t ixgbevf_xmit_pkts_fake(void *tx_queue,
> +				struct rte_mbuf **tx_pkts,
> +				uint16_t nb_pkts);
> +
>  uint16_t ixgbe_xmit_pkts_lock(void *tx_queue,
>  			      struct rte_mbuf **tx_pkts,
>  			      uint16_t nb_pkts);
> diff --git a/drivers/net/ixgbe/ixgbe_rxtx.c b/drivers/net/ixgbe/ixgbe_rxtx.c
> index a45d115..b4e7659 100644
> --- a/drivers/net/ixgbe/ixgbe_rxtx.c
> +++ b/drivers/net/ixgbe/ixgbe_rxtx.c
> @@ -5181,7 +5181,7 @@ ixgbevf_dev_tx_init(struct rte_eth_dev *dev)
>  /*
>   * [VF] Start Transmit and Receive Units.
>   */
> -void __attribute__((cold))
> +int __attribute__((cold))
>  ixgbevf_dev_rxtx_start(struct rte_eth_dev *dev)
>  {
>  	struct ixgbe_hw     *hw;
> @@ -5218,7 +5218,15 @@ ixgbevf_dev_rxtx_start(struct rte_eth_dev *dev)
>  			txdctl = IXGBE_READ_REG(hw, IXGBE_VFTXDCTL(i));
>  		} while (--poll_ms && !(txdctl & IXGBE_TXDCTL_ENABLE));
>  		if (!poll_ms)
> +#ifndef RTE_NEXT_ABI
>  			PMD_INIT_LOG(ERR, "Could not enable Tx Queue %d", i);
> +#else
> +		{
> +			PMD_INIT_LOG(ERR, "Could not enable Tx Queue %d", i);
> +			if (dev->data->dev_conf.txmode.lock_mode)
> +				return -1;
> +		}
> +#endif
>  	}
>  	for (i = 0; i < dev->data->nb_rx_queues; i++) {
> 
> @@ -5235,11 +5243,21 @@ ixgbevf_dev_rxtx_start(struct rte_eth_dev *dev)
>  			rxdctl = IXGBE_READ_REG(hw, IXGBE_VFRXDCTL(i));
>  		} while (--poll_ms && !(rxdctl & IXGBE_RXDCTL_ENABLE));
>  		if (!poll_ms)
> +#ifndef RTE_NEXT_ABI
> +			PMD_INIT_LOG(ERR, "Could not enable Rx Queue %d", i);
> +#else
> +		{
>  			PMD_INIT_LOG(ERR, "Could not enable Rx Queue %d", i);
> +			if (dev->data->dev_conf.rxmode.lock_mode)
> +				return -1;
> +		}
> +#endif


Why the code has to be different here?
Thanks
Konstantin


>  		rte_wmb();
>  		IXGBE_WRITE_REG(hw, IXGBE_VFRDT(i), rxq->nb_rx_desc - 1);
> 
>  	}
> +
> +	return 0;
>  }
> 
>  /* Stubs needed for linkage when CONFIG_RTE_IXGBE_INC_VECTOR is set to 'n' */
> @@ -5290,3 +5308,25 @@ ixgbe_rxq_vec_setup(struct ixgbe_rx_queue __rte_unused *rxq)
>  {
>  	return -1;
>  }
> +
> +/**
> + * A fake function to stop receiption.
> + */
> +uint16_t
> +ixgbevf_recv_pkts_fake(void __rte_unused *rx_queue,
> +		       struct rte_mbuf __rte_unused **rx_pkts,
> +		       uint16_t __rte_unused nb_pkts)
> +{
> +	return 0;
> +}
> +
> +/**
> + * A fake function to stop transmission.
> + */
> +uint16_t
> +ixgbevf_xmit_pkts_fake(void __rte_unused *tx_queue,
> +		       struct rte_mbuf __rte_unused **tx_pkts,
> +		       uint16_t __rte_unused nb_pkts)
> +{
> +	return 0;
> +}
> --
> 2.1.4



More information about the dev mailing list