
[net-next,1/4] gve: Control path for DQO-QPL

Message ID: 20230802213338.2391025-2-rushilg@google.com (mailing list archive)
State: Superseded
Delegated to: Netdev Maintainers
Series: Add QPL mode for DQO descriptor format

Checks

Context Check Description
netdev/series_format success Posting correctly formatted
netdev/tree_selection success Clearly marked for net-next
netdev/fixes_present success Fixes tag not required for -next series
netdev/header_inline success No static functions without inline keyword in header files
netdev/build_32bit fail Errors and warnings before: 1328 this patch: 20
netdev/cc_maintainers warning 3 maintainers not CCed: jesse.brandeburg@intel.com jeroendb@google.com shailend@google.com
netdev/build_clang fail Errors and warnings before: 1354 this patch: 24
netdev/verify_signedoff success Signed-off-by tag matches author and committer
netdev/deprecated_api success None detected
netdev/check_selftest success No net selftest shell script
netdev/verify_fixes success No Fixes tag
netdev/build_allmodconfig_warn fail Errors and warnings before: 1351 this patch: 20
netdev/checkpatch warning WARNING: line length of 87 exceeds 80 columns WARNING: line length of 89 exceeds 80 columns WARNING: line length of 90 exceeds 80 columns
netdev/kdoc success Errors and warnings before: 0 this patch: 0
netdev/source_inline success Was 0 now: 0

Commit Message

Rushil Gupta Aug. 2, 2023, 9:33 p.m. UTC
Add checks, ABI changes and device options to support
QPL mode for DQO in addition to GQI. Also, use the
pages-per-qpl value supplied by the device option to control
the size of the "queue-page-list".

Signed-off-by: Rushil Gupta <rushilg@google.com>
Reviewed-by: Willem de Bruijn <willemb@google.com>
Signed-off-by: Praveen Kaligineedi <pkaligineedi@google.com>
Signed-off-by: Bailey Forrest <bcf@google.com>
---
 drivers/net/ethernet/google/gve/gve.h        | 20 ++++-
 drivers/net/ethernet/google/gve/gve_adminq.c | 93 +++++++++++++++++---
 drivers/net/ethernet/google/gve/gve_adminq.h | 10 +++
 drivers/net/ethernet/google/gve/gve_main.c   | 20 +++--
 4 files changed, 123 insertions(+), 20 deletions(-)

Comments

Jesse Brandeburg Aug. 3, 2023, 1:56 a.m. UTC | #1
On 8/2/2023 2:33 PM, Rushil Gupta wrote:
> Add checks, ABI changes and device options to support
> QPL mode for DQO in addition to GQI. Also, use the
> pages-per-qpl value supplied by the device option to control
> the size of the "queue-page-list".

That is some serious acronym soup there; maybe expand your acronyms upon
first use in the commit message? How are we to know what you mean?


> 
> Signed-off-by: Rushil Gupta <rushilg@google.com>
> Reviewed-by: Willem de Bruijn <willemb@google.com>
> Signed-off-by: Praveen Kaligineedi <pkaligineedi@google.com>
> Signed-off-by: Bailey Forrest <bcf@google.com>
> ---
>  drivers/net/ethernet/google/gve/gve.h        | 20 ++++-
>  drivers/net/ethernet/google/gve/gve_adminq.c | 93 +++++++++++++++++---
>  drivers/net/ethernet/google/gve/gve_adminq.h | 10 +++
>  drivers/net/ethernet/google/gve/gve_main.c   | 20 +++--
>  4 files changed, 123 insertions(+), 20 deletions(-)
> 
> diff --git a/drivers/net/ethernet/google/gve/gve.h b/drivers/net/ethernet/google/gve/gve.h
> index 4b425bf71ede..517a63b60cb9 100644
> --- a/drivers/net/ethernet/google/gve/gve.h
> +++ b/drivers/net/ethernet/google/gve/gve.h
> @@ -51,6 +51,12 @@
>  
>  #define GVE_GQ_TX_MIN_PKT_DESC_BYTES 182
>  
> +#define DQO_QPL_DEFAULT_TX_PAGES 512
> +#define DQO_QPL_DEFAULT_RX_PAGES 2048
> +
> +/* Maximum TSO size supported on DQO */
> +#define GVE_DQO_TX_MAX	0x3FFFF
> +
>  /* Each slot in the desc ring has a 1:1 mapping to a slot in the data ring */
>  struct gve_rx_desc_queue {
>  	struct gve_rx_desc *desc_ring; /* the descriptor ring */
> @@ -531,6 +537,7 @@ enum gve_queue_format {
>  	GVE_GQI_RDA_FORMAT		= 0x1,
>  	GVE_GQI_QPL_FORMAT		= 0x2,
>  	GVE_DQO_RDA_FORMAT		= 0x3,
> +	GVE_DQO_QPL_FORMAT		= 0x4,
>  };
>  
>  struct gve_priv {
> @@ -550,7 +557,8 @@ struct gve_priv {
>  	u16 num_event_counters;
>  	u16 tx_desc_cnt; /* num desc per ring */
>  	u16 rx_desc_cnt; /* num desc per ring */
> -	u16 tx_pages_per_qpl; /* tx buffer length */
> +	u16 tx_pages_per_qpl; /* Suggested number of pages per qpl for TX queues by NIC */
> +	u16 rx_pages_per_qpl; /* Suggested number of pages per qpl for RX queues by NIC */
>  	u16 rx_data_slot_cnt; /* rx buffer length */
>  	u64 max_registered_pages;
>  	u64 num_registered_pages; /* num pages registered with NIC */
> @@ -808,11 +816,17 @@ static inline u32 gve_rx_idx_to_ntfy(struct gve_priv *priv, u32 queue_idx)
>  	return (priv->num_ntfy_blks / 2) + queue_idx;
>  }
>  
> +static inline bool gve_is_qpl(struct gve_priv *priv)
> +{
> +	return priv->queue_format == GVE_GQI_QPL_FORMAT ||
> +		priv->queue_format == GVE_DQO_QPL_FORMAT;
> +}
> +
>  /* Returns the number of tx queue page lists
>   */
>  static inline u32 gve_num_tx_qpls(struct gve_priv *priv)
>  {
> -	if (priv->queue_format != GVE_GQI_QPL_FORMAT)
> +	if (!gve_is_qpl(priv))
>  		return 0;
>  
>  	return priv->tx_cfg.num_queues + priv->num_xdp_queues;
> @@ -832,7 +846,7 @@ static inline u32 gve_num_xdp_qpls(struct gve_priv *priv)
>   */
>  static inline u32 gve_num_rx_qpls(struct gve_priv *priv)
>  {
> -	if (priv->queue_format != GVE_GQI_QPL_FORMAT)
> +	if (!gve_is_qpl(priv))
>  		return 0;
>  
>  	return priv->rx_cfg.num_queues;
> diff --git a/drivers/net/ethernet/google/gve/gve_adminq.c b/drivers/net/ethernet/google/gve/gve_adminq.c
> index 252974202a3f..a16e7cf21911 100644
> --- a/drivers/net/ethernet/google/gve/gve_adminq.c
> +++ b/drivers/net/ethernet/google/gve/gve_adminq.c
> @@ -39,7 +39,8 @@ void gve_parse_device_option(struct gve_priv *priv,
>  			     struct gve_device_option_gqi_rda **dev_op_gqi_rda,
>  			     struct gve_device_option_gqi_qpl **dev_op_gqi_qpl,
>  			     struct gve_device_option_dqo_rda **dev_op_dqo_rda,
> -			     struct gve_device_option_jumbo_frames **dev_op_jumbo_frames)
> +			     struct gve_device_option_jumbo_frames **dev_op_jumbo_frames,
> +			     struct gve_device_option_dqo_qpl **dev_op_dqo_qpl)
>  {
>  	u32 req_feat_mask = be32_to_cpu(option->required_features_mask);
>  	u16 option_length = be16_to_cpu(option->option_length);
> @@ -112,6 +113,22 @@ void gve_parse_device_option(struct gve_priv *priv,
>  		}
>  		*dev_op_dqo_rda = (void *)(option + 1);
>  		break;
> +	case GVE_DEV_OPT_ID_DQO_QPL:
> +		if (option_length < sizeof(**dev_op_dqo_qpl) ||
> +		    req_feat_mask != GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL) {
> +			dev_warn(&priv->pdev->dev, GVE_DEVICE_OPTION_ERROR_FMT,
> +				 "DQO QPL", (int)sizeof(**dev_op_dqo_qpl),
> +				 GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL,
> +				 option_length, req_feat_mask);
> +			break;
> +		}
> +
> +		if (option_length > sizeof(**dev_op_dqo_qpl)) {
> +			dev_warn(&priv->pdev->dev,
> +				 GVE_DEVICE_OPTION_TOO_BIG_FMT, "DQO QPL");
> +		}
> +		*dev_op_dqo_qpl = (void *)(option + 1);
> +		break;
>  	case GVE_DEV_OPT_ID_JUMBO_FRAMES:
>  		if (option_length < sizeof(**dev_op_jumbo_frames) ||
>  		    req_feat_mask != GVE_DEV_OPT_REQ_FEAT_MASK_JUMBO_FRAMES) {
> @@ -146,7 +163,8 @@ gve_process_device_options(struct gve_priv *priv,
>  			   struct gve_device_option_gqi_rda **dev_op_gqi_rda,
>  			   struct gve_device_option_gqi_qpl **dev_op_gqi_qpl,
>  			   struct gve_device_option_dqo_rda **dev_op_dqo_rda,
> -			   struct gve_device_option_jumbo_frames **dev_op_jumbo_frames)
> +			   struct gve_device_option_jumbo_frames **dev_op_jumbo_frames,
> +			   struct gve_device_option_dqo_qpl **dev_op_dqo_qpl)
>  {
>  	const int num_options = be16_to_cpu(descriptor->num_device_options);
>  	struct gve_device_option *dev_opt;
> @@ -166,7 +184,8 @@ gve_process_device_options(struct gve_priv *priv,
>  
>  		gve_parse_device_option(priv, descriptor, dev_opt,
>  					dev_op_gqi_rda, dev_op_gqi_qpl,
> -					dev_op_dqo_rda, dev_op_jumbo_frames);
> +					dev_op_dqo_rda, dev_op_jumbo_frames,
> +					dev_op_dqo_qpl);
>  		dev_opt = next_opt;
>  	}
>  
> @@ -505,12 +524,24 @@ static int gve_adminq_create_tx_queue(struct gve_priv *priv, u32 queue_index)
>  
>  		cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  	} else {
> +		u16 comp_ring_size = 0;
> +		u32 qpl_id = 0;

These stack initializers are useless; you unconditionally overwrite both
values below.
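
A minimal sketch of the requested cleanup, using only the assignments
already present in this hunk (since both branches assign the variables,
the declarations can be left uninitialized):

	u16 comp_ring_size;
	u32 qpl_id;

	if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
		qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
		comp_ring_size = priv->options_dqo_rda.tx_comp_ring_entries;
	} else {
		qpl_id = tx->dqo.qpl->id;
		comp_ring_size = priv->tx_desc_cnt;
	}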

> +
> +		if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> +			qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
> +			comp_ring_size =
> +				priv->options_dqo_rda.tx_comp_ring_entries;
> +		} else {
> +			qpl_id = tx->dqo.qpl->id;
> +			comp_ring_size = priv->tx_desc_cnt;
> +		}
> +		cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  		cmd.create_tx_queue.tx_ring_size =
>  			cpu_to_be16(priv->tx_desc_cnt);
>  		cmd.create_tx_queue.tx_comp_ring_addr =
>  			cpu_to_be64(tx->complq_bus_dqo);
>  		cmd.create_tx_queue.tx_comp_ring_size =
> -			cpu_to_be16(priv->options_dqo_rda.tx_comp_ring_entries);
> +			cpu_to_be16(comp_ring_size);
>  	}
>  
>  	return gve_adminq_issue_cmd(priv, &cmd);
> @@ -555,6 +586,18 @@ static int gve_adminq_create_rx_queue(struct gve_priv *priv, u32 queue_index)
>  		cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  		cmd.create_rx_queue.packet_buffer_size = cpu_to_be16(rx->packet_buffer_size);
>  	} else {
> +		u16 rx_buff_ring_entries = 0;
> +		u32 qpl_id = 0;

same here

> +
> +		if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> +			qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
> +			rx_buff_ring_entries =
> +				priv->options_dqo_rda.rx_buff_ring_entries;
> +		} else {
> +			qpl_id = rx->dqo.qpl->id;
> +			rx_buff_ring_entries = priv->rx_desc_cnt;
> +		}
> +		cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  		cmd.create_rx_queue.rx_ring_size =
>  			cpu_to_be16(priv->rx_desc_cnt);
>  		cmd.create_rx_queue.rx_desc_ring_addr =
> @@ -564,7 +607,7 @@ static int gve_adminq_create_rx_queue(struct gve_priv *priv, u32 queue_index)
>  		cmd.create_rx_queue.packet_buffer_size =
>  			cpu_to_be16(priv->data_buffer_size_dqo);
>  		cmd.create_rx_queue.rx_buff_ring_size =
> -			cpu_to_be16(priv->options_dqo_rda.rx_buff_ring_entries);
> +			cpu_to_be16(rx_buff_ring_entries);
>  		cmd.create_rx_queue.enable_rsc =
>  			!!(priv->dev->features & NETIF_F_LRO);
>  	}
> @@ -675,9 +718,13 @@ gve_set_desc_cnt_dqo(struct gve_priv *priv,
>  		     const struct gve_device_option_dqo_rda *dev_op_dqo_rda)
>  {
>  	priv->tx_desc_cnt = be16_to_cpu(descriptor->tx_queue_entries);
> +	priv->rx_desc_cnt = be16_to_cpu(descriptor->rx_queue_entries);
> +
> +	if (priv->queue_format == GVE_DQO_QPL_FORMAT)
> +		return 0;
> +
>  	priv->options_dqo_rda.tx_comp_ring_entries =
>  		be16_to_cpu(dev_op_dqo_rda->tx_comp_ring_entries);
> -	priv->rx_desc_cnt = be16_to_cpu(descriptor->rx_queue_entries);
>  	priv->options_dqo_rda.rx_buff_ring_entries =
>  		be16_to_cpu(dev_op_dqo_rda->rx_buff_ring_entries);
>  
> @@ -687,7 +734,9 @@ gve_set_desc_cnt_dqo(struct gve_priv *priv,
>  static void gve_enable_supported_features(struct gve_priv *priv,
>  					  u32 supported_features_mask,
>  					  const struct gve_device_option_jumbo_frames
> -						  *dev_op_jumbo_frames)
> +					  *dev_op_jumbo_frames,
> +					  const struct gve_device_option_dqo_qpl
> +					  *dev_op_dqo_qpl)
>  {
>  	/* Before control reaches this point, the page-size-capped max MTU from
>  	 * the gve_device_descriptor field has already been stored in
> @@ -699,6 +748,20 @@ static void gve_enable_supported_features(struct gve_priv *priv,
>  			 "JUMBO FRAMES device option enabled.\n");
>  		priv->dev->max_mtu = be16_to_cpu(dev_op_jumbo_frames->max_mtu);
>  	}
> +
> +	/* Override pages for qpl for DQO-QPL */
> +	if (dev_op_dqo_qpl) {
> +		dev_info(&priv->pdev->dev,
> +			 "DQO QPL device option enabled.\n");

How does this message benefit the user?

> +		priv->tx_pages_per_qpl =
> +			be16_to_cpu(dev_op_dqo_qpl->tx_pages_per_qpl);
> +		priv->rx_pages_per_qpl =
> +			be16_to_cpu(dev_op_dqo_qpl->rx_pages_per_qpl);
> +		if (priv->tx_pages_per_qpl == 0)
> +			priv->tx_pages_per_qpl = DQO_QPL_DEFAULT_TX_PAGES;
> +		if (priv->rx_pages_per_qpl == 0)
> +			priv->rx_pages_per_qpl = DQO_QPL_DEFAULT_RX_PAGES;
> +	}
>  }
>  
>  int gve_adminq_describe_device(struct gve_priv *priv)
> @@ -707,6 +770,7 @@ int gve_adminq_describe_device(struct gve_priv *priv)
>  	struct gve_device_option_gqi_rda *dev_op_gqi_rda = NULL;
>  	struct gve_device_option_gqi_qpl *dev_op_gqi_qpl = NULL;
>  	struct gve_device_option_dqo_rda *dev_op_dqo_rda = NULL;
> +	struct gve_device_option_dqo_qpl *dev_op_dqo_qpl = NULL;
>  	struct gve_device_descriptor *descriptor;
>  	u32 supported_features_mask = 0;
>  	union gve_adminq_command cmd;
> @@ -733,13 +797,14 @@ int gve_adminq_describe_device(struct gve_priv *priv)
>  
>  	err = gve_process_device_options(priv, descriptor, &dev_op_gqi_rda,
>  					 &dev_op_gqi_qpl, &dev_op_dqo_rda,
> -					 &dev_op_jumbo_frames);
> +					 &dev_op_jumbo_frames,
> +					 &dev_op_dqo_qpl);
>  	if (err)
>  		goto free_device_descriptor;
>  
>  	/* If the GQI_RAW_ADDRESSING option is not enabled and the queue format
>  	 * is not set to GqiRda, choose the queue format in a priority order:
> -	 * DqoRda, GqiRda, GqiQpl. Use GqiQpl as default.
> +	 * DqoRda, DqoQpl, GqiRda, GqiQpl. Use GqiQpl as default.
>  	 */
>  	if (dev_op_dqo_rda) {
>  		priv->queue_format = GVE_DQO_RDA_FORMAT;
> @@ -747,7 +812,13 @@ int gve_adminq_describe_device(struct gve_priv *priv)
>  			 "Driver is running with DQO RDA queue format.\n");
>  		supported_features_mask =
>  			be32_to_cpu(dev_op_dqo_rda->supported_features_mask);
> -	} else if (dev_op_gqi_rda) {
> +	} else if (dev_op_dqo_qpl) {
> +		priv->queue_format = GVE_DQO_QPL_FORMAT;
> +		dev_info(&priv->pdev->dev,
> +			 "Driver is running with DQO QPL queue format.\n");

I feel like at best these should have been dev_dbg, or at worst just
removed. Messages should always add value for the user if they're printed.
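
For illustration, a dev_dbg() variant would keep the message available
under dynamic debug without printing it by default (a sketch with the
same arguments as the existing dev_info() call):

	dev_dbg(&priv->pdev->dev,
		"Driver is running with DQO QPL queue format.\n");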

> +		supported_features_mask =
> +			be32_to_cpu(dev_op_dqo_qpl->supported_features_mask);
> +	}  else if (dev_op_gqi_rda) {
>  		priv->queue_format = GVE_GQI_RDA_FORMAT;
>  		dev_info(&priv->pdev->dev,
>  			 "Driver is running with GQI RDA queue format.\n");
> @@ -798,7 +869,7 @@ int gve_adminq_describe_device(struct gve_priv *priv)
>  	priv->default_num_queues = be16_to_cpu(descriptor->default_num_queues);
>  
>  	gve_enable_supported_features(priv, supported_features_mask,
> -				      dev_op_jumbo_frames);
> +				      dev_op_jumbo_frames, dev_op_dqo_qpl);
>  
>  free_device_descriptor:
>  	dma_free_coherent(&priv->pdev->dev, PAGE_SIZE, descriptor,
> diff --git a/drivers/net/ethernet/google/gve/gve_adminq.h b/drivers/net/ethernet/google/gve/gve_adminq.h
> index f894beb3deaf..38a22279e863 100644
> --- a/drivers/net/ethernet/google/gve/gve_adminq.h
> +++ b/drivers/net/ethernet/google/gve/gve_adminq.h
> @@ -109,6 +109,14 @@ struct gve_device_option_dqo_rda {
>  
>  static_assert(sizeof(struct gve_device_option_dqo_rda) == 8);
>  
> +struct gve_device_option_dqo_qpl {
> +	__be32 supported_features_mask;
> +	__be16 tx_pages_per_qpl;
> +	__be16 rx_pages_per_qpl;
> +};
> +
> +static_assert(sizeof(struct gve_device_option_dqo_qpl) == 8);
> +
>  struct gve_device_option_jumbo_frames {
>  	__be32 supported_features_mask;
>  	__be16 max_mtu;
> @@ -130,6 +138,7 @@ enum gve_dev_opt_id {
>  	GVE_DEV_OPT_ID_GQI_RDA = 0x2,
>  	GVE_DEV_OPT_ID_GQI_QPL = 0x3,
>  	GVE_DEV_OPT_ID_DQO_RDA = 0x4,
> +	GVE_DEV_OPT_ID_DQO_QPL = 0x7,
>  	GVE_DEV_OPT_ID_JUMBO_FRAMES = 0x8,
>  };
>  
> @@ -139,6 +148,7 @@ enum gve_dev_opt_req_feat_mask {
>  	GVE_DEV_OPT_REQ_FEAT_MASK_GQI_QPL = 0x0,
>  	GVE_DEV_OPT_REQ_FEAT_MASK_DQO_RDA = 0x0,
>  	GVE_DEV_OPT_REQ_FEAT_MASK_JUMBO_FRAMES = 0x0,
> +	GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL = 0x0,


Maybe this makes sense to others, but an enum full of defines where all
values are zero? Why are we even writing code?

>  };
>  
>  enum gve_sup_feature_mask {
> diff --git a/drivers/net/ethernet/google/gve/gve_main.c b/drivers/net/ethernet/google/gve/gve_main.c
> index e6f1711d9be0..b40fafe1460a 100644
> --- a/drivers/net/ethernet/google/gve/gve_main.c
> +++ b/drivers/net/ethernet/google/gve/gve_main.c
> @@ -31,7 +31,6 @@
>  
>  // Minimum amount of time between queue kicks in msec (10 seconds)
>  #define MIN_TX_TIMEOUT_GAP (1000 * 10)
> -#define DQO_TX_MAX	0x3FFFF
>  
>  char gve_driver_name[] = "gve";
>  const char gve_version_str[] = GVE_VERSION;
> @@ -494,7 +493,7 @@ static int gve_setup_device_resources(struct gve_priv *priv)
>  		goto abort_with_stats_report;
>  	}
>  
> -	if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> +	if (!gve_is_gqi(priv)) {
>  		priv->ptype_lut_dqo = kvzalloc(sizeof(*priv->ptype_lut_dqo),
>  					       GFP_KERNEL);
>  		if (!priv->ptype_lut_dqo) {
> @@ -1085,9 +1084,10 @@ static int gve_alloc_qpls(struct gve_priv *priv)
>  	int max_queues = priv->tx_cfg.max_queues + priv->rx_cfg.max_queues;
>  	int start_id;
>  	int i, j;
> +	int page_count;

RCT please
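
RCT is the netdev "reverse Christmas tree" convention: local variable
declarations ordered from the longest line to the shortest. A sketch of
this function's declarations in that order:

	int max_queues = priv->tx_cfg.max_queues + priv->rx_cfg.max_queues;
	int page_count;
	int start_id;
	int i, j;
	int err;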

>  	int err;
>  
> -	if (priv->queue_format != GVE_GQI_QPL_FORMAT)
> +	if (!gve_is_qpl(priv))
>  		return 0;
>  
>  	priv->qpls = kvcalloc(max_queues, sizeof(*priv->qpls), GFP_KERNEL);
> @@ -1095,17 +1095,25 @@ static int gve_alloc_qpls(struct gve_priv *priv)
>  		return -ENOMEM;
>  
>  	start_id = gve_tx_start_qpl_id(priv);
> +	page_count = priv->tx_pages_per_qpl;
>  	for (i = start_id; i < start_id + gve_num_tx_qpls(priv); i++) {
>  		err = gve_alloc_queue_page_list(priv, i,
> -						priv->tx_pages_per_qpl);
> +						page_count);
>  		if (err)
>  			goto free_qpls;
>  	}
>  
>  	start_id = gve_rx_start_qpl_id(priv);
> +
> +	/* For GQI_QPL number of pages allocated have 1:1 relationship with
> +	 * number of descriptors. For DQO, number of pages required are
> +	 * more than descriptors (because of out of order completions).
> +	 */
> +	page_count = priv->queue_format == GVE_GQI_QPL_FORMAT ?
> +		priv->rx_data_slot_cnt : priv->rx_pages_per_qpl;
>  	for (i = start_id; i < start_id + gve_num_rx_qpls(priv); i++) {
>  		err = gve_alloc_queue_page_list(priv, i,
> -						priv->rx_data_slot_cnt);
> +						page_count);
>  		if (err)
>  			goto free_qpls;
>  	}
> @@ -2051,7 +2059,7 @@ static int gve_init_priv(struct gve_priv *priv, bool skip_describe_device)
>  
>  	/* Big TCP is only supported on DQ*/
>  	if (!gve_is_gqi(priv))
> -		netif_set_tso_max_size(priv->dev, DQO_TX_MAX);
> +		netif_set_tso_max_size(priv->dev, GVE_DQO_TX_MAX);
>  
>  	priv->num_registered_pages = 0;
>  	priv->rx_copybreak = GVE_DEFAULT_RX_COPYBREAK;
Simon Horman Aug. 3, 2023, 9:28 a.m. UTC | #2
On Wed, Aug 02, 2023 at 09:33:35PM +0000, Rushil Gupta wrote:

...

Hi Rushil,

> @@ -505,12 +524,24 @@ static int gve_adminq_create_tx_queue(struct gve_priv *priv, u32 queue_index)
>  
>  		cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  	} else {
> +		u16 comp_ring_size = 0;
> +		u32 qpl_id = 0;
> +
> +		if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> +			qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
> +			comp_ring_size =
> +				priv->options_dqo_rda.tx_comp_ring_entries;
> +		} else {
> +			qpl_id = tx->dqo.qpl->id;

The qpl field does not appear to be added to struct gve_tx_ring
until a following patch.
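
For context, the dereference above implies that a later patch in the
series adds a queue page list pointer to the ring's DQO state, roughly
like the sketch below (hypothetical layout; the real field is defined
in that later patch):

	struct gve_tx_ring {
		/* ... existing fields ... */
		struct {
			/* ... existing DQO fields ... */
			struct gve_queue_page_list *qpl; /* QPL for this queue */
		} dqo;
	};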

> +			comp_ring_size = priv->tx_desc_cnt;
> +		}
> +		cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  		cmd.create_tx_queue.tx_ring_size =
>  			cpu_to_be16(priv->tx_desc_cnt);
>  		cmd.create_tx_queue.tx_comp_ring_addr =
>  			cpu_to_be64(tx->complq_bus_dqo);
>  		cmd.create_tx_queue.tx_comp_ring_size =
> -			cpu_to_be16(priv->options_dqo_rda.tx_comp_ring_entries);
> +			cpu_to_be16(comp_ring_size);
>  	}
>  
>  	return gve_adminq_issue_cmd(priv, &cmd);
> @@ -555,6 +586,18 @@ static int gve_adminq_create_rx_queue(struct gve_priv *priv, u32 queue_index)
>  		cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  		cmd.create_rx_queue.packet_buffer_size = cpu_to_be16(rx->packet_buffer_size);
>  	} else {
> +		u16 rx_buff_ring_entries = 0;
> +		u32 qpl_id = 0;
> +
> +		if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> +			qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
> +			rx_buff_ring_entries =
> +				priv->options_dqo_rda.rx_buff_ring_entries;
> +		} else {
> +			qpl_id = rx->dqo.qpl->id;

Likewise, the qpl field does not appear to be added to struct gve_rx_ring
until a following patch.

> +			rx_buff_ring_entries = priv->rx_desc_cnt;
> +		}
> +		cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
>  		cmd.create_rx_queue.rx_ring_size =
>  			cpu_to_be16(priv->rx_desc_cnt);
>  		cmd.create_rx_queue.rx_desc_ring_addr =

...
Rushil Gupta Aug. 3, 2023, 7:18 p.m. UTC | #3
On Wed, Aug 2, 2023 at 6:56 PM Jesse Brandeburg
<jesse.brandeburg@intel.com> wrote:
>
> On 8/2/2023 2:33 PM, Rushil Gupta wrote:
> > Add checks, ABI changes and device options to support
> > QPL mode for DQO in addition to GQI. Also, use the
> > pages-per-qpl value supplied by the device option to control
> > the size of the "queue-page-list".
>
> That is some serious acronym soup there; maybe expand your acronyms upon
> first use in the commit message? How are we to know what you mean?

I have provided the acronym explanations in the cover letter and .rst files.
However, I agree I should add them to the commit message as well. Will
fix it in v2.
>
>
> >
> > Signed-off-by: Rushil Gupta <rushilg@google.com>
> > Reviewed-by: Willem de Bruijn <willemb@google.com>
> > Signed-off-by: Praveen Kaligineedi <pkaligineedi@google.com>
> > Signed-off-by: Bailey Forrest <bcf@google.com>
> > ---
> >  drivers/net/ethernet/google/gve/gve.h        | 20 ++++-
> >  drivers/net/ethernet/google/gve/gve_adminq.c | 93 +++++++++++++++++---
> >  drivers/net/ethernet/google/gve/gve_adminq.h | 10 +++
> >  drivers/net/ethernet/google/gve/gve_main.c   | 20 +++--
> >  4 files changed, 123 insertions(+), 20 deletions(-)
> >
> > diff --git a/drivers/net/ethernet/google/gve/gve.h b/drivers/net/ethernet/google/gve/gve.h
> > index 4b425bf71ede..517a63b60cb9 100644
> > --- a/drivers/net/ethernet/google/gve/gve.h
> > +++ b/drivers/net/ethernet/google/gve/gve.h
> > @@ -51,6 +51,12 @@
> >
> >  #define GVE_GQ_TX_MIN_PKT_DESC_BYTES 182
> >
> > +#define DQO_QPL_DEFAULT_TX_PAGES 512
> > +#define DQO_QPL_DEFAULT_RX_PAGES 2048
> > +
> > +/* Maximum TSO size supported on DQO */
> > +#define GVE_DQO_TX_MAX       0x3FFFF
> > +
> >  /* Each slot in the desc ring has a 1:1 mapping to a slot in the data ring */
> >  struct gve_rx_desc_queue {
> >       struct gve_rx_desc *desc_ring; /* the descriptor ring */
> > @@ -531,6 +537,7 @@ enum gve_queue_format {
> >       GVE_GQI_RDA_FORMAT              = 0x1,
> >       GVE_GQI_QPL_FORMAT              = 0x2,
> >       GVE_DQO_RDA_FORMAT              = 0x3,
> > +     GVE_DQO_QPL_FORMAT              = 0x4,
> >  };
> >
> >  struct gve_priv {
> > @@ -550,7 +557,8 @@ struct gve_priv {
> >       u16 num_event_counters;
> >       u16 tx_desc_cnt; /* num desc per ring */
> >       u16 rx_desc_cnt; /* num desc per ring */
> > -     u16 tx_pages_per_qpl; /* tx buffer length */
> > +     u16 tx_pages_per_qpl; /* Suggested number of pages per qpl for TX queues by NIC */
> > +     u16 rx_pages_per_qpl; /* Suggested number of pages per qpl for RX queues by NIC */
> >       u16 rx_data_slot_cnt; /* rx buffer length */
> >       u64 max_registered_pages;
> >       u64 num_registered_pages; /* num pages registered with NIC */
> > @@ -808,11 +816,17 @@ static inline u32 gve_rx_idx_to_ntfy(struct gve_priv *priv, u32 queue_idx)
> >       return (priv->num_ntfy_blks / 2) + queue_idx;
> >  }
> >
> > +static inline bool gve_is_qpl(struct gve_priv *priv)
> > +{
> > +     return priv->queue_format == GVE_GQI_QPL_FORMAT ||
> > +             priv->queue_format == GVE_DQO_QPL_FORMAT;
> > +}
> > +
> >  /* Returns the number of tx queue page lists
> >   */
> >  static inline u32 gve_num_tx_qpls(struct gve_priv *priv)
> >  {
> > -     if (priv->queue_format != GVE_GQI_QPL_FORMAT)
> > +     if (!gve_is_qpl(priv))
> >               return 0;
> >
> >       return priv->tx_cfg.num_queues + priv->num_xdp_queues;
> > @@ -832,7 +846,7 @@ static inline u32 gve_num_xdp_qpls(struct gve_priv *priv)
> >   */
> >  static inline u32 gve_num_rx_qpls(struct gve_priv *priv)
> >  {
> > -     if (priv->queue_format != GVE_GQI_QPL_FORMAT)
> > +     if (!gve_is_qpl(priv))
> >               return 0;
> >
> >       return priv->rx_cfg.num_queues;
> > diff --git a/drivers/net/ethernet/google/gve/gve_adminq.c b/drivers/net/ethernet/google/gve/gve_adminq.c
> > index 252974202a3f..a16e7cf21911 100644
> > --- a/drivers/net/ethernet/google/gve/gve_adminq.c
> > +++ b/drivers/net/ethernet/google/gve/gve_adminq.c
> > @@ -39,7 +39,8 @@ void gve_parse_device_option(struct gve_priv *priv,
> >                            struct gve_device_option_gqi_rda **dev_op_gqi_rda,
> >                            struct gve_device_option_gqi_qpl **dev_op_gqi_qpl,
> >                            struct gve_device_option_dqo_rda **dev_op_dqo_rda,
> > -                          struct gve_device_option_jumbo_frames **dev_op_jumbo_frames)
> > +                          struct gve_device_option_jumbo_frames **dev_op_jumbo_frames,
> > +                          struct gve_device_option_dqo_qpl **dev_op_dqo_qpl)
> >  {
> >       u32 req_feat_mask = be32_to_cpu(option->required_features_mask);
> >       u16 option_length = be16_to_cpu(option->option_length);
> > @@ -112,6 +113,22 @@ void gve_parse_device_option(struct gve_priv *priv,
> >               }
> >               *dev_op_dqo_rda = (void *)(option + 1);
> >               break;
> > +     case GVE_DEV_OPT_ID_DQO_QPL:
> > +             if (option_length < sizeof(**dev_op_dqo_qpl) ||
> > +                 req_feat_mask != GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL) {
> > +                     dev_warn(&priv->pdev->dev, GVE_DEVICE_OPTION_ERROR_FMT,
> > +                              "DQO QPL", (int)sizeof(**dev_op_dqo_qpl),
> > +                              GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL,
> > +                              option_length, req_feat_mask);
> > +                     break;
> > +             }
> > +
> > +             if (option_length > sizeof(**dev_op_dqo_qpl)) {
> > +                     dev_warn(&priv->pdev->dev,
> > +                              GVE_DEVICE_OPTION_TOO_BIG_FMT, "DQO QPL");
> > +             }
> > +             *dev_op_dqo_qpl = (void *)(option + 1);
> > +             break;
> >       case GVE_DEV_OPT_ID_JUMBO_FRAMES:
> >               if (option_length < sizeof(**dev_op_jumbo_frames) ||
> >                   req_feat_mask != GVE_DEV_OPT_REQ_FEAT_MASK_JUMBO_FRAMES) {
> > @@ -146,7 +163,8 @@ gve_process_device_options(struct gve_priv *priv,
> >                          struct gve_device_option_gqi_rda **dev_op_gqi_rda,
> >                          struct gve_device_option_gqi_qpl **dev_op_gqi_qpl,
> >                          struct gve_device_option_dqo_rda **dev_op_dqo_rda,
> > -                        struct gve_device_option_jumbo_frames **dev_op_jumbo_frames)
> > +                        struct gve_device_option_jumbo_frames **dev_op_jumbo_frames,
> > +                        struct gve_device_option_dqo_qpl **dev_op_dqo_qpl)
> >  {
> >       const int num_options = be16_to_cpu(descriptor->num_device_options);
> >       struct gve_device_option *dev_opt;
> > @@ -166,7 +184,8 @@ gve_process_device_options(struct gve_priv *priv,
> >
> >               gve_parse_device_option(priv, descriptor, dev_opt,
> >                                       dev_op_gqi_rda, dev_op_gqi_qpl,
> > -                                     dev_op_dqo_rda, dev_op_jumbo_frames);
> > +                                     dev_op_dqo_rda, dev_op_jumbo_frames,
> > +                                     dev_op_dqo_qpl);
> >               dev_opt = next_opt;
> >       }
> >
> > @@ -505,12 +524,24 @@ static int gve_adminq_create_tx_queue(struct gve_priv *priv, u32 queue_index)
> >
> >               cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
> >       } else {
> > +             u16 comp_ring_size = 0;
> > +             u32 qpl_id = 0;
>
> These stack initializers are useless; you unconditionally overwrite both
> values below.
Will fix.
>
> > +
> > +             if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> > +                     qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
> > +                     comp_ring_size =
> > +                             priv->options_dqo_rda.tx_comp_ring_entries;
> > +             } else {
> > +                     qpl_id = tx->dqo.qpl->id;
> > +                     comp_ring_size = priv->tx_desc_cnt;
> > +             }
> > +             cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
> >               cmd.create_tx_queue.tx_ring_size =
> >                       cpu_to_be16(priv->tx_desc_cnt);
> >               cmd.create_tx_queue.tx_comp_ring_addr =
> >                       cpu_to_be64(tx->complq_bus_dqo);
> >               cmd.create_tx_queue.tx_comp_ring_size =
> > -                     cpu_to_be16(priv->options_dqo_rda.tx_comp_ring_entries);
> > +                     cpu_to_be16(comp_ring_size);
> >       }
> >
> >       return gve_adminq_issue_cmd(priv, &cmd);
> > @@ -555,6 +586,18 @@ static int gve_adminq_create_rx_queue(struct gve_priv *priv, u32 queue_index)
> >               cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
> >               cmd.create_rx_queue.packet_buffer_size = cpu_to_be16(rx->packet_buffer_size);
> >       } else {
> > +             u16 rx_buff_ring_entries = 0;
> > +             u32 qpl_id = 0;
>
> same here
Will fix.
>
> > +
> > +             if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> > +                     qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
> > +                     rx_buff_ring_entries =
> > +                             priv->options_dqo_rda.rx_buff_ring_entries;
> > +             } else {
> > +                     qpl_id = rx->dqo.qpl->id;
> > +                     rx_buff_ring_entries = priv->rx_desc_cnt;
> > +             }
> > +             cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
> >               cmd.create_rx_queue.rx_ring_size =
> >                       cpu_to_be16(priv->rx_desc_cnt);
> >               cmd.create_rx_queue.rx_desc_ring_addr =
> > @@ -564,7 +607,7 @@ static int gve_adminq_create_rx_queue(struct gve_priv *priv, u32 queue_index)
> >               cmd.create_rx_queue.packet_buffer_size =
> >                       cpu_to_be16(priv->data_buffer_size_dqo);
> >               cmd.create_rx_queue.rx_buff_ring_size =
> > -                     cpu_to_be16(priv->options_dqo_rda.rx_buff_ring_entries);
> > +                     cpu_to_be16(rx_buff_ring_entries);
> >               cmd.create_rx_queue.enable_rsc =
> >                       !!(priv->dev->features & NETIF_F_LRO);
> >       }
> > @@ -675,9 +718,13 @@ gve_set_desc_cnt_dqo(struct gve_priv *priv,
> >                    const struct gve_device_option_dqo_rda *dev_op_dqo_rda)
> >  {
> >       priv->tx_desc_cnt = be16_to_cpu(descriptor->tx_queue_entries);
> > +     priv->rx_desc_cnt = be16_to_cpu(descriptor->rx_queue_entries);
> > +
> > +     if (priv->queue_format == GVE_DQO_QPL_FORMAT)
> > +             return 0;
> > +
> >       priv->options_dqo_rda.tx_comp_ring_entries =
> >               be16_to_cpu(dev_op_dqo_rda->tx_comp_ring_entries);
> > -     priv->rx_desc_cnt = be16_to_cpu(descriptor->rx_queue_entries);
> >       priv->options_dqo_rda.rx_buff_ring_entries =
> >               be16_to_cpu(dev_op_dqo_rda->rx_buff_ring_entries);
> >
> > @@ -687,7 +734,9 @@ gve_set_desc_cnt_dqo(struct gve_priv *priv,
> >  static void gve_enable_supported_features(struct gve_priv *priv,
> >                                         u32 supported_features_mask,
> >                                         const struct gve_device_option_jumbo_frames
> > -                                               *dev_op_jumbo_frames)
> > +                                       *dev_op_jumbo_frames,
> > +                                       const struct gve_device_option_dqo_qpl
> > +                                       *dev_op_dqo_qpl)
> >  {
> >       /* Before control reaches this point, the page-size-capped max MTU from
> >        * the gve_device_descriptor field has already been stored in
> > @@ -699,6 +748,20 @@ static void gve_enable_supported_features(struct gve_priv *priv,
> >                        "JUMBO FRAMES device option enabled.\n");
> >               priv->dev->max_mtu = be16_to_cpu(dev_op_jumbo_frames->max_mtu);
> >       }
> > +
> > +     /* Override pages for qpl for DQO-QPL */
> > +     if (dev_op_dqo_qpl) {
> > +             dev_info(&priv->pdev->dev,
> > +                      "DQO QPL device option enabled.\n");
>
> How does this message benefit the user?
>
> > +             priv->tx_pages_per_qpl =
> > +                     be16_to_cpu(dev_op_dqo_qpl->tx_pages_per_qpl);
> > +             priv->rx_pages_per_qpl =
> > +                     be16_to_cpu(dev_op_dqo_qpl->rx_pages_per_qpl);
> > +             if (priv->tx_pages_per_qpl == 0)
> > +                     priv->tx_pages_per_qpl = DQO_QPL_DEFAULT_TX_PAGES;
> > +             if (priv->rx_pages_per_qpl == 0)
> > +                     priv->rx_pages_per_qpl = DQO_QPL_DEFAULT_RX_PAGES;
> > +     }
> >  }
> >
> >  int gve_adminq_describe_device(struct gve_priv *priv)
> > @@ -707,6 +770,7 @@ int gve_adminq_describe_device(struct gve_priv *priv)
> >       struct gve_device_option_gqi_rda *dev_op_gqi_rda = NULL;
> >       struct gve_device_option_gqi_qpl *dev_op_gqi_qpl = NULL;
> >       struct gve_device_option_dqo_rda *dev_op_dqo_rda = NULL;
> > +     struct gve_device_option_dqo_qpl *dev_op_dqo_qpl = NULL;
> >       struct gve_device_descriptor *descriptor;
> >       u32 supported_features_mask = 0;
> >       union gve_adminq_command cmd;
> > @@ -733,13 +797,14 @@ int gve_adminq_describe_device(struct gve_priv *priv)
> >
> >       err = gve_process_device_options(priv, descriptor, &dev_op_gqi_rda,
> >                                        &dev_op_gqi_qpl, &dev_op_dqo_rda,
> > -                                      &dev_op_jumbo_frames);
> > +                                      &dev_op_jumbo_frames,
> > +                                      &dev_op_dqo_qpl);
> >       if (err)
> >               goto free_device_descriptor;
> >
> >       /* If the GQI_RAW_ADDRESSING option is not enabled and the queue format
> >        * is not set to GqiRda, choose the queue format in a priority order:
> > -      * DqoRda, GqiRda, GqiQpl. Use GqiQpl as default.
> > +      * DqoRda, DqoQpl, GqiRda, GqiQpl. Use GqiQpl as default.
> >        */
> >       if (dev_op_dqo_rda) {
> >               priv->queue_format = GVE_DQO_RDA_FORMAT;
> > @@ -747,7 +812,13 @@ int gve_adminq_describe_device(struct gve_priv *priv)
> >                        "Driver is running with DQO RDA queue format.\n");
> >               supported_features_mask =
> >                       be32_to_cpu(dev_op_dqo_rda->supported_features_mask);
> > -     } else if (dev_op_gqi_rda) {
> > +     } else if (dev_op_dqo_qpl) {
> > +             priv->queue_format = GVE_DQO_QPL_FORMAT;
> > +             dev_info(&priv->pdev->dev,
> > +                      "Driver is running with DQO QPL queue format.\n");
>
> I feel like at best these should have been dev_dbg, or at worst just
> removed. Messages should always add value for the user if they're printed.
This message (and the one you pointed out above) seems to be the
convention in the driver code whenever a new format or device option
is added. But I agree with you in principle that the logging messages
are not adding any value here. Will remove.
>
> > +             supported_features_mask =
> > +                     be32_to_cpu(dev_op_dqo_qpl->supported_features_mask);
> > +     }  else if (dev_op_gqi_rda) {
> >               priv->queue_format = GVE_GQI_RDA_FORMAT;
> >               dev_info(&priv->pdev->dev,
> >                        "Driver is running with GQI RDA queue format.\n");
> > @@ -798,7 +869,7 @@ int gve_adminq_describe_device(struct gve_priv *priv)
> >       priv->default_num_queues = be16_to_cpu(descriptor->default_num_queues);
> >
> >       gve_enable_supported_features(priv, supported_features_mask,
> > -                                   dev_op_jumbo_frames);
> > +                                   dev_op_jumbo_frames, dev_op_dqo_qpl);
> >
> >  free_device_descriptor:
> >       dma_free_coherent(&priv->pdev->dev, PAGE_SIZE, descriptor,
> > diff --git a/drivers/net/ethernet/google/gve/gve_adminq.h b/drivers/net/ethernet/google/gve/gve_adminq.h
> > index f894beb3deaf..38a22279e863 100644
> > --- a/drivers/net/ethernet/google/gve/gve_adminq.h
> > +++ b/drivers/net/ethernet/google/gve/gve_adminq.h
> > @@ -109,6 +109,14 @@ struct gve_device_option_dqo_rda {
> >
> >  static_assert(sizeof(struct gve_device_option_dqo_rda) == 8);
> >
> > +struct gve_device_option_dqo_qpl {
> > +     __be32 supported_features_mask;
> > +     __be16 tx_pages_per_qpl;
> > +     __be16 rx_pages_per_qpl;
> > +};
> > +
> > +static_assert(sizeof(struct gve_device_option_dqo_qpl) == 8);
> > +
> >  struct gve_device_option_jumbo_frames {
> >       __be32 supported_features_mask;
> >       __be16 max_mtu;
> > @@ -130,6 +138,7 @@ enum gve_dev_opt_id {
> >       GVE_DEV_OPT_ID_GQI_RDA = 0x2,
> >       GVE_DEV_OPT_ID_GQI_QPL = 0x3,
> >       GVE_DEV_OPT_ID_DQO_RDA = 0x4,
> > +     GVE_DEV_OPT_ID_DQO_QPL = 0x7,
> >       GVE_DEV_OPT_ID_JUMBO_FRAMES = 0x8,
> >  };
> >
> > @@ -139,6 +148,7 @@ enum gve_dev_opt_req_feat_mask {
> >       GVE_DEV_OPT_REQ_FEAT_MASK_GQI_QPL = 0x0,
> >       GVE_DEV_OPT_REQ_FEAT_MASK_DQO_RDA = 0x0,
> >       GVE_DEV_OPT_REQ_FEAT_MASK_JUMBO_FRAMES = 0x0,
> > +     GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL = 0x0,
>
>
> Maybe this makes sense to others, but an enum full of defines where all
> values are zero? Why are we even writing code?

If there’s a bug that breaks the DQO-QPL feature, we need to set a bug
bit in this mask, GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL. That is why it is
0 to begin with, although I can see why it can be considered useless.
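
In other words, the mask acts as a forward-compatibility gate in
gve_parse_device_option(): the option is accepted only when the
device's req_feat_mask matches the value the driver was built against.
A hypothetical future revision could set a bit, e.g.:

	/* hypothetical: device requires drivers carrying a given fix */
	GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL = 0x1,

and drivers still comparing against 0x0 would then hit the dev_warn()
path and skip the DQO QPL option instead of enabling it incorrectly.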
>
> >  };
> >
> >  enum gve_sup_feature_mask {
> > diff --git a/drivers/net/ethernet/google/gve/gve_main.c b/drivers/net/ethernet/google/gve/gve_main.c
> > index e6f1711d9be0..b40fafe1460a 100644
> > --- a/drivers/net/ethernet/google/gve/gve_main.c
> > +++ b/drivers/net/ethernet/google/gve/gve_main.c
> > @@ -31,7 +31,6 @@
> >
> >  // Minimum amount of time between queue kicks in msec (10 seconds)
> >  #define MIN_TX_TIMEOUT_GAP (1000 * 10)
> > -#define DQO_TX_MAX   0x3FFFF
> >
> >  char gve_driver_name[] = "gve";
> >  const char gve_version_str[] = GVE_VERSION;
> > @@ -494,7 +493,7 @@ static int gve_setup_device_resources(struct gve_priv *priv)
> >               goto abort_with_stats_report;
> >       }
> >
> > -     if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
> > +     if (!gve_is_gqi(priv)) {
> >               priv->ptype_lut_dqo = kvzalloc(sizeof(*priv->ptype_lut_dqo),
> >                                              GFP_KERNEL);
> >               if (!priv->ptype_lut_dqo) {
> > @@ -1085,9 +1084,10 @@ static int gve_alloc_qpls(struct gve_priv *priv)
> >       int max_queues = priv->tx_cfg.max_queues + priv->rx_cfg.max_queues;
> >       int start_id;
> >       int i, j;
> > +     int page_count;
>
> RCT please
>
> >       int err;
> >
> > -     if (priv->queue_format != GVE_GQI_QPL_FORMAT)
> > +     if (!gve_is_qpl(priv))
> >               return 0;
> >
> >       priv->qpls = kvcalloc(max_queues, sizeof(*priv->qpls), GFP_KERNEL);
> > @@ -1095,17 +1095,25 @@ static int gve_alloc_qpls(struct gve_priv *priv)
> >               return -ENOMEM;
> >
> >       start_id = gve_tx_start_qpl_id(priv);
> > +     page_count = priv->tx_pages_per_qpl;
> >       for (i = start_id; i < start_id + gve_num_tx_qpls(priv); i++) {
> >               err = gve_alloc_queue_page_list(priv, i,
> > -                                             priv->tx_pages_per_qpl);
> > +                                             page_count);
> >               if (err)
> >                       goto free_qpls;
> >       }
> >
> >       start_id = gve_rx_start_qpl_id(priv);
> > +
> > +     /* For GQI_QPL number of pages allocated have 1:1 relationship with
> > +      * number of descriptors. For DQO, number of pages required are
> > +      * more than descriptors (because of out of order completions).
> > +      */
> > +     page_count = priv->queue_format == GVE_GQI_QPL_FORMAT ?
> > +             priv->rx_data_slot_cnt : priv->rx_pages_per_qpl;
> >       for (i = start_id; i < start_id + gve_num_rx_qpls(priv); i++) {
> >               err = gve_alloc_queue_page_list(priv, i,
> > -                                             priv->rx_data_slot_cnt);
> > +                                             page_count);
> >               if (err)
> >                       goto free_qpls;
> >       }
> > @@ -2051,7 +2059,7 @@ static int gve_init_priv(struct gve_priv *priv, bool skip_describe_device)
> >
> >       /* Big TCP is only supported on DQ*/
> >       if (!gve_is_gqi(priv))
> > -             netif_set_tso_max_size(priv->dev, DQO_TX_MAX);
> > +             netif_set_tso_max_size(priv->dev, GVE_DQO_TX_MAX);
> >
> >       priv->num_registered_pages = 0;
> >       priv->rx_copybreak = GVE_DEFAULT_RX_COPYBREAK;
>

Patch

diff --git a/drivers/net/ethernet/google/gve/gve.h b/drivers/net/ethernet/google/gve/gve.h
index 4b425bf71ede..517a63b60cb9 100644
--- a/drivers/net/ethernet/google/gve/gve.h
+++ b/drivers/net/ethernet/google/gve/gve.h
@@ -51,6 +51,12 @@ 
 
 #define GVE_GQ_TX_MIN_PKT_DESC_BYTES 182
 
+#define DQO_QPL_DEFAULT_TX_PAGES 512
+#define DQO_QPL_DEFAULT_RX_PAGES 2048
+
+/* Maximum TSO size supported on DQO */
+#define GVE_DQO_TX_MAX	0x3FFFF
+
 /* Each slot in the desc ring has a 1:1 mapping to a slot in the data ring */
 struct gve_rx_desc_queue {
 	struct gve_rx_desc *desc_ring; /* the descriptor ring */
@@ -531,6 +537,7 @@  enum gve_queue_format {
 	GVE_GQI_RDA_FORMAT		= 0x1,
 	GVE_GQI_QPL_FORMAT		= 0x2,
 	GVE_DQO_RDA_FORMAT		= 0x3,
+	GVE_DQO_QPL_FORMAT		= 0x4,
 };
 
 struct gve_priv {
@@ -550,7 +557,8 @@  struct gve_priv {
 	u16 num_event_counters;
 	u16 tx_desc_cnt; /* num desc per ring */
 	u16 rx_desc_cnt; /* num desc per ring */
-	u16 tx_pages_per_qpl; /* tx buffer length */
+	u16 tx_pages_per_qpl; /* Suggested number of pages per qpl for TX queues by NIC */
+	u16 rx_pages_per_qpl; /* Suggested number of pages per qpl for RX queues by NIC */
 	u16 rx_data_slot_cnt; /* rx buffer length */
 	u64 max_registered_pages;
 	u64 num_registered_pages; /* num pages registered with NIC */
@@ -808,11 +816,17 @@  static inline u32 gve_rx_idx_to_ntfy(struct gve_priv *priv, u32 queue_idx)
 	return (priv->num_ntfy_blks / 2) + queue_idx;
 }
 
+static inline bool gve_is_qpl(struct gve_priv *priv)
+{
+	return priv->queue_format == GVE_GQI_QPL_FORMAT ||
+		priv->queue_format == GVE_DQO_QPL_FORMAT;
+}
+
 /* Returns the number of tx queue page lists
  */
 static inline u32 gve_num_tx_qpls(struct gve_priv *priv)
 {
-	if (priv->queue_format != GVE_GQI_QPL_FORMAT)
+	if (!gve_is_qpl(priv))
 		return 0;
 
 	return priv->tx_cfg.num_queues + priv->num_xdp_queues;
@@ -832,7 +846,7 @@  static inline u32 gve_num_xdp_qpls(struct gve_priv *priv)
  */
 static inline u32 gve_num_rx_qpls(struct gve_priv *priv)
 {
-	if (priv->queue_format != GVE_GQI_QPL_FORMAT)
+	if (!gve_is_qpl(priv))
 		return 0;
 
 	return priv->rx_cfg.num_queues;
diff --git a/drivers/net/ethernet/google/gve/gve_adminq.c b/drivers/net/ethernet/google/gve/gve_adminq.c
index 252974202a3f..a16e7cf21911 100644
--- a/drivers/net/ethernet/google/gve/gve_adminq.c
+++ b/drivers/net/ethernet/google/gve/gve_adminq.c
@@ -39,7 +39,8 @@  void gve_parse_device_option(struct gve_priv *priv,
 			     struct gve_device_option_gqi_rda **dev_op_gqi_rda,
 			     struct gve_device_option_gqi_qpl **dev_op_gqi_qpl,
 			     struct gve_device_option_dqo_rda **dev_op_dqo_rda,
-			     struct gve_device_option_jumbo_frames **dev_op_jumbo_frames)
+			     struct gve_device_option_jumbo_frames **dev_op_jumbo_frames,
+			     struct gve_device_option_dqo_qpl **dev_op_dqo_qpl)
 {
 	u32 req_feat_mask = be32_to_cpu(option->required_features_mask);
 	u16 option_length = be16_to_cpu(option->option_length);
@@ -112,6 +113,22 @@  void gve_parse_device_option(struct gve_priv *priv,
 		}
 		*dev_op_dqo_rda = (void *)(option + 1);
 		break;
+	case GVE_DEV_OPT_ID_DQO_QPL:
+		if (option_length < sizeof(**dev_op_dqo_qpl) ||
+		    req_feat_mask != GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL) {
+			dev_warn(&priv->pdev->dev, GVE_DEVICE_OPTION_ERROR_FMT,
+				 "DQO QPL", (int)sizeof(**dev_op_dqo_qpl),
+				 GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL,
+				 option_length, req_feat_mask);
+			break;
+		}
+
+		if (option_length > sizeof(**dev_op_dqo_qpl)) {
+			dev_warn(&priv->pdev->dev,
+				 GVE_DEVICE_OPTION_TOO_BIG_FMT, "DQO QPL");
+		}
+		*dev_op_dqo_qpl = (void *)(option + 1);
+		break;
 	case GVE_DEV_OPT_ID_JUMBO_FRAMES:
 		if (option_length < sizeof(**dev_op_jumbo_frames) ||
 		    req_feat_mask != GVE_DEV_OPT_REQ_FEAT_MASK_JUMBO_FRAMES) {
@@ -146,7 +163,8 @@  gve_process_device_options(struct gve_priv *priv,
 			   struct gve_device_option_gqi_rda **dev_op_gqi_rda,
 			   struct gve_device_option_gqi_qpl **dev_op_gqi_qpl,
 			   struct gve_device_option_dqo_rda **dev_op_dqo_rda,
-			   struct gve_device_option_jumbo_frames **dev_op_jumbo_frames)
+			   struct gve_device_option_jumbo_frames **dev_op_jumbo_frames,
+			   struct gve_device_option_dqo_qpl **dev_op_dqo_qpl)
 {
 	const int num_options = be16_to_cpu(descriptor->num_device_options);
 	struct gve_device_option *dev_opt;
@@ -166,7 +184,8 @@  gve_process_device_options(struct gve_priv *priv,
 
 		gve_parse_device_option(priv, descriptor, dev_opt,
 					dev_op_gqi_rda, dev_op_gqi_qpl,
-					dev_op_dqo_rda, dev_op_jumbo_frames);
+					dev_op_dqo_rda, dev_op_jumbo_frames,
+					dev_op_dqo_qpl);
 		dev_opt = next_opt;
 	}
 
@@ -505,12 +524,24 @@  static int gve_adminq_create_tx_queue(struct gve_priv *priv, u32 queue_index)
 
 		cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
 	} else {
+		u16 comp_ring_size = 0;
+		u32 qpl_id = 0;
+
+		if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
+			qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
+			comp_ring_size =
+				priv->options_dqo_rda.tx_comp_ring_entries;
+		} else {
+			qpl_id = tx->dqo.qpl->id;
+			comp_ring_size = priv->tx_desc_cnt;
+		}
+		cmd.create_tx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
 		cmd.create_tx_queue.tx_ring_size =
 			cpu_to_be16(priv->tx_desc_cnt);
 		cmd.create_tx_queue.tx_comp_ring_addr =
 			cpu_to_be64(tx->complq_bus_dqo);
 		cmd.create_tx_queue.tx_comp_ring_size =
-			cpu_to_be16(priv->options_dqo_rda.tx_comp_ring_entries);
+			cpu_to_be16(comp_ring_size);
 	}
 
 	return gve_adminq_issue_cmd(priv, &cmd);
@@ -555,6 +586,18 @@  static int gve_adminq_create_rx_queue(struct gve_priv *priv, u32 queue_index)
 		cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
 		cmd.create_rx_queue.packet_buffer_size = cpu_to_be16(rx->packet_buffer_size);
 	} else {
+		u16 rx_buff_ring_entries = 0;
+		u32 qpl_id = 0;
+
+		if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
+			qpl_id = GVE_RAW_ADDRESSING_QPL_ID;
+			rx_buff_ring_entries =
+				priv->options_dqo_rda.rx_buff_ring_entries;
+		} else {
+			qpl_id = rx->dqo.qpl->id;
+			rx_buff_ring_entries = priv->rx_desc_cnt;
+		}
+		cmd.create_rx_queue.queue_page_list_id = cpu_to_be32(qpl_id);
 		cmd.create_rx_queue.rx_ring_size =
 			cpu_to_be16(priv->rx_desc_cnt);
 		cmd.create_rx_queue.rx_desc_ring_addr =
@@ -564,7 +607,7 @@  static int gve_adminq_create_rx_queue(struct gve_priv *priv, u32 queue_index)
 		cmd.create_rx_queue.packet_buffer_size =
 			cpu_to_be16(priv->data_buffer_size_dqo);
 		cmd.create_rx_queue.rx_buff_ring_size =
-			cpu_to_be16(priv->options_dqo_rda.rx_buff_ring_entries);
+			cpu_to_be16(rx_buff_ring_entries);
 		cmd.create_rx_queue.enable_rsc =
 			!!(priv->dev->features & NETIF_F_LRO);
 	}
@@ -675,9 +718,13 @@  gve_set_desc_cnt_dqo(struct gve_priv *priv,
 		     const struct gve_device_option_dqo_rda *dev_op_dqo_rda)
 {
 	priv->tx_desc_cnt = be16_to_cpu(descriptor->tx_queue_entries);
+	priv->rx_desc_cnt = be16_to_cpu(descriptor->rx_queue_entries);
+
+	if (priv->queue_format == GVE_DQO_QPL_FORMAT)
+		return 0;
+
 	priv->options_dqo_rda.tx_comp_ring_entries =
 		be16_to_cpu(dev_op_dqo_rda->tx_comp_ring_entries);
-	priv->rx_desc_cnt = be16_to_cpu(descriptor->rx_queue_entries);
 	priv->options_dqo_rda.rx_buff_ring_entries =
 		be16_to_cpu(dev_op_dqo_rda->rx_buff_ring_entries);
 
@@ -687,7 +734,9 @@  gve_set_desc_cnt_dqo(struct gve_priv *priv,
 static void gve_enable_supported_features(struct gve_priv *priv,
 					  u32 supported_features_mask,
 					  const struct gve_device_option_jumbo_frames
-						  *dev_op_jumbo_frames)
+					  *dev_op_jumbo_frames,
+					  const struct gve_device_option_dqo_qpl
+					  *dev_op_dqo_qpl)
 {
 	/* Before control reaches this point, the page-size-capped max MTU from
 	 * the gve_device_descriptor field has already been stored in
@@ -699,6 +748,20 @@  static void gve_enable_supported_features(struct gve_priv *priv,
 			 "JUMBO FRAMES device option enabled.\n");
 		priv->dev->max_mtu = be16_to_cpu(dev_op_jumbo_frames->max_mtu);
 	}
+
+	/* Override pages for qpl for DQO-QPL */
+	if (dev_op_dqo_qpl) {
+		dev_info(&priv->pdev->dev,
+			 "DQO QPL device option enabled.\n");
+		priv->tx_pages_per_qpl =
+			be16_to_cpu(dev_op_dqo_qpl->tx_pages_per_qpl);
+		priv->rx_pages_per_qpl =
+			be16_to_cpu(dev_op_dqo_qpl->rx_pages_per_qpl);
+		if (priv->tx_pages_per_qpl == 0)
+			priv->tx_pages_per_qpl = DQO_QPL_DEFAULT_TX_PAGES;
+		if (priv->rx_pages_per_qpl == 0)
+			priv->rx_pages_per_qpl = DQO_QPL_DEFAULT_RX_PAGES;
+	}
 }
 
 int gve_adminq_describe_device(struct gve_priv *priv)
@@ -707,6 +770,7 @@  int gve_adminq_describe_device(struct gve_priv *priv)
 	struct gve_device_option_gqi_rda *dev_op_gqi_rda = NULL;
 	struct gve_device_option_gqi_qpl *dev_op_gqi_qpl = NULL;
 	struct gve_device_option_dqo_rda *dev_op_dqo_rda = NULL;
+	struct gve_device_option_dqo_qpl *dev_op_dqo_qpl = NULL;
 	struct gve_device_descriptor *descriptor;
 	u32 supported_features_mask = 0;
 	union gve_adminq_command cmd;
@@ -733,13 +797,14 @@  int gve_adminq_describe_device(struct gve_priv *priv)
 
 	err = gve_process_device_options(priv, descriptor, &dev_op_gqi_rda,
 					 &dev_op_gqi_qpl, &dev_op_dqo_rda,
-					 &dev_op_jumbo_frames);
+					 &dev_op_jumbo_frames,
+					 &dev_op_dqo_qpl);
 	if (err)
 		goto free_device_descriptor;
 
 	/* If the GQI_RAW_ADDRESSING option is not enabled and the queue format
 	 * is not set to GqiRda, choose the queue format in a priority order:
-	 * DqoRda, GqiRda, GqiQpl. Use GqiQpl as default.
+	 * DqoRda, DqoQpl, GqiRda, GqiQpl. Use GqiQpl as default.
 	 */
 	if (dev_op_dqo_rda) {
 		priv->queue_format = GVE_DQO_RDA_FORMAT;
@@ -747,7 +812,13 @@  int gve_adminq_describe_device(struct gve_priv *priv)
 			 "Driver is running with DQO RDA queue format.\n");
 		supported_features_mask =
 			be32_to_cpu(dev_op_dqo_rda->supported_features_mask);
-	} else if (dev_op_gqi_rda) {
+	} else if (dev_op_dqo_qpl) {
+		priv->queue_format = GVE_DQO_QPL_FORMAT;
+		dev_info(&priv->pdev->dev,
+			 "Driver is running with DQO QPL queue format.\n");
+		supported_features_mask =
+			be32_to_cpu(dev_op_dqo_qpl->supported_features_mask);
+	}  else if (dev_op_gqi_rda) {
 		priv->queue_format = GVE_GQI_RDA_FORMAT;
 		dev_info(&priv->pdev->dev,
 			 "Driver is running with GQI RDA queue format.\n");
@@ -798,7 +869,7 @@  int gve_adminq_describe_device(struct gve_priv *priv)
 	priv->default_num_queues = be16_to_cpu(descriptor->default_num_queues);
 
 	gve_enable_supported_features(priv, supported_features_mask,
-				      dev_op_jumbo_frames);
+				      dev_op_jumbo_frames, dev_op_dqo_qpl);
 
 free_device_descriptor:
 	dma_free_coherent(&priv->pdev->dev, PAGE_SIZE, descriptor,
diff --git a/drivers/net/ethernet/google/gve/gve_adminq.h b/drivers/net/ethernet/google/gve/gve_adminq.h
index f894beb3deaf..38a22279e863 100644
--- a/drivers/net/ethernet/google/gve/gve_adminq.h
+++ b/drivers/net/ethernet/google/gve/gve_adminq.h
@@ -109,6 +109,14 @@  struct gve_device_option_dqo_rda {
 
 static_assert(sizeof(struct gve_device_option_dqo_rda) == 8);
 
+struct gve_device_option_dqo_qpl {
+	__be32 supported_features_mask;
+	__be16 tx_pages_per_qpl;
+	__be16 rx_pages_per_qpl;
+};
+
+static_assert(sizeof(struct gve_device_option_dqo_qpl) == 8);
+
 struct gve_device_option_jumbo_frames {
 	__be32 supported_features_mask;
 	__be16 max_mtu;
@@ -130,6 +138,7 @@  enum gve_dev_opt_id {
 	GVE_DEV_OPT_ID_GQI_RDA = 0x2,
 	GVE_DEV_OPT_ID_GQI_QPL = 0x3,
 	GVE_DEV_OPT_ID_DQO_RDA = 0x4,
+	GVE_DEV_OPT_ID_DQO_QPL = 0x7,
 	GVE_DEV_OPT_ID_JUMBO_FRAMES = 0x8,
 };
 
@@ -139,6 +148,7 @@  enum gve_dev_opt_req_feat_mask {
 	GVE_DEV_OPT_REQ_FEAT_MASK_GQI_QPL = 0x0,
 	GVE_DEV_OPT_REQ_FEAT_MASK_DQO_RDA = 0x0,
 	GVE_DEV_OPT_REQ_FEAT_MASK_JUMBO_FRAMES = 0x0,
+	GVE_DEV_OPT_REQ_FEAT_MASK_DQO_QPL = 0x0,
 };
 
 enum gve_sup_feature_mask {
diff --git a/drivers/net/ethernet/google/gve/gve_main.c b/drivers/net/ethernet/google/gve/gve_main.c
index e6f1711d9be0..b40fafe1460a 100644
--- a/drivers/net/ethernet/google/gve/gve_main.c
+++ b/drivers/net/ethernet/google/gve/gve_main.c
@@ -31,7 +31,6 @@ 
 
 // Minimum amount of time between queue kicks in msec (10 seconds)
 #define MIN_TX_TIMEOUT_GAP (1000 * 10)
-#define DQO_TX_MAX	0x3FFFF
 
 char gve_driver_name[] = "gve";
 const char gve_version_str[] = GVE_VERSION;
@@ -494,7 +493,7 @@  static int gve_setup_device_resources(struct gve_priv *priv)
 		goto abort_with_stats_report;
 	}
 
-	if (priv->queue_format == GVE_DQO_RDA_FORMAT) {
+	if (!gve_is_gqi(priv)) {
 		priv->ptype_lut_dqo = kvzalloc(sizeof(*priv->ptype_lut_dqo),
 					       GFP_KERNEL);
 		if (!priv->ptype_lut_dqo) {
@@ -1085,9 +1084,10 @@  static int gve_alloc_qpls(struct gve_priv *priv)
 	int max_queues = priv->tx_cfg.max_queues + priv->rx_cfg.max_queues;
 	int start_id;
 	int i, j;
+	int page_count;
 	int err;
 
-	if (priv->queue_format != GVE_GQI_QPL_FORMAT)
+	if (!gve_is_qpl(priv))
 		return 0;
 
 	priv->qpls = kvcalloc(max_queues, sizeof(*priv->qpls), GFP_KERNEL);
@@ -1095,17 +1095,25 @@  static int gve_alloc_qpls(struct gve_priv *priv)
 		return -ENOMEM;
 
 	start_id = gve_tx_start_qpl_id(priv);
+	page_count = priv->tx_pages_per_qpl;
 	for (i = start_id; i < start_id + gve_num_tx_qpls(priv); i++) {
 		err = gve_alloc_queue_page_list(priv, i,
-						priv->tx_pages_per_qpl);
+						page_count);
 		if (err)
 			goto free_qpls;
 	}
 
 	start_id = gve_rx_start_qpl_id(priv);
+
+	/* For GQI_QPL number of pages allocated have 1:1 relationship with
+	 * number of descriptors. For DQO, number of pages required are
+	 * more than descriptors (because of out of order completions).
+	 */
+	page_count = priv->queue_format == GVE_GQI_QPL_FORMAT ?
+		priv->rx_data_slot_cnt : priv->rx_pages_per_qpl;
 	for (i = start_id; i < start_id + gve_num_rx_qpls(priv); i++) {
 		err = gve_alloc_queue_page_list(priv, i,
-						priv->rx_data_slot_cnt);
+						page_count);
 		if (err)
 			goto free_qpls;
 	}
@@ -2051,7 +2059,7 @@  static int gve_init_priv(struct gve_priv *priv, bool skip_describe_device)
 
 	/* Big TCP is only supported on DQ*/
 	if (!gve_is_gqi(priv))
-		netif_set_tso_max_size(priv->dev, DQO_TX_MAX);
+		netif_set_tso_max_size(priv->dev, GVE_DQO_TX_MAX);
 
 	priv->num_registered_pages = 0;
 	priv->rx_copybreak = GVE_DEFAULT_RX_COPYBREAK;