Message ID | 20210514141214.2120-5-shiraz.saleem@intel.com (mailing list archive) |
---|---|
State | Superseded |
Delegated to: | Netdev Maintainers |
Headers | show |
Series | Add Intel Ethernet Protocol Driver for RDMA (irdma) | expand |
Context | Check | Description |
---|---|---|
netdev/cover_letter | success | Link |
netdev/fixes_present | success | Link |
netdev/patch_count | fail | Series longer than 15 patches |
netdev/tree_selection | success | Guessed tree name to be net-next |
netdev/subject_prefix | success | Link |
netdev/cc_maintainers | warning | 2 maintainers not CCed: jesse.brandeburg@intel.com intel-wired-lan@lists.osuosl.org |
netdev/source_inline | success | Was 0 now: 0 |
netdev/verify_signedoff | success | Link |
netdev/module_param | success | Was 0 now: 0 |
netdev/build_32bit | success | Errors and warnings before: 0 this patch: 0 |
netdev/kdoc | success | Errors and warnings before: 0 this patch: 0 |
netdev/verify_fixes | success | Link |
netdev/checkpatch | success | total: 0 errors, 0 warnings, 0 checks, 168 lines checked |
netdev/build_allmodconfig_warn | success | Errors and warnings before: 0 this patch: 0 |
netdev/header_inline | success | Link |
On Fri, May 14, 2021 at 09:11:56AM -0500, Shiraz Saleem wrote: > From: Dave Ertman <david.m.ertman@intel.com> > > Register ice client auxiliary RDMA device on the auxiliary bus per > PCIe device function for the auxiliary driver (irdma) to attach to. > It allows to realize a single RDMA driver (irdma) capable of working with > multiple netdev drivers over multi-generation Intel HW supporting RDMA. > There is no load ordering dependencies between ice and irdma. > > Signed-off-by: Dave Ertman <david.m.ertman@intel.com> > Signed-off-by: Tony Nguyen <anthony.l.nguyen@intel.com> > Signed-off-by: Shiraz Saleem <shiraz.saleem@intel.com> > --- > drivers/net/ethernet/intel/Kconfig | 1 + > drivers/net/ethernet/intel/ice/ice.h | 8 +++- > drivers/net/ethernet/intel/ice/ice_idc.c | 71 ++++++++++++++++++++++++++++++- > drivers/net/ethernet/intel/ice/ice_main.c | 11 ++++- > 4 files changed, 87 insertions(+), 4 deletions(-) > > diff --git a/drivers/net/ethernet/intel/Kconfig b/drivers/net/ethernet/intel/Kconfig > index c1d1556..d8a12da 100644 > --- a/drivers/net/ethernet/intel/Kconfig > +++ b/drivers/net/ethernet/intel/Kconfig > @@ -294,6 +294,7 @@ config ICE > tristate "Intel(R) Ethernet Connection E800 Series Support" > default n > depends on PCI_MSI > + select AUXILIARY_BUS > select DIMLIB > select NET_DEVLINK > select PLDMFW > diff --git a/drivers/net/ethernet/intel/ice/ice.h b/drivers/net/ethernet/intel/ice/ice.h > index 225f8a5..228055e 100644 > --- a/drivers/net/ethernet/intel/ice/ice.h > +++ b/drivers/net/ethernet/intel/ice/ice.h > @@ -34,6 +34,7 @@ > #include <linux/if_bridge.h> > #include <linux/ctype.h> > #include <linux/bpf.h> > +#include <linux/auxiliary_bus.h> > #include <linux/avf/virtchnl.h> > #include <linux/cpu_rmap.h> > #include <linux/dim.h> > @@ -647,6 +648,8 @@ static inline void ice_clear_sriov_cap(struct ice_pf *pf) > void ice_fill_rss_lut(u8 *lut, u16 rss_table_size, u16 rss_size); > int ice_schedule_reset(struct ice_pf *pf, enum ice_reset_req reset); > void ice_print_link_msg(struct ice_vsi *vsi, bool isup); > +int ice_plug_aux_dev(struct ice_pf *pf); > +void ice_unplug_aux_dev(struct ice_pf *pf); > int ice_init_rdma(struct ice_pf *pf); > const char *ice_stat_str(enum ice_status stat_err); > const char *ice_aq_str(enum ice_aq_err aq_err); > @@ -678,8 +681,10 @@ int ice_aq_wait_for_event(struct ice_pf *pf, u16 opcode, unsigned long timeout, > */ > static inline void ice_set_rdma_cap(struct ice_pf *pf) > { > - if (pf->hw.func_caps.common_cap.rdma && pf->num_rdma_msix) > + if (pf->hw.func_caps.common_cap.rdma && pf->num_rdma_msix) { > set_bit(ICE_FLAG_RDMA_ENA, pf->flags); > + ice_plug_aux_dev(pf); > + } > } > > /** > @@ -688,6 +693,7 @@ static inline void ice_set_rdma_cap(struct ice_pf *pf) > */ > static inline void ice_clear_rdma_cap(struct ice_pf *pf) > { > + ice_unplug_aux_dev(pf); > clear_bit(ICE_FLAG_RDMA_ENA, pf->flags); > } > #endif /* _ICE_H_ */ > diff --git a/drivers/net/ethernet/intel/ice/ice_idc.c b/drivers/net/ethernet/intel/ice/ice_idc.c > index ffca0d5..e7bb8f6 100644 > --- a/drivers/net/ethernet/intel/ice/ice_idc.c > +++ b/drivers/net/ethernet/intel/ice/ice_idc.c > @@ -255,6 +255,71 @@ static int ice_reserve_rdma_qvector(struct ice_pf *pf) > } > > /** > + * ice_adev_release - function to be mapped to AUX dev's release op > + * @dev: pointer to device to free > + */ > +static void ice_adev_release(struct device *dev) > +{ > + struct iidc_auxiliary_dev *iadev; > + > + iadev = container_of(dev, struct iidc_auxiliary_dev, adev.dev); > + kfree(iadev); > +} > + > +/** > + * ice_plug_aux_dev - allocate and register AUX device > + * @pf: pointer to pf struct > + */ > +int ice_plug_aux_dev(struct ice_pf *pf) > +{ > + struct iidc_auxiliary_dev *iadev; > + struct auxiliary_device *adev; > + int ret; > + > + iadev = kzalloc(sizeof(*iadev), GFP_KERNEL); > + if (!iadev) > + return -ENOMEM; > + > + adev = &iadev->adev; > + pf->adev = adev; > + iadev->pf = pf; > + > + adev->id = pf->aux_idx; > + adev->dev.release = ice_adev_release; > + adev->dev.parent = &pf->pdev->dev; > + adev->name = IIDC_RDMA_ROCE_NAME; You declared IIDC_RDMA_ROCE_NAME as intel_rdma_roce, so it will create extremely awful device name, something like irdma.intel_rdma_roce.0 I would say that "intel" and "rdma" can be probably dropped. Thanks
> Subject: Re: [PATCH v5 04/22] ice: Register auxiliary device to provide RDMA > > On Fri, May 14, 2021 at 09:11:56AM -0500, Shiraz Saleem wrote: > > From: Dave Ertman <david.m.ertman@intel.com> > > > > Register ice client auxiliary RDMA device on the auxiliary bus per > > PCIe device function for the auxiliary driver (irdma) to attach to. > > It allows to realize a single RDMA driver (irdma) capable of working > > with multiple netdev drivers over multi-generation Intel HW supporting RDMA. > > There is no load ordering dependencies between ice and irdma. > > > > Signed-off-by: Dave Ertman <david.m.ertman@intel.com> > > Signed-off-by: Tony Nguyen <anthony.l.nguyen@intel.com> > > Signed-off-by: Shiraz Saleem <shiraz.saleem@intel.com> > > --- > > drivers/net/ethernet/intel/Kconfig | 1 + > > drivers/net/ethernet/intel/ice/ice.h | 8 +++- > > drivers/net/ethernet/intel/ice/ice_idc.c | 71 > > ++++++++++++++++++++++++++++++- > > drivers/net/ethernet/intel/ice/ice_main.c | 11 ++++- > > 4 files changed, 87 insertions(+), 4 deletions(-) > > > > diff --git a/drivers/net/ethernet/intel/Kconfig > > b/drivers/net/ethernet/intel/Kconfig > > index c1d1556..d8a12da 100644 > > --- a/drivers/net/ethernet/intel/Kconfig > > +++ b/drivers/net/ethernet/intel/Kconfig > > @@ -294,6 +294,7 @@ config ICE > > tristate "Intel(R) Ethernet Connection E800 Series Support" > > default n > > depends on PCI_MSI > > + select AUXILIARY_BUS > > select DIMLIB > > select NET_DEVLINK > > select PLDMFW > > diff --git a/drivers/net/ethernet/intel/ice/ice.h > > b/drivers/net/ethernet/intel/ice/ice.h > > index 225f8a5..228055e 100644 > > --- a/drivers/net/ethernet/intel/ice/ice.h > > +++ b/drivers/net/ethernet/intel/ice/ice.h > > @@ -34,6 +34,7 @@ > > #include <linux/if_bridge.h> > > #include <linux/ctype.h> > > #include <linux/bpf.h> > > +#include <linux/auxiliary_bus.h> > > #include <linux/avf/virtchnl.h> > > #include <linux/cpu_rmap.h> > > #include <linux/dim.h> > > @@ -647,6 +648,8 @@ static inline void ice_clear_sriov_cap(struct > > ice_pf *pf) void ice_fill_rss_lut(u8 *lut, u16 rss_table_size, u16 > > rss_size); int ice_schedule_reset(struct ice_pf *pf, enum > > ice_reset_req reset); void ice_print_link_msg(struct ice_vsi *vsi, > > bool isup); > > +int ice_plug_aux_dev(struct ice_pf *pf); void > > +ice_unplug_aux_dev(struct ice_pf *pf); > > int ice_init_rdma(struct ice_pf *pf); const char *ice_stat_str(enum > > ice_status stat_err); const char *ice_aq_str(enum ice_aq_err aq_err); > > @@ -678,8 +681,10 @@ int ice_aq_wait_for_event(struct ice_pf *pf, u16 > opcode, unsigned long timeout, > > */ > > static inline void ice_set_rdma_cap(struct ice_pf *pf) { > > - if (pf->hw.func_caps.common_cap.rdma && pf->num_rdma_msix) > > + if (pf->hw.func_caps.common_cap.rdma && pf->num_rdma_msix) { > > set_bit(ICE_FLAG_RDMA_ENA, pf->flags); > > + ice_plug_aux_dev(pf); > > + } > > } > > > > /** > > @@ -688,6 +693,7 @@ static inline void ice_set_rdma_cap(struct ice_pf *pf) > > */ > > static inline void ice_clear_rdma_cap(struct ice_pf *pf) { > > + ice_unplug_aux_dev(pf); > > clear_bit(ICE_FLAG_RDMA_ENA, pf->flags); } #endif /* _ICE_H_ */ > > diff --git a/drivers/net/ethernet/intel/ice/ice_idc.c > > b/drivers/net/ethernet/intel/ice/ice_idc.c > > index ffca0d5..e7bb8f6 100644 > > --- a/drivers/net/ethernet/intel/ice/ice_idc.c > > +++ b/drivers/net/ethernet/intel/ice/ice_idc.c > > @@ -255,6 +255,71 @@ static int ice_reserve_rdma_qvector(struct ice_pf > > *pf) } > > > > /** > > + * ice_adev_release - function to be mapped to AUX dev's release op > > + * @dev: pointer to device to free > > + */ > > +static void ice_adev_release(struct device *dev) { > > + struct iidc_auxiliary_dev *iadev; > > + > > + iadev = container_of(dev, struct iidc_auxiliary_dev, adev.dev); > > + kfree(iadev); > > +} > > + > > +/** > > + * ice_plug_aux_dev - allocate and register AUX device > > + * @pf: pointer to pf struct > > + */ > > +int ice_plug_aux_dev(struct ice_pf *pf) { > > + struct iidc_auxiliary_dev *iadev; > > + struct auxiliary_device *adev; > > + int ret; > > + > > + iadev = kzalloc(sizeof(*iadev), GFP_KERNEL); > > + if (!iadev) > > + return -ENOMEM; > > + > > + adev = &iadev->adev; > > + pf->adev = adev; > > + iadev->pf = pf; > > + > > + adev->id = pf->aux_idx; > > + adev->dev.release = ice_adev_release; > > + adev->dev.parent = &pf->pdev->dev; > > + adev->name = IIDC_RDMA_ROCE_NAME; > > You declared IIDC_RDMA_ROCE_NAME as intel_rdma_roce, so it will create > extremely awful device name, something like irdma.intel_rdma_roce.0 It is i40e.intel_rdma_iwarp.0 and ice.intel_rdma_roce.0. > > I would say that "intel" and "rdma" can be probably dropped. > I do not feel strongly about this and am ok with your request. Shiraz
diff --git a/drivers/net/ethernet/intel/Kconfig b/drivers/net/ethernet/intel/Kconfig index c1d1556..d8a12da 100644 --- a/drivers/net/ethernet/intel/Kconfig +++ b/drivers/net/ethernet/intel/Kconfig @@ -294,6 +294,7 @@ config ICE tristate "Intel(R) Ethernet Connection E800 Series Support" default n depends on PCI_MSI + select AUXILIARY_BUS select DIMLIB select NET_DEVLINK select PLDMFW diff --git a/drivers/net/ethernet/intel/ice/ice.h b/drivers/net/ethernet/intel/ice/ice.h index 225f8a5..228055e 100644 --- a/drivers/net/ethernet/intel/ice/ice.h +++ b/drivers/net/ethernet/intel/ice/ice.h @@ -34,6 +34,7 @@ #include <linux/if_bridge.h> #include <linux/ctype.h> #include <linux/bpf.h> +#include <linux/auxiliary_bus.h> #include <linux/avf/virtchnl.h> #include <linux/cpu_rmap.h> #include <linux/dim.h> @@ -647,6 +648,8 @@ static inline void ice_clear_sriov_cap(struct ice_pf *pf) void ice_fill_rss_lut(u8 *lut, u16 rss_table_size, u16 rss_size); int ice_schedule_reset(struct ice_pf *pf, enum ice_reset_req reset); void ice_print_link_msg(struct ice_vsi *vsi, bool isup); +int ice_plug_aux_dev(struct ice_pf *pf); +void ice_unplug_aux_dev(struct ice_pf *pf); int ice_init_rdma(struct ice_pf *pf); const char *ice_stat_str(enum ice_status stat_err); const char *ice_aq_str(enum ice_aq_err aq_err); @@ -678,8 +681,10 @@ int ice_aq_wait_for_event(struct ice_pf *pf, u16 opcode, unsigned long timeout, */ static inline void ice_set_rdma_cap(struct ice_pf *pf) { - if (pf->hw.func_caps.common_cap.rdma && pf->num_rdma_msix) + if (pf->hw.func_caps.common_cap.rdma && pf->num_rdma_msix) { set_bit(ICE_FLAG_RDMA_ENA, pf->flags); + ice_plug_aux_dev(pf); + } } /** @@ -688,6 +693,7 @@ static inline void ice_set_rdma_cap(struct ice_pf *pf) */ static inline void ice_clear_rdma_cap(struct ice_pf *pf) { + ice_unplug_aux_dev(pf); clear_bit(ICE_FLAG_RDMA_ENA, pf->flags); } #endif /* _ICE_H_ */ diff --git a/drivers/net/ethernet/intel/ice/ice_idc.c b/drivers/net/ethernet/intel/ice/ice_idc.c index ffca0d5..e7bb8f6 100644 --- a/drivers/net/ethernet/intel/ice/ice_idc.c +++ b/drivers/net/ethernet/intel/ice/ice_idc.c @@ -255,6 +255,71 @@ static int ice_reserve_rdma_qvector(struct ice_pf *pf) } /** + * ice_adev_release - function to be mapped to AUX dev's release op + * @dev: pointer to device to free + */ +static void ice_adev_release(struct device *dev) +{ + struct iidc_auxiliary_dev *iadev; + + iadev = container_of(dev, struct iidc_auxiliary_dev, adev.dev); + kfree(iadev); +} + +/** + * ice_plug_aux_dev - allocate and register AUX device + * @pf: pointer to pf struct + */ +int ice_plug_aux_dev(struct ice_pf *pf) +{ + struct iidc_auxiliary_dev *iadev; + struct auxiliary_device *adev; + int ret; + + iadev = kzalloc(sizeof(*iadev), GFP_KERNEL); + if (!iadev) + return -ENOMEM; + + adev = &iadev->adev; + pf->adev = adev; + iadev->pf = pf; + + adev->id = pf->aux_idx; + adev->dev.release = ice_adev_release; + adev->dev.parent = &pf->pdev->dev; + adev->name = IIDC_RDMA_ROCE_NAME; + + ret = auxiliary_device_init(adev); + if (ret) { + pf->adev = NULL; + kfree(iadev); + return ret; + } + + ret = auxiliary_device_add(adev); + if (ret) { + pf->adev = NULL; + auxiliary_device_uninit(adev); + return ret; + } + + return 0; +} + +/* ice_unplug_aux_dev - unregister and free AUX device + * @pf: pointer to pf struct + */ +void ice_unplug_aux_dev(struct ice_pf *pf) +{ + if (!pf->adev) + return; + + auxiliary_device_delete(pf->adev); + auxiliary_device_uninit(pf->adev); + pf->adev = NULL; +} + +/** * ice_init_rdma - initializes PF for RDMA use * @pf: ptr to ice_pf */ @@ -265,8 +330,10 @@ int ice_init_rdma(struct ice_pf *pf) /* Reserve vector resources */ ret = ice_reserve_rdma_qvector(pf); - if (ret < 0) + if (ret < 0) { dev_err(dev, "failed to reserve vectors for RDMA\n"); + return ret; + } - return ret; + return ice_plug_aux_dev(pf); } diff --git a/drivers/net/ethernet/intel/ice/ice_main.c b/drivers/net/ethernet/intel/ice/ice_main.c index 9d4570b..254cfc1 100644 --- a/drivers/net/ethernet/intel/ice/ice_main.c +++ b/drivers/net/ethernet/intel/ice/ice_main.c @@ -456,6 +456,8 @@ static void ice_pf_dis_all_vsi(struct ice_pf *pf, bool locked) if (test_bit(ICE_PREPARED_FOR_RESET, pf->state)) return; + ice_unplug_aux_dev(pf); + /* Notify VFs of impending reset */ if (ice_check_sq_alive(hw, &hw->mailboxq)) ice_vc_notify_reset(pf); @@ -2120,6 +2122,8 @@ int ice_schedule_reset(struct ice_pf *pf, enum ice_reset_req reset) return -EBUSY; } + ice_unplug_aux_dev(pf); + switch (reset) { case ICE_RESET_PFR: set_bit(ICE_PFR_REQ, pf->state); @@ -4456,11 +4460,12 @@ static void ice_remove(struct pci_dev *pdev) ice_free_vfs(pf); } - set_bit(ICE_DOWN, pf->state); ice_service_task_stop(pf); ice_aq_cancel_waiting_tasks(pf); + ice_unplug_aux_dev(pf); ida_free(&ice_aux_ida, pf->aux_idx); + set_bit(ICE_DOWN, pf->state); mutex_destroy(&(&pf->hw)->fdir_fltr_lock); ice_deinit_lag(pf); @@ -4616,6 +4621,8 @@ static int __maybe_unused ice_suspend(struct device *dev) */ disabled = ice_service_task_stop(pf); + ice_unplug_aux_dev(pf); + /* Already suspended?, then there is nothing to do */ if (test_and_set_bit(ICE_SUSPENDED, pf->state)) { if (!disabled) @@ -6286,6 +6293,8 @@ static void ice_rebuild(struct ice_pf *pf, enum ice_reset_req reset_type) /* if we get here, reset flow is successful */ clear_bit(ICE_RESET_FAILED, pf->state); + + ice_plug_aux_dev(pf); return; err_vsi_rebuild: