diff options
Diffstat (limited to 'include/rdma')
| -rw-r--r-- | include/rdma/ib_cm.h | 32 | ||||
| -rw-r--r-- | include/rdma/ib_mad.h | 40 | ||||
| -rw-r--r-- | include/rdma/ib_umem.h | 4 | ||||
| -rw-r--r-- | include/rdma/ib_umem_odp.h | 86 | ||||
| -rw-r--r-- | include/rdma/ib_verbs.h | 81 | ||||
| -rw-r--r-- | include/rdma/restrack.h | 5 | 
6 files changed, 85 insertions, 163 deletions
| diff --git a/include/rdma/ib_cm.h b/include/rdma/ib_cm.h index 49f4f75499b3..b01a8a8d4de9 100644 --- a/include/rdma/ib_cm.h +++ b/include/rdma/ib_cm.h @@ -1,38 +1,12 @@ +/* SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB */  /*   * Copyright (c) 2004, 2005 Intel Corporation.  All rights reserved.   * Copyright (c) 2004 Topspin Corporation.  All rights reserved.   * Copyright (c) 2004 Voltaire Corporation.  All rights reserved.   * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved. - * - * This software is available to you under a choice of one of two - * licenses.  You may choose to be licensed under the terms of the GNU - * General Public License (GPL) Version 2, available from the file - * COPYING in the main directory of this source tree, or the - * OpenIB.org BSD license below: - * - *     Redistribution and use in source and binary forms, with or - *     without modification, are permitted provided that the following - *     conditions are met: - * - *      - Redistributions of source code must retain the above - *        copyright notice, this list of conditions and the following - *        disclaimer. - * - *      - Redistributions in binary form must reproduce the above - *        copyright notice, this list of conditions and the following - *        disclaimer in the documentation and/or other materials - *        provided with the distribution. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF - * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS - * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN - * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN - * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE - * SOFTWARE. + * Copyright (c) 2019, Mellanox Technologies inc.  All rights reserved.   */ -#if !defined(IB_CM_H) +#ifndef IB_CM_H  #define IB_CM_H  #include <rdma/ib_mad.h> diff --git a/include/rdma/ib_mad.h b/include/rdma/ib_mad.h index eea946fcc819..4e62650e2127 100644 --- a/include/rdma/ib_mad.h +++ b/include/rdma/ib_mad.h @@ -815,46 +815,6 @@ int ib_modify_mad(struct ib_mad_agent *mad_agent,  		  struct ib_mad_send_buf *send_buf, u32 timeout_ms);  /** - * ib_redirect_mad_qp - Registers a QP for MAD services. - * @qp: Reference to a QP that requires MAD services. - * @rmpp_version: If set, indicates that the client will send - *   and receive MADs that contain the RMPP header for the given version. - *   If set to 0, indicates that RMPP is not used by this client. - * @send_handler: The completion callback routine invoked after a send - *   request has completed. - * @recv_handler: The completion callback routine invoked for a received - *   MAD. - * @context: User specified context associated with the registration. - * - * Use of this call allows clients to use MAD services, such as RMPP, - * on user-owned QPs.  After calling this routine, users may send - * MADs on the specified QP by calling ib_mad_post_send. - */ -struct ib_mad_agent *ib_redirect_mad_qp(struct ib_qp *qp, -					u8 rmpp_version, -					ib_mad_send_handler send_handler, -					ib_mad_recv_handler recv_handler, -					void *context); - -/** - * ib_process_mad_wc - Processes a work completion associated with a - *   MAD sent or received on a redirected QP. - * @mad_agent: Specifies the registered MAD service using the redirected QP. - * @wc: References a work completion associated with a sent or received - *   MAD segment. - * - * This routine is used to complete or continue processing on a MAD request. - * If the work completion is associated with a send operation, calling - * this routine is required to continue an RMPP transfer or to wait for a - * corresponding response, if it is a request.  If the work completion is - * associated with a receive operation, calling this routine is required to - * process an inbound or outbound RMPP transfer, or to match a response MAD - * with its corresponding request. - */ -int ib_process_mad_wc(struct ib_mad_agent *mad_agent, -		      struct ib_wc *wc); - -/**   * ib_create_send_mad - Allocate and initialize a data buffer and work request   *   for sending a MAD.   * @mad_agent: Specifies the registered MAD service to associate with the MAD. diff --git a/include/rdma/ib_umem.h b/include/rdma/ib_umem.h index a91b2af64ec4..753f54e17e0a 100644 --- a/include/rdma/ib_umem.h +++ b/include/rdma/ib_umem.h @@ -70,7 +70,7 @@ static inline size_t ib_umem_num_pages(struct ib_umem *umem)  #ifdef CONFIG_INFINIBAND_USER_MEM  struct ib_umem *ib_umem_get(struct ib_udata *udata, unsigned long addr, -			    size_t size, int access, int dmasync); +			    size_t size, int access);  void ib_umem_release(struct ib_umem *umem);  int ib_umem_page_count(struct ib_umem *umem);  int ib_umem_copy_from(void *dst, struct ib_umem *umem, size_t offset, @@ -85,7 +85,7 @@ unsigned long ib_umem_find_best_pgsz(struct ib_umem *umem,  static inline struct ib_umem *ib_umem_get(struct ib_udata *udata,  					  unsigned long addr, size_t size, -					  int access, int dmasync) +					  int access)  {  	return ERR_PTR(-EINVAL);  } diff --git a/include/rdma/ib_umem_odp.h b/include/rdma/ib_umem_odp.h index 253df1a1fa54..81429acc8257 100644 --- a/include/rdma/ib_umem_odp.h +++ b/include/rdma/ib_umem_odp.h @@ -35,11 +35,11 @@  #include <rdma/ib_umem.h>  #include <rdma/ib_verbs.h> -#include <linux/interval_tree.h>  struct ib_umem_odp {  	struct ib_umem umem; -	struct ib_ucontext_per_mm *per_mm; +	struct mmu_interval_notifier notifier; +	struct pid *tgid;  	/*  	 * An array of the pages included in the on-demand paging umem. @@ -62,13 +62,8 @@ struct ib_umem_odp {  	struct mutex		umem_mutex;  	void			*private; /* for the HW driver to use. */ -	int notifiers_seq; -	int notifiers_count;  	int npages; -	/* Tree tracking */ -	struct interval_tree_node interval_tree; -  	/*  	 * An implicit odp umem cannot be DMA mapped, has 0 length, and serves  	 * only as an anchor for the driver to hold onto the per_mm. FIXME: @@ -77,10 +72,7 @@ struct ib_umem_odp {  	 */  	bool is_implicit_odp; -	struct completion	notifier_completion; -	int			dying;  	unsigned int		page_shift; -	struct work_struct	work;  };  static inline struct ib_umem_odp *to_ib_umem_odp(struct ib_umem *umem) @@ -91,13 +83,13 @@ static inline struct ib_umem_odp *to_ib_umem_odp(struct ib_umem *umem)  /* Returns the first page of an ODP umem. */  static inline unsigned long ib_umem_start(struct ib_umem_odp *umem_odp)  { -	return umem_odp->interval_tree.start; +	return umem_odp->notifier.interval_tree.start;  }  /* Returns the address of the page after the last one of an ODP umem. */  static inline unsigned long ib_umem_end(struct ib_umem_odp *umem_odp)  { -	return umem_odp->interval_tree.last + 1; +	return umem_odp->notifier.interval_tree.last + 1;  }  static inline size_t ib_umem_odp_num_pages(struct ib_umem_odp *umem_odp) @@ -121,21 +113,15 @@ static inline size_t ib_umem_odp_num_pages(struct ib_umem_odp *umem_odp)  #ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING -struct ib_ucontext_per_mm { -	struct mmu_notifier mn; -	struct pid *tgid; - -	struct rb_root_cached umem_tree; -	/* Protects umem_tree */ -	struct rw_semaphore umem_rwsem; -}; - -struct ib_umem_odp *ib_umem_odp_get(struct ib_udata *udata, unsigned long addr, -				    size_t size, int access); +struct ib_umem_odp * +ib_umem_odp_get(struct ib_udata *udata, unsigned long addr, size_t size, +		int access, const struct mmu_interval_notifier_ops *ops);  struct ib_umem_odp *ib_umem_odp_alloc_implicit(struct ib_udata *udata,  					       int access); -struct ib_umem_odp *ib_umem_odp_alloc_child(struct ib_umem_odp *root_umem, -					    unsigned long addr, size_t size); +struct ib_umem_odp * +ib_umem_odp_alloc_child(struct ib_umem_odp *root_umem, unsigned long addr, +			size_t size, +			const struct mmu_interval_notifier_ops *ops);  void ib_umem_odp_release(struct ib_umem_odp *umem_odp);  int ib_umem_odp_map_dma_pages(struct ib_umem_odp *umem_odp, u64 start_offset, @@ -145,55 +131,11 @@ int ib_umem_odp_map_dma_pages(struct ib_umem_odp *umem_odp, u64 start_offset,  void ib_umem_odp_unmap_dma_pages(struct ib_umem_odp *umem_odp, u64 start_offset,  				 u64 bound); -typedef int (*umem_call_back)(struct ib_umem_odp *item, u64 start, u64 end, -			      void *cookie); -/* - * Call the callback on each ib_umem in the range. Returns the logical or of - * the return values of the functions called. - */ -int rbt_ib_umem_for_each_in_range(struct rb_root_cached *root, -				  u64 start, u64 end, -				  umem_call_back cb, -				  bool blockable, void *cookie); - -/* - * Find first region intersecting with address range. - * Return NULL if not found - */ -static inline struct ib_umem_odp * -rbt_ib_umem_lookup(struct rb_root_cached *root, u64 addr, u64 length) -{ -	struct interval_tree_node *node; - -	node = interval_tree_iter_first(root, addr, addr + length - 1); -	if (!node) -		return NULL; -	return container_of(node, struct ib_umem_odp, interval_tree); - -} - -static inline int ib_umem_mmu_notifier_retry(struct ib_umem_odp *umem_odp, -					     unsigned long mmu_seq) -{ -	/* -	 * This code is strongly based on the KVM code from -	 * mmu_notifier_retry. Should be called with -	 * the relevant locks taken (umem_odp->umem_mutex -	 * and the ucontext umem_mutex semaphore locked for read). -	 */ - -	if (unlikely(umem_odp->notifiers_count)) -		return 1; -	if (umem_odp->notifiers_seq != mmu_seq) -		return 1; -	return 0; -} -  #else /* CONFIG_INFINIBAND_ON_DEMAND_PAGING */ -static inline struct ib_umem_odp *ib_umem_odp_get(struct ib_udata *udata, -						  unsigned long addr, -						  size_t size, int access) +static inline struct ib_umem_odp * +ib_umem_odp_get(struct ib_udata *udata, unsigned long addr, size_t size, +		int access, const struct mmu_interval_notifier_ops *ops)  {  	return ERR_PTR(-EINVAL);  } diff --git a/include/rdma/ib_verbs.h b/include/rdma/ib_verbs.h index e7e733add99f..cacb48faf670 100644 --- a/include/rdma/ib_verbs.h +++ b/include/rdma/ib_verbs.h @@ -445,6 +445,8 @@ struct ib_device_attr {  	struct ib_tm_caps	tm_caps;  	struct ib_cq_caps       cq_caps;  	u64			max_dm_size; +	/* Max entries for sgl for optimized performance per READ */ +	u32			max_sgl_rd;  };  enum ib_mtu { @@ -1471,6 +1473,7 @@ struct ib_ucontext {  	 * Implementation details of the RDMA core, don't use in drivers:  	 */  	struct rdma_restrack_entry res; +	struct xarray mmap_xa;  };  struct ib_uobject { @@ -2120,7 +2123,7 @@ struct ib_flow_action {  	atomic_t			usecnt;  }; -struct ib_mad_hdr; +struct ib_mad;  struct ib_grh;  enum ib_process_mad_flags { @@ -2218,6 +2221,11 @@ struct rdma_netdev_alloc_params {  				      struct net_device *netdev, void *param);  }; +struct ib_odp_counters { +	atomic64_t faults; +	atomic64_t invalidations; +}; +  struct ib_counters {  	struct ib_device	*device;  	struct ib_uobject	*uobject; @@ -2251,6 +2259,21 @@ struct iw_cm_conn_param;  #define DECLARE_RDMA_OBJ_SIZE(ib_struct) size_t size_##ib_struct +struct rdma_user_mmap_entry { +	struct kref ref; +	struct ib_ucontext *ucontext; +	unsigned long start_pgoff; +	size_t npages; +	bool driver_removed; +}; + +/* Return the offset (in bytes) the user should pass to libc's mmap() */ +static inline u64 +rdma_user_mmap_get_offset(const struct rdma_user_mmap_entry *entry) +{ +	return (u64)entry->start_pgoff << PAGE_SHIFT; +} +  /**   * struct ib_device_ops - InfiniBand device operations   * This structure defines all the InfiniBand device operations, providers will @@ -2278,9 +2301,8 @@ struct ib_device_ops {  	int (*process_mad)(struct ib_device *device, int process_mad_flags,  			   u8 port_num, const struct ib_wc *in_wc,  			   const struct ib_grh *in_grh, -			   const struct ib_mad_hdr *in_mad, size_t in_mad_size, -			   struct ib_mad_hdr *out_mad, size_t *out_mad_size, -			   u16 *out_mad_pkey_index); +			   const struct ib_mad *in_mad, struct ib_mad *out_mad, +			   size_t *out_mad_size, u16 *out_mad_pkey_index);  	int (*query_device)(struct ib_device *device,  			    struct ib_device_attr *device_attr,  			    struct ib_udata *udata); @@ -2363,6 +2385,13 @@ struct ib_device_ops {  			      struct ib_udata *udata);  	void (*dealloc_ucontext)(struct ib_ucontext *context);  	int (*mmap)(struct ib_ucontext *context, struct vm_area_struct *vma); +	/** +	 * This will be called once refcount of an entry in mmap_xa reaches +	 * zero. The type of the memory that was mapped may differ between +	 * entries and is opaque to the rdma_user_mmap interface. +	 * Therefore needs to be implemented by the driver in mmap_free. +	 */ +	void (*mmap_free)(struct rdma_user_mmap_entry *entry);  	void (*disassociate_ucontext)(struct ib_ucontext *ibcontext);  	int (*alloc_pd)(struct ib_pd *pd, struct ib_udata *udata);  	void (*dealloc_pd)(struct ib_pd *pd, struct ib_udata *udata); @@ -2422,8 +2451,6 @@ struct ib_device_ops {  			    u64 iova);  	int (*unmap_fmr)(struct list_head *fmr_list);  	int (*dealloc_fmr)(struct ib_fmr *fmr); -	void (*invalidate_range)(struct ib_umem_odp *umem_odp, -				 unsigned long start, unsigned long end);  	int (*attach_mcast)(struct ib_qp *qp, union ib_gid *gid, u16 lid);  	int (*detach_mcast)(struct ib_qp *qp, union ib_gid *gid, u16 lid);  	struct ib_xrcd *(*alloc_xrcd)(struct ib_device *device, @@ -2448,6 +2475,9 @@ struct ib_device_ops {  			     struct ifla_vf_info *ivf);  	int (*get_vf_stats)(struct ib_device *device, int vf, u8 port,  			    struct ifla_vf_stats *stats); +	int (*get_vf_guid)(struct ib_device *device, int vf, u8 port, +			    struct ifla_vf_guid *node_guid, +			    struct ifla_vf_guid *port_guid);  	int (*set_vf_guid)(struct ib_device *device, int vf, u8 port, u64 guid,  			   int type);  	struct ib_wq *(*create_wq)(struct ib_pd *pd, @@ -2563,6 +2593,13 @@ struct ib_device_ops {  	 */  	int (*counter_update_stats)(struct rdma_counter *counter); +	/** +	 * Allows rdma drivers to add their own restrack attributes +	 * dumped via 'rdma stat' iproute2 command. +	 */ +	int (*fill_stat_entry)(struct sk_buff *msg, +			       struct rdma_restrack_entry *entry); +  	DECLARE_RDMA_OBJ_SIZE(ib_ah);  	DECLARE_RDMA_OBJ_SIZE(ib_cq);  	DECLARE_RDMA_OBJ_SIZE(ib_pd); @@ -2789,18 +2826,21 @@ void  ib_set_client_data(struct ib_device *device, struct ib_client *client,  void ib_set_device_ops(struct ib_device *device,  		       const struct ib_device_ops *ops); -#if IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS)  int rdma_user_mmap_io(struct ib_ucontext *ucontext, struct vm_area_struct *vma, -		      unsigned long pfn, unsigned long size, pgprot_t prot); -#else -static inline int rdma_user_mmap_io(struct ib_ucontext *ucontext, -				    struct vm_area_struct *vma, -				    unsigned long pfn, unsigned long size, -				    pgprot_t prot) -{ -	return -EINVAL; -} -#endif +		      unsigned long pfn, unsigned long size, pgprot_t prot, +		      struct rdma_user_mmap_entry *entry); +int rdma_user_mmap_entry_insert(struct ib_ucontext *ucontext, +				struct rdma_user_mmap_entry *entry, +				size_t length); +struct rdma_user_mmap_entry * +rdma_user_mmap_entry_get_pgoff(struct ib_ucontext *ucontext, +			       unsigned long pgoff); +struct rdma_user_mmap_entry * +rdma_user_mmap_entry_get(struct ib_ucontext *ucontext, +			 struct vm_area_struct *vma); +void rdma_user_mmap_entry_put(struct rdma_user_mmap_entry *entry); + +void rdma_user_mmap_entry_remove(struct rdma_user_mmap_entry *entry);  static inline int ib_copy_from_udata(void *dest, struct ib_udata *udata, size_t len)  { @@ -3303,6 +3343,9 @@ int ib_get_vf_config(struct ib_device *device, int vf, u8 port,  		     struct ifla_vf_info *info);  int ib_get_vf_stats(struct ib_device *device, int vf, u8 port,  		    struct ifla_vf_stats *stats); +int ib_get_vf_guid(struct ib_device *device, int vf, u8 port, +		    struct ifla_vf_guid *node_guid, +		    struct ifla_vf_guid *port_guid);  int ib_set_vf_guid(struct ib_device *device, int vf, u8 port, u64 guid,  		   int type); @@ -4043,9 +4086,7 @@ static inline void ib_dma_unmap_sg_attrs(struct ib_device *dev,   */  static inline unsigned int ib_dma_max_seg_size(struct ib_device *dev)  { -	struct device_dma_parameters *p = dev->dma_device->dma_parms; - -	return p ? p->max_segment_size : UINT_MAX; +	return dma_get_max_seg_size(dev->dma_device);  }  /** diff --git a/include/rdma/restrack.h b/include/rdma/restrack.h index 83df1ec6664e..7682d1bcf789 100644 --- a/include/rdma/restrack.h +++ b/include/rdma/restrack.h @@ -156,6 +156,11 @@ int rdma_nl_put_driver_u32_hex(struct sk_buff *msg, const char *name,  int rdma_nl_put_driver_u64(struct sk_buff *msg, const char *name, u64 value);  int rdma_nl_put_driver_u64_hex(struct sk_buff *msg, const char *name,  			       u64 value); +int rdma_nl_put_driver_string(struct sk_buff *msg, const char *name, +			      const char *str); +int rdma_nl_stat_hwcounter_entry(struct sk_buff *msg, const char *name, +				 u64 value); +  struct rdma_restrack_entry *rdma_restrack_get_byid(struct ib_device *dev,  						   enum rdma_restrack_type type,  						   u32 id); | 

