blob: ec6446864b08e9847b35c5e68b6ac46018b52e26 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Copyright (c) 2004 Mellanox Technologies Ltd. All rights reserved.
3 * Copyright (c) 2004 Infinicon Corporation. All rights reserved.
4 * Copyright (c) 2004 Intel Corporation. All rights reserved.
5 * Copyright (c) 2004 Topspin Corporation. All rights reserved.
6 * Copyright (c) 2004 Voltaire Corporation. All rights reserved.
Roland Dreier2a1d9b72005-08-10 23:03:10 -07007 * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
Roland Dreierf7c6a7b2007-03-04 16:15:11 -08008 * Copyright (c) 2005, 2006, 2007 Cisco Systems. All rights reserved.
Linus Torvalds1da177e2005-04-16 15:20:36 -07009 *
10 * This software is available to you under a choice of one of two
11 * licenses. You may choose to be licensed under the terms of the GNU
12 * General Public License (GPL) Version 2, available from the file
13 * COPYING in the main directory of this source tree, or the
14 * OpenIB.org BSD license below:
15 *
16 * Redistribution and use in source and binary forms, with or
17 * without modification, are permitted provided that the following
18 * conditions are met:
19 *
20 * - Redistributions of source code must retain the above
21 * copyright notice, this list of conditions and the following
22 * disclaimer.
23 *
24 * - Redistributions in binary form must reproduce the above
25 * copyright notice, this list of conditions and the following
26 * disclaimer in the documentation and/or other materials
27 * provided with the distribution.
28 *
29 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
30 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
31 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
32 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
33 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
34 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
35 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
36 * SOFTWARE.
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 */
38
39#if !defined(IB_VERBS_H)
40#define IB_VERBS_H
41
#include <linux/types.h>
#include <linux/device.h>
#include <linux/dma-mapping.h>
#include <linux/kref.h>
#include <linux/list.h>
#include <linux/rwsem.h>
#include <linux/workqueue.h>
#include <linux/irq_poll.h>
#include <uapi/linux/if_ether.h>
#include <net/ipv6.h>
#include <net/ip.h>
#include <linux/string.h>
#include <linux/slab.h>
#include <linux/overflow.h>
#include <linux/netdevice.h>
#include <linux/refcount.h>
#include <linux/if_link.h>
#include <linux/atomic.h>
#include <linux/mmu_notifier.h>
#include <linux/uaccess.h>
#include <linux/cgroup_rdma.h>
#include <linux/irqflags.h>
#include <linux/preempt.h>
#include <uapi/rdma/ib_user_verbs.h>
#include <rdma/restrack.h>
#include <uapi/rdma/rdma_user_ioctl.h>
#include <uapi/rdma/ib_user_ioctl_verbs.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Leon Romanovsky9abb0d12017-06-27 16:49:53 +030069#define IB_FW_VERSION_NAME_MAX ETHTOOL_FWVERS_LEN
70
Jason Gunthorpeb5231b02018-09-16 20:48:04 +030071struct ib_umem_odp;
72
Tejun Heof0626712010-10-19 15:24:36 +000073extern struct workqueue_struct *ib_wq;
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -080074extern struct workqueue_struct *ib_comp_wq;
Jack Morgensteinf7948092018-08-27 08:35:55 +030075extern struct workqueue_struct *ib_comp_unbound_wq;
Tejun Heof0626712010-10-19 15:24:36 +000076
/*
 * Logging helpers that take the ib_device a message relates to.
 * ibdev_printk() is passed the log level string explicitly; the
 * level-named variants below take only the device and a printf-style
 * format.  All of them are declared __cold, and __printf() lets the
 * compiler check the format string against the variadic arguments.
 * Only the prototypes live in this header.
 */
__printf(3, 4) __cold
void ibdev_printk(const char *level, const struct ib_device *ibdev,
		  const char *format, ...);
__printf(2, 3) __cold
void ibdev_emerg(const struct ib_device *ibdev, const char *format, ...);
__printf(2, 3) __cold
void ibdev_alert(const struct ib_device *ibdev, const char *format, ...);
__printf(2, 3) __cold
void ibdev_crit(const struct ib_device *ibdev, const char *format, ...);
__printf(2, 3) __cold
void ibdev_err(const struct ib_device *ibdev, const char *format, ...);
__printf(2, 3) __cold
void ibdev_warn(const struct ib_device *ibdev, const char *format, ...);
__printf(2, 3) __cold
void ibdev_notice(const struct ib_device *ibdev, const char *format, ...);
__printf(2, 3) __cold
void ibdev_info(const struct ib_device *ibdev, const char *format, ...);
94
/*
 * ibdev_dbg() - debug-level message for an ib_device.
 *
 * With CONFIG_DYNAMIC_DEBUG it forwards to dynamic_ibdev_dbg().  Otherwise,
 * when DEBUG is defined, it expands to ibdev_printk() at KERN_DEBUG.  In
 * every other build it is an empty inline function, which still lets the
 * compiler check the format string against its arguments via __printf().
 */
#if defined(CONFIG_DYNAMIC_DEBUG)
#define ibdev_dbg(__dev, format, args...)                       \
	dynamic_ibdev_dbg(__dev, format, ##args)
#elif defined(DEBUG)
#define ibdev_dbg(__dev, format, args...)                       \
	ibdev_printk(KERN_DEBUG, __dev, format, ##args)
#else
__printf(2, 3) __cold
static inline
void ibdev_dbg(const struct ib_device *ibdev, const char *format, ...) {}
#endif
106
/*
 * 16-byte GID, accessible either as raw bytes or as two big-endian
 * 64-bit halves: the subnet prefix followed by the interface ID.
 */
union ib_gid {
	u8	raw[16];
	struct {
		__be64	subnet_prefix;
		__be64	interface_id;
	} global;
};
114
Moni Shouae26be1b2015-07-30 18:33:29 +0300115extern union ib_gid zgid;
116
/*
 * GID types.  IB_GID_TYPE_IB and IB_GID_TYPE_ROCE share the value 0, so
 * IB_GID_TYPE_SIZE (one past the last assigned value) evaluates to 2.
 */
enum ib_gid_type {
	/* If link layer is Ethernet, this is RoCE V1 */
	IB_GID_TYPE_IB        = 0,
	IB_GID_TYPE_ROCE      = 0,
	IB_GID_TYPE_ROCE_UDP_ENCAP = 1,
	IB_GID_TYPE_SIZE
};
124
Moni Shoua7ead4bc2016-01-14 17:50:38 +0200125#define ROCE_V2_UDP_DPORT 4791
/*
 * Attributes kept alongside a GID: the GID itself and its type, plus the
 * device, port number and index it is associated with.
 */
struct ib_gid_attr {
	/* __rcu annotated: access must follow the RCU pointer rules */
	struct net_device __rcu	*ndev;
	struct ib_device	*device;
	union ib_gid		gid;
	enum ib_gid_type	gid_type;
	u16			index;
	u8			port_num;
};
134
/*
 * RDMA node types.  Numbering starts at 1; the entries after the three
 * IB ones simply continue the sequence.
 */
enum rdma_node_type {
	/* IB values map to NodeInfo:NodeType. */
	RDMA_NODE_IB_CA 	= 1,
	RDMA_NODE_IB_SWITCH,
	RDMA_NODE_IB_ROUTER,
	RDMA_NODE_RNIC,
	RDMA_NODE_USNIC,
	RDMA_NODE_USNIC_UDP,
	RDMA_NODE_UNSPECIFIED,
};
145
/* Well-known SA GUID constant: bit 57 set, OR-ed with the value 2. */
enum {
	/* set the local administered indication */
	IB_SA_WELL_KNOWN_GUID	= BIT_ULL(57) | 2,
};
150
/* RDMA transport types, numbered from 0 in declaration order. */
enum rdma_transport_type {
	RDMA_TRANSPORT_IB,
	RDMA_TRANSPORT_IWARP,
	RDMA_TRANSPORT_USNIC,
	RDMA_TRANSPORT_USNIC_UDP,
	RDMA_TRANSPORT_UNSPECIFIED,
};
158
/* RDMA protocol types, numbered from 0 in declaration order. */
enum rdma_protocol_type {
	RDMA_PROTOCOL_IB,
	RDMA_PROTOCOL_IBOE,
	RDMA_PROTOCOL_IWARP,
	RDMA_PROTOCOL_USNIC_UDP
};
165
Roland Dreier8385fd82014-06-04 10:00:16 -0700166__attribute_const__ enum rdma_transport_type
167rdma_node_get_transport(enum rdma_node_type node_type);
Tom Tucker07ebafb2006-08-03 16:02:42 -0500168
/*
 * Network types.  RDMA_NETWORK_ROCE_V1 is an alias for RDMA_NETWORK_IB
 * (both are 0), so the IPv4 and IPv6 entries take the values 1 and 2.
 */
enum rdma_network_type {
	RDMA_NETWORK_IB,
	RDMA_NETWORK_ROCE_V1 = RDMA_NETWORK_IB,
	RDMA_NETWORK_IPV4,
	RDMA_NETWORK_IPV6
};
175
176static inline enum ib_gid_type ib_network_to_gid_type(enum rdma_network_type network_type)
177{
178 if (network_type == RDMA_NETWORK_IPV4 ||
179 network_type == RDMA_NETWORK_IPV6)
180 return IB_GID_TYPE_ROCE_UDP_ENCAP;
181
182 /* IB_GID_TYPE_IB same as RDMA_NETWORK_ROCE_V1 */
183 return IB_GID_TYPE_IB;
184}
185
Parav Pandit47ec3862018-06-13 10:22:06 +0300186static inline enum rdma_network_type
187rdma_gid_attr_network_type(const struct ib_gid_attr *attr)
Somnath Koturc865f242015-12-23 14:56:51 +0200188{
Parav Pandit47ec3862018-06-13 10:22:06 +0300189 if (attr->gid_type == IB_GID_TYPE_IB)
Somnath Koturc865f242015-12-23 14:56:51 +0200190 return RDMA_NETWORK_IB;
191
Parav Pandit47ec3862018-06-13 10:22:06 +0300192 if (ipv6_addr_v4mapped((struct in6_addr *)&attr->gid))
Somnath Koturc865f242015-12-23 14:56:51 +0200193 return RDMA_NETWORK_IPV4;
194 else
195 return RDMA_NETWORK_IPV6;
196}
197
/* Link layer of a port; IB_LINK_LAYER_UNSPECIFIED is the zero value. */
enum rdma_link_layer {
	IB_LINK_LAYER_UNSPECIFIED,
	IB_LINK_LAYER_INFINIBAND,
	IB_LINK_LAYER_ETHERNET,
};
203
/*
 * Device capability bits.  Bits 9, 16 and 28 are not assigned here (9 and
 * 16 are retired, see the notes below).  Bits 31 and above are written
 * with 1ULL because they do not fit in a signed int shift.
 * NOTE(review): presumably these are the bits carried in
 * ib_device_attr.device_cap_flags - confirm.
 */
enum ib_device_cap_flags {
	IB_DEVICE_RESIZE_MAX_WR			= (1 << 0),
	IB_DEVICE_BAD_PKEY_CNTR			= (1 << 1),
	IB_DEVICE_BAD_QKEY_CNTR			= (1 << 2),
	IB_DEVICE_RAW_MULTI			= (1 << 3),
	IB_DEVICE_AUTO_PATH_MIG			= (1 << 4),
	IB_DEVICE_CHANGE_PHY_PORT		= (1 << 5),
	IB_DEVICE_UD_AV_PORT_ENFORCE		= (1 << 6),
	IB_DEVICE_CURR_QP_STATE_MOD		= (1 << 7),
	IB_DEVICE_SHUTDOWN_PORT			= (1 << 8),
	/* Not in use, former INIT_TYPE		= (1 << 9),*/
	IB_DEVICE_PORT_ACTIVE_EVENT		= (1 << 10),
	IB_DEVICE_SYS_IMAGE_GUID		= (1 << 11),
	IB_DEVICE_RC_RNR_NAK_GEN		= (1 << 12),
	IB_DEVICE_SRQ_RESIZE			= (1 << 13),
	IB_DEVICE_N_NOTIFY_CQ			= (1 << 14),

	/*
	 * This device supports a per-device lkey or stag that can be
	 * used without performing a memory registration for the local
	 * memory.  Note that ULPs should never check this flag, but
	 * instead use the local_dma_lkey flag in the ib_pd structure,
	 * which will always contain a usable lkey.
	 */
	IB_DEVICE_LOCAL_DMA_LKEY		= (1 << 15),
	/* Reserved, old SEND_W_INV		= (1 << 16),*/
	IB_DEVICE_MEM_WINDOW			= (1 << 17),
	/*
	 * Devices should set IB_DEVICE_UD_IP_CSUM if they support
	 * insertion of UDP and TCP checksum on outgoing UD IPoIB
	 * messages and can verify the validity of checksum for
	 * incoming messages.  Setting this flag implies that the
	 * IPoIB driver may set NETIF_F_IP_CSUM for datagram mode.
	 */
	IB_DEVICE_UD_IP_CSUM			= (1 << 18),
	IB_DEVICE_UD_TSO			= (1 << 19),
	IB_DEVICE_XRC				= (1 << 20),

	/*
	 * This device supports the IB "base memory management extension",
	 * which includes support for fast registrations (IB_WR_REG_MR,
	 * IB_WR_LOCAL_INV and IB_WR_SEND_WITH_INV verbs).  This flag should
	 * also be set by any iWarp device which must support FRs to comply
	 * with the iWarp verbs spec.  iWarp devices also support the
	 * IB_WR_RDMA_READ_WITH_INV verb for RDMA READs that invalidate the
	 * stag.
	 */
	IB_DEVICE_MEM_MGT_EXTENSIONS		= (1 << 21),
	IB_DEVICE_BLOCK_MULTICAST_LOOPBACK	= (1 << 22),
	IB_DEVICE_MEM_WINDOW_TYPE_2A		= (1 << 23),
	IB_DEVICE_MEM_WINDOW_TYPE_2B		= (1 << 24),
	IB_DEVICE_RC_IP_CSUM			= (1 << 25),
	/* Deprecated. Please use IB_RAW_PACKET_CAP_IP_CSUM. */
	IB_DEVICE_RAW_IP_CSUM			= (1 << 26),
	/*
	 * Devices should set IB_DEVICE_CROSS_CHANNEL if they
	 * support execution of WQEs that involve synchronization
	 * of I/O operations with single completion queue managed
	 * by hardware.
	 */
	IB_DEVICE_CROSS_CHANNEL			= (1 << 27),
	/* bit 28 is not assigned in this enum */
	IB_DEVICE_MANAGED_FLOW_STEERING		= (1 << 29),
	IB_DEVICE_SIGNATURE_HANDOVER		= (1 << 30),
	IB_DEVICE_ON_DEMAND_PAGING		= (1ULL << 31),
	IB_DEVICE_SG_GAPS_REG			= (1ULL << 32),
	IB_DEVICE_VIRTUAL_FUNCTION		= (1ULL << 33),
	/* Deprecated. Please use IB_RAW_PACKET_CAP_SCATTER_FCS. */
	IB_DEVICE_RAW_SCATTER_FCS		= (1ULL << 34),
	IB_DEVICE_RDMA_NETDEV_OPA_VNIC		= (1ULL << 35),
	/* The device supports padding incoming writes to cacheline. */
	IB_DEVICE_PCI_WRITE_END_PADDING		= (1ULL << 36),
	IB_DEVICE_ALLOW_USER_UNREG		= (1ULL << 37),
};
277
/* Signature protection capability bits, one bit per T10-DIF type. */
enum ib_signature_prot_cap {
	IB_PROT_T10DIF_TYPE_1 = 1,
	IB_PROT_T10DIF_TYPE_2 = 1 << 1,
	IB_PROT_T10DIF_TYPE_3 = 1 << 2,
};
283
/* Signature guard capability bits (T10-DIF CRC and checksum). */
enum ib_signature_guard_cap {
	IB_GUARD_T10DIF_CRC	= 1,
	IB_GUARD_T10DIF_CSUM	= 1 << 1,
};
288
/* Atomic capability values; IB_ATOMIC_NONE is the zero value. */
enum ib_atomic_cap {
	IB_ATOMIC_NONE,
	IB_ATOMIC_HCA,
	IB_ATOMIC_GLOB
};
294
/*
 * General ODP capability bits.
 * NOTE(review): presumably stored in ib_odp_caps.general_caps - confirm.
 */
enum ib_odp_general_cap_bits {
	IB_ODP_SUPPORT		= 1 << 0,
	IB_ODP_SUPPORT_IMPLICIT = 1 << 1,
};
299
/*
 * Per-transport ODP capability bits, one bit per operation.
 * NOTE(review): presumably used in the ib_odp_caps.per_transport_caps
 * words - confirm.
 */
enum ib_odp_transport_cap_bits {
	IB_ODP_SUPPORT_SEND	= 1 << 0,
	IB_ODP_SUPPORT_RECV	= 1 << 1,
	IB_ODP_SUPPORT_WRITE	= 1 << 2,
	IB_ODP_SUPPORT_READ	= 1 << 3,
	IB_ODP_SUPPORT_ATOMIC	= 1 << 4,
	IB_ODP_SUPPORT_SRQ_RECV	= 1 << 5,
};
308
/*
 * ODP capabilities: one 64-bit general word plus one 32-bit word for each
 * of the RC, UC, UD and XRC transports.
 */
struct ib_odp_caps {
	uint64_t general_caps;
	struct {
		uint32_t  rc_odp_caps;
		uint32_t  uc_odp_caps;
		uint32_t  ud_odp_caps;
		uint32_t  xrc_odp_caps;
	} per_transport_caps;
};
318
/* RSS capabilities: supported QP types and indirection table limits. */
struct ib_rss_caps {
	/* Corresponding bit will be set if qp type from
	 * 'enum ib_qp_type' is supported, e.g.
	 * supported_qpts |= 1 << IB_QPT_UD
	 */
	u32 supported_qpts;
	u32 max_rwq_indirection_tables;
	u32 max_rwq_indirection_table_size;
};
328
/* Tag matching capability flags; stored in ib_tm_caps.flags. */
enum ib_tm_cap_flags {
	/*  Support tag matching on RC transport */
	IB_TM_CAP_RC		    = 1 << 0,
};
333
/* Tag matching capabilities and limits. */
struct ib_tm_caps {
	/* Max size of RNDV header */
	u32 max_rndv_hdr_size;
	/* Max number of entries in tag matching list */
	u32 max_num_tags;
	/* From enum ib_tm_cap_flags */
	u32 flags;
	/* Max number of outstanding list operations */
	u32 max_ops;
	/* Max number of SGE in tag matching entry */
	u32 max_sge;
};
346
/* CQ initialisation attributes. */
struct ib_cq_init_attr {
	unsigned int	cqe;
	int		comp_vector;
	u32		flags;
};
352
/* CQ attribute mask bits; only the moderation bit is defined. */
enum ib_cq_attr_mask {
	IB_CQ_MODERATE = 1 << 0,
};
356
/* CQ moderation limits (16-bit count and period maxima). */
struct ib_cq_caps {
	u16     max_cq_moderation_count;
	u16     max_cq_moderation_period;
};
361
/* Attributes for a DM memory region: length, offset and access flags. */
struct ib_dm_mr_attr {
	u64		length;
	u64		offset;
	u32		access_flags;
};
367
/* Attributes for a DM allocation: length, alignment and flags. */
struct ib_dm_alloc_attr {
	u64	length;
	u32	alignment;
	u32	flags;
};
373
/*
 * Device attributes: identification (firmware/hardware versions, vendor
 * IDs, system image GUID), the capability flag word, the per-resource
 * maxima, and the nested ODP, RSS, tag matching and CQ capability
 * structures defined earlier in this header.
 */
struct ib_device_attr {
	u64			fw_ver;
	__be64			sys_image_guid;
	u64			max_mr_size;
	u64			page_size_cap;
	u32			vendor_id;
	u32			vendor_part_id;
	u32			hw_ver;
	int			max_qp;
	int			max_qp_wr;
	/* 64 bits wide: enum ib_device_cap_flags defines bits above 31 */
	u64			device_cap_flags;
	int			max_send_sge;
	int			max_recv_sge;
	int			max_sge_rd;
	int			max_cq;
	int			max_cqe;
	int			max_mr;
	int			max_pd;
	int			max_qp_rd_atom;
	int			max_ee_rd_atom;
	int			max_res_rd_atom;
	int			max_qp_init_rd_atom;
	int			max_ee_init_rd_atom;
	enum ib_atomic_cap	atomic_cap;
	enum ib_atomic_cap	masked_atomic_cap;
	int			max_ee;
	int			max_rdd;
	int			max_mw;
	int			max_raw_ipv6_qp;
	int			max_raw_ethy_qp;
	int			max_mcast_grp;
	int			max_mcast_qp_attach;
	int			max_total_mcast_qp_attach;
	int			max_ah;
	int			max_fmr;
	int			max_map_per_fmr;
	int			max_srq;
	int			max_srq_wr;
	int			max_srq_sge;
	unsigned int		max_fast_reg_page_list_len;
	u16			max_pkeys;
	u8			local_ca_ack_delay;
	int			sig_prot_cap;
	int			sig_guard_cap;
	struct ib_odp_caps	odp_caps;
	uint64_t		timestamp_mask;
	uint64_t		hca_core_clock; /* in KHZ */
	struct ib_rss_caps	rss_caps;
	u32			max_wq_type_rq;
	u32			raw_packet_caps; /* Use ib_raw_packet_caps enum */
	struct ib_tm_caps	tm_caps;
	struct ib_cq_caps       cq_caps;
	u64			max_dm_size;
};
428
/* Encoded MTU values; consecutive codes, each doubling the byte size. */
enum ib_mtu {
	IB_MTU_256  = 1,
	IB_MTU_512  = 2,
	IB_MTU_1024 = 3,
	IB_MTU_2048 = 4,
	IB_MTU_4096 = 5
};

/*
 * Translate an ib_mtu code into its size in bytes.  Returns -1 for any
 * value that is not one of the defined codes.
 */
static inline int ib_mtu_enum_to_int(enum ib_mtu mtu)
{
	if (mtu < IB_MTU_256 || mtu > IB_MTU_4096)
		return -1;

	/* Codes are consecutive, so the size is 256 doubled per step. */
	return 256 << (mtu - IB_MTU_256);
}

/*
 * Pick the largest ib_mtu code whose size does not exceed @mtu bytes.
 * Anything below 512 (including values under 256) yields IB_MTU_256 and
 * anything from 4096 upwards yields IB_MTU_4096.
 */
static inline enum ib_mtu ib_mtu_int_to_enum(int mtu)
{
	if (mtu < 512)
		return IB_MTU_256;
	if (mtu < 1024)
		return IB_MTU_512;
	if (mtu < 2048)
		return IB_MTU_1024;
	if (mtu < 4096)
		return IB_MTU_2048;

	return IB_MTU_4096;
}
462
/* Port states, explicitly numbered 0 through 5. */
enum ib_port_state {
	IB_PORT_NOP		= 0,
	IB_PORT_DOWN		= 1,
	IB_PORT_INIT		= 2,
	IB_PORT_ARMED		= 3,
	IB_PORT_ACTIVE		= 4,
	IB_PORT_ACTIVE_DEFER	= 5
};
471
/*
 * Port width codes.  Each code is a distinct single bit; note that the
 * 2X code (16) is numerically larger than the 4X, 8X and 12X codes.
 */
enum ib_port_width {
	IB_WIDTH_1X	= 1,
	IB_WIDTH_2X	= 16,
	IB_WIDTH_4X	= 2,
	IB_WIDTH_8X	= 4,
	IB_WIDTH_12X	= 8
};

/*
 * Translate a width code into the multiplier in its name (1, 2, 4, 8 or
 * 12).  Returns -1 for any value that is not one of the defined codes.
 */
static inline int ib_width_enum_to_int(enum ib_port_width width)
{
	int lanes = -1;

	switch (width) {
	case IB_WIDTH_1X:
		lanes = 1;
		break;
	case IB_WIDTH_2X:
		lanes = 2;
		break;
	case IB_WIDTH_4X:
		lanes = 4;
		break;
	case IB_WIDTH_8X:
		lanes = 8;
		break;
	case IB_WIDTH_12X:
		lanes = 12;
		break;
	default:
		break;
	}

	return lanes;
}
491
/* Port speed codes; each code is a distinct single bit (1 through 64). */
enum ib_port_speed {
	IB_SPEED_SDR	= 1,
	IB_SPEED_DDR	= 2,
	IB_SPEED_QDR	= 4,
	IB_SPEED_FDR10	= 8,
	IB_SPEED_FDR	= 16,
	IB_SPEED_EDR	= 32,
	IB_SPEED_HDR	= 64
};
501
/**
 * struct rdma_hw_stats
 * @lock - Mutex to protect parallel write access to lifespan and values
 *    of counters, which are 64bits and not guaranteed to be written
 *    atomically on 32bits systems.
 * @timestamp - Used by the core code to track when the last update was
 * @lifespan - Used by the core code to determine how old the counters
 *   should be before being updated again.  Stored in jiffies, defaults
 *   to 10 milliseconds, drivers can override the default by specifying
 *   their own value during their allocation routine.
 * @names - Array of pointers to static names used for the counters in
 *   directory.
 * @num_counters - How many hardware counters there are.  If names is
 *   shorter than this number, a kernel oops will result.  Driver authors
 *   are encouraged to leave BUILD_BUG_ON(ARRAY_SIZE(@names) < num_counters)
 *   in their code to prevent this.
 * @value - Array of u64 counters that are accessed by the sysfs code and
 *   filled in by the drivers get_stats routine
 */
struct rdma_hw_stats {
	struct mutex	lock; /* Protect lifespan and value[] */
	unsigned long	timestamp;
	unsigned long	lifespan;
	const char * const *names;
	int		num_counters;
	u64		value[];
};
529
Christoph Lameterb40f4752016-05-16 12:49:33 -0500530#define RDMA_HW_STATS_DEFAULT_LIFESPAN 10
531/**
532 * rdma_alloc_hw_stats_struct - Helper function to allocate dynamic struct
533 * for drivers.
534 * @names - Array of static const char *
535 * @num_counters - How many elements in array
536 * @lifespan - How many milliseconds between updates
537 */
538static inline struct rdma_hw_stats *rdma_alloc_hw_stats_struct(
539 const char * const *names, int num_counters,
540 unsigned long lifespan)
541{
542 struct rdma_hw_stats *stats;
Steve Wise7f624d02008-07-14 23:48:48 -0700543
Christoph Lameterb40f4752016-05-16 12:49:33 -0500544 stats = kzalloc(sizeof(*stats) + num_counters * sizeof(u64),
545 GFP_KERNEL);
546 if (!stats)
547 return NULL;
548 stats->names = names;
549 stats->num_counters = num_counters;
550 stats->lifespan = msecs_to_jiffies(lifespan);
Steve Wise7f624d02008-07-14 23:48:48 -0700551
Christoph Lameterb40f4752016-05-16 12:49:33 -0500552 return stats;
553}
554
Steve Wise7f624d02008-07-14 23:48:48 -0700555
/* Define bits for the various functionality this port needs to be supported by
 * the core.
 */
/* Management                           0x00000FFF */
#define RDMA_CORE_CAP_IB_MAD            0x00000001
#define RDMA_CORE_CAP_IB_SMI            0x00000002
#define RDMA_CORE_CAP_IB_CM             0x00000004
#define RDMA_CORE_CAP_IW_CM             0x00000008
#define RDMA_CORE_CAP_IB_SA             0x00000010
#define RDMA_CORE_CAP_OPA_MAD           0x00000020

/* Address format                       0x000FF000 */
#define RDMA_CORE_CAP_AF_IB             0x00001000
#define RDMA_CORE_CAP_ETH_AH            0x00002000
#define RDMA_CORE_CAP_OPA_AH            0x00004000
#define RDMA_CORE_CAP_IB_GRH_REQUIRED   0x00008000

/* Protocol                             0xFFF00000 */
#define RDMA_CORE_CAP_PROT_IB           0x00100000
#define RDMA_CORE_CAP_PROT_ROCE         0x00200000
#define RDMA_CORE_CAP_PROT_IWARP        0x00400000
#define RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP 0x00800000
#define RDMA_CORE_CAP_PROT_RAW_PACKET   0x01000000
#define RDMA_CORE_CAP_PROT_USNIC        0x02000000

/* Mask: the GRH-required bit together with both RoCE protocol bits. */
#define RDMA_CORE_PORT_IB_GRH_REQUIRED (RDMA_CORE_CAP_IB_GRH_REQUIRED \
					| RDMA_CORE_CAP_PROT_ROCE     \
					| RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP)

/* Composite per-port capability sets, OR-ed together from the bits above. */
#define RDMA_CORE_PORT_IBA_IB          (RDMA_CORE_CAP_PROT_IB  \
					| RDMA_CORE_CAP_IB_MAD \
					| RDMA_CORE_CAP_IB_SMI \
					| RDMA_CORE_CAP_IB_CM  \
					| RDMA_CORE_CAP_IB_SA  \
					| RDMA_CORE_CAP_AF_IB)
#define RDMA_CORE_PORT_IBA_ROCE        (RDMA_CORE_CAP_PROT_ROCE \
					| RDMA_CORE_CAP_IB_MAD  \
					| RDMA_CORE_CAP_IB_CM   \
					| RDMA_CORE_CAP_AF_IB   \
					| RDMA_CORE_CAP_ETH_AH)
#define RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP			\
					(RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP \
					| RDMA_CORE_CAP_IB_MAD  \
					| RDMA_CORE_CAP_IB_CM   \
					| RDMA_CORE_CAP_AF_IB   \
					| RDMA_CORE_CAP_ETH_AH)
#define RDMA_CORE_PORT_IWARP           (RDMA_CORE_CAP_PROT_IWARP \
					| RDMA_CORE_CAP_IW_CM)
/* The OPA set is the full IB set plus the OPA MAD bit. */
#define RDMA_CORE_PORT_INTEL_OPA       (RDMA_CORE_PORT_IBA_IB  \
					| RDMA_CORE_CAP_OPA_MAD)

#define RDMA_CORE_PORT_RAW_PACKET	(RDMA_CORE_CAP_PROT_RAW_PACKET)

#define RDMA_CORE_PORT_USNIC		(RDMA_CORE_CAP_PROT_USNIC)
610
/*
 * Port attributes: state, MTUs, table lengths, LIDs, counters and the
 * capability masks of a single port.
 */
struct ib_port_attr {
	u64			subnet_prefix;
	enum ib_port_state	state;
	enum ib_mtu		max_mtu;
	enum ib_mtu		active_mtu;
	int			gid_tbl_len;
	unsigned int		ip_gids:1;	/* single-bit flag */
	/* This is the value from PortInfo CapabilityMask, defined by IBA */
	u32			port_cap_flags;
	u32			max_msg_sz;
	u32			bad_pkey_cntr;
	u32			qkey_viol_cntr;
	u16			pkey_tbl_len;
	u32			sm_lid;
	u32			lid;
	u8			lmc;
	u8			max_vl_num;
	u8			sm_sl;
	u8			subnet_timeout;
	u8			init_type_reply;
	u8			active_width;
	u8			active_speed;
	u8                      phys_state;
	u16			port_cap_flags2;
};
636
/*
 * Mask bits for device modification.
 * NOTE(review): presumably they select which ib_device_modify fields to
 * apply - confirm against the caller.
 */
enum ib_device_modify_flags {
	IB_DEVICE_MODIFY_SYS_IMAGE_GUID	= 1 << 0,
	IB_DEVICE_MODIFY_NODE_DESC	= 1 << 1
};
641
Yuval Shaiabd99fde2016-08-25 10:57:07 -0700642#define IB_DEVICE_NODE_DESC_MAX 64
643
/*
 * New values for a device modification: the system image GUID and a node
 * description buffer of IB_DEVICE_NODE_DESC_MAX bytes.
 */
struct ib_device_modify {
	u64	sys_image_guid;
	char	node_desc[IB_DEVICE_NODE_DESC_MAX];
};
648
/*
 * Mask bits for port modification.  Bit 1 is not assigned: the values go
 * from 1 straight to (1<<2).
 */
enum ib_port_modify_flags {
	IB_PORT_SHUTDOWN		= 1,
	IB_PORT_INIT_TYPE		= (1<<2),
	IB_PORT_RESET_QKEY_CNTR		= (1<<3),
	IB_PORT_OPA_MASK_CHG		= (1<<4)
};
655
/*
 * Arguments for a port modification: capability mask bits to set, bits to
 * clear, and an init type value.
 */
struct ib_port_modify {
	u32	set_port_cap_mask;
	u32	clr_port_cap_mask;
	u8	init_type;
};
661
/*
 * Asynchronous event types, numbered from 0 in declaration order.  The
 * value is carried in ib_event.event.
 */
enum ib_event_type {
	IB_EVENT_CQ_ERR,
	IB_EVENT_QP_FATAL,
	IB_EVENT_QP_REQ_ERR,
	IB_EVENT_QP_ACCESS_ERR,
	IB_EVENT_COMM_EST,
	IB_EVENT_SQ_DRAINED,
	IB_EVENT_PATH_MIG,
	IB_EVENT_PATH_MIG_ERR,
	IB_EVENT_DEVICE_FATAL,
	IB_EVENT_PORT_ACTIVE,
	IB_EVENT_PORT_ERR,
	IB_EVENT_LID_CHANGE,
	IB_EVENT_PKEY_CHANGE,
	IB_EVENT_SM_CHANGE,
	IB_EVENT_SRQ_ERR,
	IB_EVENT_SRQ_LIMIT_REACHED,
	IB_EVENT_QP_LAST_WQE_REACHED,
	IB_EVENT_CLIENT_REREGISTER,
	IB_EVENT_GID_CHANGE,
	IB_EVENT_WQ_FATAL,
};
684
Bart Van Asschedb7489e2015-08-03 10:01:52 -0700685const char *__attribute_const__ ib_event_msg(enum ib_event_type event);
Sagi Grimberg2b1b5b62015-05-18 13:40:28 +0300686
/*
 * An asynchronous event: the originating device, the event type, and a
 * union naming the affected object (CQ, QP, SRQ, WQ or port number).
 * NOTE(review): which union member is valid presumably depends on
 * @event - confirm against the event producers.
 */
struct ib_event {
	struct ib_device	*device;
	union {
		struct ib_cq	*cq;
		struct ib_qp	*qp;
		struct ib_srq	*srq;
		struct ib_wq	*wq;
		u8		port_num;
	} element;
	enum ib_event_type	event;
};
698
/*
 * Event handler: a device, a callback that receives the handler itself
 * plus the event, and a list node.  INIT_IB_EVENT_HANDLER() fills in all
 * three members.
 */
struct ib_event_handler {
	struct ib_device *device;
	void            (*handler)(struct ib_event_handler *, struct ib_event *);
	struct list_head  list;
};
704
/*
 * INIT_IB_EVENT_HANDLER - initialise a struct ib_event_handler.
 * @_ptr:     pointer to the handler to initialise
 * @_device:  value stored in the handler's device member
 * @_handler: value stored in the handler's handler member
 *
 * Stores the device and callback and initialises the list node.  Each
 * argument is evaluated exactly once, so expressions with side effects
 * (e.g. "h++") are safe to pass.
 */
#define INIT_IB_EVENT_HANDLER(_ptr, _device, _handler)		\
	do {							\
		struct ib_event_handler *__ib_eh = (_ptr);	\
		__ib_eh->device  = (_device);			\
		__ib_eh->handler = (_handler);			\
		INIT_LIST_HEAD(&__ib_eh->list);			\
	} while (0)
711
/*
 * Global route information: destination GID, flow label, hop limit and
 * traffic class, plus the source GID given both as an index and as a
 * pointer to its (const) attribute entry.
 */
struct ib_global_route {
	const struct ib_gid_attr *sgid_attr;
	union ib_gid	dgid;
	u32		flow_label;
	u8		sgid_index;
	u8		hop_limit;
	u8		traffic_class;
};
720
/*
 * GRH layout.  The multi-byte fields are big-endian; the first word packs
 * version, traffic class and flow label, as its name indicates.
 */
struct ib_grh {
	__be32		version_tclass_flow;
	__be16		paylen;
	u8		next_hdr;
	u8		hop_limit;
	union ib_gid	sgid;
	union ib_gid	dgid;
};
729
/*
 * Network header overlay: either an IB GRH, or 20 reserved bytes followed
 * by an IPv4 header.
 */
union rdma_network_hdr {
	struct ib_grh ibgrh;
	struct {
		/* The IB spec states that if it's IPv4, the header
		 * is located in the last 20 bytes of the header.
		 */
		u8		reserved[20];
		struct iphdr	roce4grh;
	};
};
740
Don Hiatt7dafbab2017-05-12 09:19:55 -0700741#define IB_QPN_MASK 0xFFFFFF
742
/* Multicast QPN constant; numerically equal to IB_QPN_MASK (0xFFFFFF). */
enum {
	IB_MULTICAST_QPN = 0xffffff
};
746
Harvey Harrisonf3a7c662009-02-14 22:58:35 -0800747#define IB_LID_PERMISSIVE cpu_to_be16(0xFFFF)
Dennis Dalessandrob4e64392016-01-06 10:04:31 -0800748#define IB_MULTICAST_LID_BASE cpu_to_be16(0xC000)
Sean Hefty97f52eb2005-08-13 21:05:57 -0700749
/* Address handle flags; IB_AH_GRH is the only one defined. */
enum ib_ah_flags {
	IB_AH_GRH	= 1
};
753
/*
 * Rate codes.  The numeric codes are NOT ordered by speed (for example
 * 5 Gbps is 5 while 10 Gbps is 3), so never compare them directly; use
 * ib_rate_to_mult() or ib_rate_to_mbps() to obtain comparable values.
 */
enum ib_rate {
	IB_RATE_PORT_CURRENT = 0,
	IB_RATE_2_5_GBPS = 2,
	IB_RATE_5_GBPS   = 5,
	IB_RATE_10_GBPS  = 3,
	IB_RATE_20_GBPS  = 6,
	IB_RATE_30_GBPS  = 4,
	IB_RATE_40_GBPS  = 7,
	IB_RATE_60_GBPS  = 8,
	IB_RATE_80_GBPS  = 9,
	IB_RATE_120_GBPS = 10,
	IB_RATE_14_GBPS  = 11,
	IB_RATE_56_GBPS  = 12,
	IB_RATE_112_GBPS = 13,
	IB_RATE_168_GBPS = 14,
	IB_RATE_25_GBPS  = 15,
	IB_RATE_100_GBPS = 16,
	IB_RATE_200_GBPS = 17,
	IB_RATE_300_GBPS = 18,
	IB_RATE_28_GBPS  = 19,
	IB_RATE_50_GBPS  = 20,
	IB_RATE_400_GBPS = 21,
	IB_RATE_600_GBPS = 22,
};
778
779/**
780 * ib_rate_to_mult - Convert the IB rate enum to a multiple of the
781 * base rate of 2.5 Gbit/sec. For example, IB_RATE_5_GBPS will be
782 * converted to 2, since 5 Gbit/sec is 2 * 2.5 Gbit/sec.
783 * @rate: rate to convert.
784 */
Roland Dreier8385fd82014-06-04 10:00:16 -0700785__attribute_const__ int ib_rate_to_mult(enum ib_rate rate);
Jack Morgensteinbf6a9e32006-04-10 09:43:47 -0700786
787/**
Marcel Apfelbaum71eeba12011-10-05 14:21:47 +0300788 * ib_rate_to_mbps - Convert the IB rate enum to Mbps.
789 * For example, IB_RATE_2_5_GBPS will be converted to 2500.
790 * @rate: rate to convert.
791 */
Roland Dreier8385fd82014-06-04 10:00:16 -0700792__attribute_const__ int ib_rate_to_mbps(enum ib_rate rate);
Marcel Apfelbaum71eeba12011-10-05 14:21:47 +0300793
Sagi Grimberg17cd3a22014-02-23 14:19:04 +0200794
/**
 * enum ib_mr_type - memory region type
 * @IB_MR_TYPE_MEM_REG:       memory region that is used for
 *                            normal registration
 * @IB_MR_TYPE_SIGNATURE:     memory region that is used for
 *                            signature operations (data-integrity
 *                            capable regions)
 * @IB_MR_TYPE_SG_GAPS:       memory region that is capable of
 *                            registering arbitrary sg lists (without
 *                            the normal mr constraints - see
 *                            ib_map_mr_sg)
 */
enum ib_mr_type {
	IB_MR_TYPE_MEM_REG,
	IB_MR_TYPE_SIGNATURE,
	IB_MR_TYPE_SG_GAPS,
};
812
/**
 * enum ib_signature_type - Signature types
 * @IB_SIG_TYPE_NONE: Unprotected.
 * @IB_SIG_TYPE_T10_DIF: Type T10-DIF
 */
enum ib_signature_type {
	IB_SIG_TYPE_NONE,
	IB_SIG_TYPE_T10_DIF,
};
822
/**
 * enum ib_t10_dif_bg_type - Signature T10-DIF block-guard types
 * @IB_T10DIF_CRC: Corresponds to T10-PI mandated CRC checksum rules.
 * @IB_T10DIF_CSUM: Corresponds to IP checksum rules.
 */
enum ib_t10_dif_bg_type {
	IB_T10DIF_CRC,
	IB_T10DIF_CSUM
};
832
833/**
834 * struct ib_t10_dif_domain - Parameters specific for T10-DIF
835 * domain.
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200836 * @bg_type: T10-DIF block guard type (CRC|CSUM)
837 * @pi_interval: protection information interval.
838 * @bg: seed of guard computation.
839 * @app_tag: application tag of guard block
840 * @ref_tag: initial guard block reference tag.
Sagi Grimberg78eda2b2014-08-13 19:54:35 +0300841 * @ref_remap: Indicate wethear the reftag increments each block
842 * @app_escape: Indicate to skip block check if apptag=0xffff
843 * @ref_escape: Indicate to skip block check if reftag=0xffffffff
844 * @apptag_check_mask: check bitmask of application tag.
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200845 */
846struct ib_t10_dif_domain {
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200847 enum ib_t10_dif_bg_type bg_type;
848 u16 pi_interval;
849 u16 bg;
850 u16 app_tag;
851 u32 ref_tag;
Sagi Grimberg78eda2b2014-08-13 19:54:35 +0300852 bool ref_remap;
853 bool app_escape;
854 bool ref_escape;
855 u16 apptag_check_mask;
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200856};
857
858/**
859 * struct ib_sig_domain - Parameters for signature domain
860 * @sig_type: specific signauture type
861 * @sig: union of all signature domain attributes that may
862 * be used to set domain layout.
863 */
864struct ib_sig_domain {
865 enum ib_signature_type sig_type;
866 union {
867 struct ib_t10_dif_domain dif;
868 } sig;
869};
870
871/**
872 * struct ib_sig_attrs - Parameters for signature handover operation
873 * @check_mask: bitmask for signature byte check (8 bytes)
874 * @mem: memory domain layout desciptor.
875 * @wire: wire domain layout desciptor.
876 */
877struct ib_sig_attrs {
878 u8 check_mask;
879 struct ib_sig_domain mem;
880 struct ib_sig_domain wire;
881};
882
/* Kind of signature error; this is the type of struct ib_sig_err.err_type. */
enum ib_sig_err_type {
	IB_SIG_BAD_GUARD,
	IB_SIG_BAD_REFTAG,
	IB_SIG_BAD_APPTAG,
};
888
/*
 * Signature check masks (8 bytes in total) according to the T10-PI standard:
 *  -------- -------- ------------
 * | GUARD  | APPTAG |   REFTAG   |
 * |  2B    |  2B    |    4B      |
 *  -------- -------- ------------
 *
 * The three masks are disjoint and together cover all 8 bits: 2 bits for
 * GUARD, 2 bits for APPTAG and 4 bits for REFTAG, matching the byte counts
 * in the diagram above.
 */
enum {
	IB_SIG_CHECK_GUARD	= 0xc0,
	IB_SIG_CHECK_APPTAG	= 0x30,
	IB_SIG_CHECK_REFTAG	= 0x0f,
};
901
902/**
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200903 * struct ib_sig_err - signature error descriptor
904 */
905struct ib_sig_err {
906 enum ib_sig_err_type err_type;
907 u32 expected;
908 u32 actual;
909 u64 sig_err_offset;
910 u32 key;
911};
912
/*
 * MR status check bits.
 * NOTE(review): presumably the bits used in ib_mr_status.fail_status - confirm.
 */
enum ib_mr_status_check {
	IB_MR_CHECK_SIG_STATUS = 1,
};
916
917/**
918 * struct ib_mr_status - Memory region status container
919 *
920 * @fail_status: Bitmask of MR checks status. For each
921 * failed check a corresponding status bit is set.
922 * @sig_err: Additional info for IB_MR_CEHCK_SIG_STATUS
923 * failure.
924 */
925struct ib_mr_status {
926 u32 fail_status;
927 struct ib_sig_err sig_err;
928};
929
Marcel Apfelbaum71eeba12011-10-05 14:21:47 +0300930/**
Jack Morgensteinbf6a9e32006-04-10 09:43:47 -0700931 * mult_to_ib_rate - Convert a multiple of 2.5 Gbit/sec to an IB rate
932 * enum.
933 * @mult: multiple to convert.
934 */
Roland Dreier8385fd82014-06-04 10:00:16 -0700935__attribute_const__ enum ib_rate mult_to_ib_rate(int mult);
Jack Morgensteinbf6a9e32006-04-10 09:43:47 -0700936
/*
 * Discriminator for the type-specific part of an address handle attribute;
 * struct rdma_ah_attr carries it in its 'type' member next to a union of
 * ib/roce/opa attributes.  UNDEFINED is the zero value.
 */
enum rdma_ah_attr_type {
	RDMA_AH_ATTR_TYPE_UNDEFINED,
	RDMA_AH_ATTR_TYPE_IB,
	RDMA_AH_ATTR_TYPE_ROCE,
	RDMA_AH_ATTR_TYPE_OPA,
};
943
944struct ib_ah_attr {
945 u16 dlid;
946 u8 src_path_bits;
947};
948
949struct roce_ah_attr {
950 u8 dmac[ETH_ALEN];
951};
952
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -0400953struct opa_ah_attr {
954 u32 dlid;
955 u8 src_path_bits;
Don Hiattd98bb7f2017-08-04 13:54:16 -0700956 bool make_grd;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -0400957};
958
Dasaratharaman Chandramouli90898852017-04-29 14:41:18 -0400959struct rdma_ah_attr {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700960 struct ib_global_route grh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700961 u8 sl;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700962 u8 static_rate;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700963 u8 port_num;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -0400964 u8 ah_flags;
965 enum rdma_ah_attr_type type;
966 union {
967 struct ib_ah_attr ib;
968 struct roce_ah_attr roce;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -0400969 struct opa_ah_attr opa;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -0400970 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700971};
972
/*
 * Work completion status codes (type of struct ib_wc.status).
 * IB_WC_SUCCESS is the zero value; the rest are numbered consecutively.
 */
enum ib_wc_status {
	IB_WC_SUCCESS,
	IB_WC_LOC_LEN_ERR,
	IB_WC_LOC_QP_OP_ERR,
	IB_WC_LOC_EEC_OP_ERR,
	IB_WC_LOC_PROT_ERR,
	IB_WC_WR_FLUSH_ERR,
	IB_WC_MW_BIND_ERR,
	IB_WC_BAD_RESP_ERR,
	IB_WC_LOC_ACCESS_ERR,
	IB_WC_REM_INV_REQ_ERR,
	IB_WC_REM_ACCESS_ERR,
	IB_WC_REM_OP_ERR,
	IB_WC_RETRY_EXC_ERR,
	IB_WC_RNR_RETRY_EXC_ERR,
	IB_WC_LOC_RDD_VIOL_ERR,
	IB_WC_REM_INV_RD_REQ_ERR,
	IB_WC_REM_ABORT_ERR,
	IB_WC_INV_EECN_ERR,
	IB_WC_INV_EEC_STATE_ERR,
	IB_WC_FATAL_ERR,
	IB_WC_RESP_TIMEOUT_ERR,
	IB_WC_GENERAL_ERR
};
997
Bart Van Asschedb7489e2015-08-03 10:01:52 -0700998const char *__attribute_const__ ib_wc_status_msg(enum ib_wc_status status);
Sagi Grimberg2b1b5b62015-05-18 13:40:28 +0300999
/* Work completion opcodes (type of struct ib_wc.opcode). */
enum ib_wc_opcode {
	IB_WC_SEND,
	IB_WC_RDMA_WRITE,
	IB_WC_RDMA_READ,
	IB_WC_COMP_SWAP,
	IB_WC_FETCH_ADD,
	IB_WC_LSO,
	IB_WC_LOCAL_INV,
	IB_WC_REG_MR,
	IB_WC_MASKED_COMP_SWAP,
	IB_WC_MASKED_FETCH_ADD,
/*
 * Set value of IB_WC_RECV so consumers can test if a completion is a
 * receive by testing (opcode & IB_WC_RECV).
 */
	IB_WC_RECV			= 1 << 7,
	IB_WC_RECV_RDMA_WITH_IMM
};
1018
/*
 * Work completion flag bits, one bit each.
 * NOTE(review): presumably OR-ed into ib_wc.wc_flags - confirm.
 */
enum ib_wc_flags {
	IB_WC_GRH		= 1,
	IB_WC_WITH_IMM		= (1<<1),
	IB_WC_WITH_INVALIDATE	= (1<<2),
	IB_WC_IP_CSUM_OK	= (1<<3),
	IB_WC_WITH_SMAC		= (1<<4),
	IB_WC_WITH_VLAN		= (1<<5),
	IB_WC_WITH_NETWORK_HDR_TYPE	= (1<<6),
};
1028
1029struct ib_wc {
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001030 union {
1031 u64 wr_id;
1032 struct ib_cqe *wr_cqe;
1033 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07001034 enum ib_wc_status status;
1035 enum ib_wc_opcode opcode;
1036 u32 vendor_err;
1037 u32 byte_len;
Michael S. Tsirkin062dbb62006-12-31 21:09:42 +02001038 struct ib_qp *qp;
Steve Wise00f7ec32008-07-14 23:48:45 -07001039 union {
1040 __be32 imm_data;
1041 u32 invalidate_rkey;
1042 } ex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043 u32 src_qp;
Bodong Wangcd2a6e72018-01-12 07:58:41 +02001044 u32 slid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001045 int wc_flags;
1046 u16 pkey_index;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001047 u8 sl;
1048 u8 dlid_path_bits;
1049 u8 port_num; /* valid only for DR SMPs on switches */
Matan Barakdd5f03b2013-12-12 18:03:11 +02001050 u8 smac[ETH_ALEN];
1051 u16 vlan_id;
Somnath Koturc865f242015-12-23 14:56:51 +02001052 u8 network_hdr_type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053};
1054
/*
 * CQ notification request flags.  IB_CQ_SOLICITED_MASK is the OR of the
 * two lowest bits (SOLICITED and NEXT_COMP); REPORT_MISSED_EVENTS is a
 * separate bit outside that mask.
 */
enum ib_cq_notify_flags {
	IB_CQ_SOLICITED			= 1 << 0,
	IB_CQ_NEXT_COMP			= 1 << 1,
	IB_CQ_SOLICITED_MASK		= IB_CQ_SOLICITED | IB_CQ_NEXT_COMP,
	IB_CQ_REPORT_MISSED_EVENTS	= 1 << 2,
};
1061
/* Shared receive queue types. */
enum ib_srq_type {
	IB_SRQT_BASIC,
	IB_SRQT_XRC,
	IB_SRQT_TM,
};

/*
 * ib_srq_has_cq - tell whether an SRQ type is one of the CQ-carrying types
 * @srq_type: SRQ type to test
 *
 * Returns true for IB_SRQT_XRC and IB_SRQT_TM, false for every other value.
 */
static inline bool ib_srq_has_cq(enum ib_srq_type srq_type)
{
	switch (srq_type) {
	case IB_SRQT_XRC:
	case IB_SRQT_TM:
		return true;
	default:
		return false;
	}
}
1073
/*
 * Bits naming individual SRQ attributes.
 * NOTE(review): presumably select fields of struct ib_srq_attr on
 * modify - confirm.
 */
enum ib_srq_attr_mask {
	IB_SRQ_MAX_WR	= 1 << 0,
	IB_SRQ_LIMIT	= 1 << 1,
};
1078
1079struct ib_srq_attr {
1080 u32 max_wr;
1081 u32 max_sge;
1082 u32 srq_limit;
1083};
1084
1085struct ib_srq_init_attr {
1086 void (*event_handler)(struct ib_event *, void *);
1087 void *srq_context;
1088 struct ib_srq_attr attr;
Sean Hefty96104ed2011-05-23 16:31:36 -07001089 enum ib_srq_type srq_type;
Sean Hefty418d5132011-05-23 19:42:29 -07001090
Artemy Kovalyov1a56ff62017-08-17 15:52:04 +03001091 struct {
1092 struct ib_cq *cq;
1093 union {
1094 struct {
1095 struct ib_xrcd *xrcd;
1096 } xrc;
Artemy Kovalyov9c2c8492017-08-17 15:52:05 +03001097
1098 struct {
1099 u32 max_num_tags;
1100 } tag_matching;
Artemy Kovalyov1a56ff62017-08-17 15:52:04 +03001101 };
Sean Hefty418d5132011-05-23 19:42:29 -07001102 } ext;
Roland Dreierd41fcc62005-08-18 12:23:08 -07001103};
1104
Linus Torvalds1da177e2005-04-16 15:20:36 -07001105struct ib_qp_cap {
1106 u32 max_send_wr;
1107 u32 max_recv_wr;
1108 u32 max_send_sge;
1109 u32 max_recv_sge;
1110 u32 max_inline_data;
Christoph Hellwiga060b562016-05-03 18:01:09 +02001111
1112 /*
1113 * Maximum number of rdma_rw_ctx structures in flight at a time.
1114 * ib_create_qp() will calculate the right amount of neededed WRs
1115 * and MRs based on this.
1116 */
1117 u32 max_rdma_ctxs;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001118};
1119
/* Send-queue signaling mode (type of ib_qp_init_attr.sq_sig_type). */
enum ib_sig_type {
	IB_SIGNAL_ALL_WR,
	IB_SIGNAL_REQ_WR
};
1124
/*
 * Queue pair types.  Note that value 7 is unused: IB_QPT_RAW_ETHERTYPE is
 * 6 and IB_QPT_RAW_PACKET is pinned to 8, which makes IB_QPT_MAX 11.
 */
enum ib_qp_type {
	/*
	 * IB_QPT_SMI and IB_QPT_GSI have to be the first two entries
	 * here (and in that order) since the MAD layer uses them as
	 * indices into a 2-entry table.
	 */
	IB_QPT_SMI,
	IB_QPT_GSI,

	IB_QPT_RC,
	IB_QPT_UC,
	IB_QPT_UD,
	IB_QPT_RAW_IPV6,
	IB_QPT_RAW_ETHERTYPE,
	IB_QPT_RAW_PACKET = 8,
	IB_QPT_XRC_INI = 9,
	IB_QPT_XRC_TGT,
	IB_QPT_MAX,
	IB_QPT_DRIVER = 0xFF,
	/* Reserve a range for qp types internal to the low level driver.
	 * These qp types will not be visible at the IB core layer, so the
	 * IB_QPT_MAX usages should not be affected in the core layer
	 */
	IB_QPT_RESERVED1 = 0x1000,
	IB_QPT_RESERVED2,
	IB_QPT_RESERVED3,
	IB_QPT_RESERVED4,
	IB_QPT_RESERVED5,
	IB_QPT_RESERVED6,
	IB_QPT_RESERVED7,
	IB_QPT_RESERVED8,
	IB_QPT_RESERVED9,
	IB_QPT_RESERVED10,
};
1159
/*
 * QP creation flag bits.  Bit 7 is currently free and bits 26-31 are
 * reserved for low level drivers.
 */
enum ib_qp_create_flags {
	IB_QP_CREATE_IPOIB_UD_LSO		= 1 << 0,
	IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK	= 1 << 1,
	IB_QP_CREATE_CROSS_CHANNEL              = 1 << 2,
	IB_QP_CREATE_MANAGED_SEND               = 1 << 3,
	IB_QP_CREATE_MANAGED_RECV               = 1 << 4,
	IB_QP_CREATE_NETIF_QP			= 1 << 5,
	IB_QP_CREATE_SIGNATURE_EN		= 1 << 6,
	/* FREE					= 1 << 7, */
	IB_QP_CREATE_SCATTER_FCS		= 1 << 8,
	IB_QP_CREATE_CVLAN_STRIPPING		= 1 << 9,
	IB_QP_CREATE_SOURCE_QPN			= 1 << 10,
	IB_QP_CREATE_PCI_WRITE_END_PADDING	= 1 << 11,
	/* reserve bits 26-31 for low level drivers' internal use */
	IB_QP_CREATE_RESERVED_START		= 1 << 26,
	IB_QP_CREATE_RESERVED_END		= 1 << 31,
};
1177
Yishai Hadas73c40c62013-08-01 18:49:53 +03001178/*
1179 * Note: users may not call ib_close_qp or ib_destroy_qp from the event_handler
1180 * callback to destroy the passed in QP.
1181 */
1182
Linus Torvalds1da177e2005-04-16 15:20:36 -07001183struct ib_qp_init_attr {
Chuck Levereb93c82e2018-09-04 11:45:20 -04001184 /* Consumer's event_handler callback must not block */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001185 void (*event_handler)(struct ib_event *, void *);
Chuck Levereb93c82e2018-09-04 11:45:20 -04001186
Linus Torvalds1da177e2005-04-16 15:20:36 -07001187 void *qp_context;
1188 struct ib_cq *send_cq;
1189 struct ib_cq *recv_cq;
1190 struct ib_srq *srq;
Sean Heftyb42b63c2011-05-23 19:59:25 -07001191 struct ib_xrcd *xrcd; /* XRC TGT QPs only */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001192 struct ib_qp_cap cap;
1193 enum ib_sig_type sq_sig_type;
1194 enum ib_qp_type qp_type;
Nathan Chancellorb56511c2018-09-24 12:57:16 -07001195 u32 create_flags;
Christoph Hellwiga060b562016-05-03 18:01:09 +02001196
1197 /*
1198 * Only needed for special QP types, or when using the RW API.
1199 */
1200 u8 port_num;
Yishai Hadasa9017e22016-05-23 15:20:54 +03001201 struct ib_rwq_ind_table *rwq_ind_tbl;
Yishai Hadas02984cc2017-06-08 16:15:06 +03001202 u32 source_qpn;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001203};
1204
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07001205struct ib_qp_open_attr {
1206 void (*event_handler)(struct ib_event *, void *);
1207 void *qp_context;
1208 u32 qp_num;
1209 enum ib_qp_type qp_type;
1210};
1211
/*
 * RNR timer encodings, codes 0..31.  Code 0 carries the largest number in
 * its name (655_36); codes 1..31 are named in ascending order.
 * NOTE(review): the NNN_NN suffix presumably spells the delay as NNN.NN
 * in some time unit - confirm against the spec.
 */
enum ib_rnr_timeout {
	IB_RNR_TIMER_655_36 =  0,
	IB_RNR_TIMER_000_01 =  1,
	IB_RNR_TIMER_000_02 =  2,
	IB_RNR_TIMER_000_03 =  3,
	IB_RNR_TIMER_000_04 =  4,
	IB_RNR_TIMER_000_06 =  5,
	IB_RNR_TIMER_000_08 =  6,
	IB_RNR_TIMER_000_12 =  7,
	IB_RNR_TIMER_000_16 =  8,
	IB_RNR_TIMER_000_24 =  9,
	IB_RNR_TIMER_000_32 = 10,
	IB_RNR_TIMER_000_48 = 11,
	IB_RNR_TIMER_000_64 = 12,
	IB_RNR_TIMER_000_96 = 13,
	IB_RNR_TIMER_001_28 = 14,
	IB_RNR_TIMER_001_92 = 15,
	IB_RNR_TIMER_002_56 = 16,
	IB_RNR_TIMER_003_84 = 17,
	IB_RNR_TIMER_005_12 = 18,
	IB_RNR_TIMER_007_68 = 19,
	IB_RNR_TIMER_010_24 = 20,
	IB_RNR_TIMER_015_36 = 21,
	IB_RNR_TIMER_020_48 = 22,
	IB_RNR_TIMER_030_72 = 23,
	IB_RNR_TIMER_040_96 = 24,
	IB_RNR_TIMER_061_44 = 25,
	IB_RNR_TIMER_081_92 = 26,
	IB_RNR_TIMER_122_88 = 27,
	IB_RNR_TIMER_163_84 = 28,
	IB_RNR_TIMER_245_76 = 29,
	IB_RNR_TIMER_327_68 = 30,
	IB_RNR_TIMER_491_52 = 31
};
1246
/*
 * Bits naming individual QP attributes, one bit each (bits 0-25).
 * Bits 21-24 are reserved.
 * NOTE(review): presumably select which struct ib_qp_attr fields are
 * valid in a modify/query call - confirm.
 */
enum ib_qp_attr_mask {
	IB_QP_STATE			= 1,
	IB_QP_CUR_STATE			= (1<<1),
	IB_QP_EN_SQD_ASYNC_NOTIFY	= (1<<2),
	IB_QP_ACCESS_FLAGS		= (1<<3),
	IB_QP_PKEY_INDEX		= (1<<4),
	IB_QP_PORT			= (1<<5),
	IB_QP_QKEY			= (1<<6),
	IB_QP_AV			= (1<<7),
	IB_QP_PATH_MTU			= (1<<8),
	IB_QP_TIMEOUT			= (1<<9),
	IB_QP_RETRY_CNT			= (1<<10),
	IB_QP_RNR_RETRY			= (1<<11),
	IB_QP_RQ_PSN			= (1<<12),
	IB_QP_MAX_QP_RD_ATOMIC		= (1<<13),
	IB_QP_ALT_PATH			= (1<<14),
	IB_QP_MIN_RNR_TIMER		= (1<<15),
	IB_QP_SQ_PSN			= (1<<16),
	IB_QP_MAX_DEST_RD_ATOMIC	= (1<<17),
	IB_QP_PATH_MIG_STATE		= (1<<18),
	IB_QP_CAP			= (1<<19),
	IB_QP_DEST_QPN			= (1<<20),
	IB_QP_RESERVED1			= (1<<21),
	IB_QP_RESERVED2			= (1<<22),
	IB_QP_RESERVED3			= (1<<23),
	IB_QP_RESERVED4			= (1<<24),
	IB_QP_RATE_LIMIT		= (1<<25),
};
1275
/* QP states (type of ib_qp_attr.qp_state and ib_qp_attr.cur_qp_state). */
enum ib_qp_state {
	IB_QPS_RESET,
	IB_QPS_INIT,
	IB_QPS_RTR,
	IB_QPS_RTS,
	IB_QPS_SQD,
	IB_QPS_SQE,
	IB_QPS_ERR
};
1285
/* Path migration states (type of ib_qp_attr.path_mig_state). */
enum ib_mig_state {
	IB_MIG_MIGRATED,
	IB_MIG_REARM,
	IB_MIG_ARMED
};
1291
/* Memory window types; the numeric value equals the type number. */
enum ib_mw_type {
	IB_MW_TYPE_1 = 1,
	IB_MW_TYPE_2 = 2
};
1296
Linus Torvalds1da177e2005-04-16 15:20:36 -07001297struct ib_qp_attr {
1298 enum ib_qp_state qp_state;
1299 enum ib_qp_state cur_qp_state;
1300 enum ib_mtu path_mtu;
1301 enum ib_mig_state path_mig_state;
1302 u32 qkey;
1303 u32 rq_psn;
1304 u32 sq_psn;
1305 u32 dest_qp_num;
1306 int qp_access_flags;
1307 struct ib_qp_cap cap;
Dasaratharaman Chandramouli90898852017-04-29 14:41:18 -04001308 struct rdma_ah_attr ah_attr;
1309 struct rdma_ah_attr alt_ah_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310 u16 pkey_index;
1311 u16 alt_pkey_index;
1312 u8 en_sqd_async_notify;
1313 u8 sq_draining;
1314 u8 max_rd_atomic;
1315 u8 max_dest_rd_atomic;
1316 u8 min_rnr_timer;
1317 u8 port_num;
1318 u8 timeout;
1319 u8 retry_cnt;
1320 u8 rnr_retry;
1321 u8 alt_port_num;
1322 u8 alt_timeout;
Bodong Wang528e5a12016-12-01 13:43:14 +02001323 u32 rate_limit;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324};
1325
1326enum ib_wr_opcode {
Jason Gunthorpe9a597392018-08-14 15:33:02 -07001327 /* These are shared with userspace */
1328 IB_WR_RDMA_WRITE = IB_UVERBS_WR_RDMA_WRITE,
1329 IB_WR_RDMA_WRITE_WITH_IMM = IB_UVERBS_WR_RDMA_WRITE_WITH_IMM,
1330 IB_WR_SEND = IB_UVERBS_WR_SEND,
1331 IB_WR_SEND_WITH_IMM = IB_UVERBS_WR_SEND_WITH_IMM,
1332 IB_WR_RDMA_READ = IB_UVERBS_WR_RDMA_READ,
1333 IB_WR_ATOMIC_CMP_AND_SWP = IB_UVERBS_WR_ATOMIC_CMP_AND_SWP,
1334 IB_WR_ATOMIC_FETCH_AND_ADD = IB_UVERBS_WR_ATOMIC_FETCH_AND_ADD,
1335 IB_WR_LSO = IB_UVERBS_WR_TSO,
1336 IB_WR_SEND_WITH_INV = IB_UVERBS_WR_SEND_WITH_INV,
1337 IB_WR_RDMA_READ_WITH_INV = IB_UVERBS_WR_RDMA_READ_WITH_INV,
1338 IB_WR_LOCAL_INV = IB_UVERBS_WR_LOCAL_INV,
1339 IB_WR_MASKED_ATOMIC_CMP_AND_SWP =
1340 IB_UVERBS_WR_MASKED_ATOMIC_CMP_AND_SWP,
1341 IB_WR_MASKED_ATOMIC_FETCH_AND_ADD =
1342 IB_UVERBS_WR_MASKED_ATOMIC_FETCH_AND_ADD,
1343
1344 /* These are kernel only and can not be issued by userspace */
1345 IB_WR_REG_MR = 0x20,
Sagi Grimberg1b01d332014-02-23 14:19:05 +02001346 IB_WR_REG_SIG_MR,
Jason Gunthorpe9a597392018-08-14 15:33:02 -07001347
Jack Morgenstein0134f162013-07-07 17:25:52 +03001348 /* reserve values for low level drivers' internal use.
1349 * These values will not be used at all in the ib core layer.
1350 */
1351 IB_WR_RESERVED1 = 0xf0,
1352 IB_WR_RESERVED2,
1353 IB_WR_RESERVED3,
1354 IB_WR_RESERVED4,
1355 IB_WR_RESERVED5,
1356 IB_WR_RESERVED6,
1357 IB_WR_RESERVED7,
1358 IB_WR_RESERVED8,
1359 IB_WR_RESERVED9,
1360 IB_WR_RESERVED10,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001361};
1362
/*
 * Send work request flag bits.
 * NOTE(review): presumably OR-ed into ib_send_wr.send_flags - confirm.
 */
enum ib_send_flags {
	IB_SEND_FENCE		= 1,
	IB_SEND_SIGNALED	= (1<<1),
	IB_SEND_SOLICITED	= (1<<2),
	IB_SEND_INLINE		= (1<<3),
	IB_SEND_IP_CSUM		= (1<<4),

	/* reserve bits 26-31 for low level drivers' internal use */
	IB_SEND_RESERVED_START	= (1 << 26),
	IB_SEND_RESERVED_END	= (1 << 31),
};
1374
1375struct ib_sge {
1376 u64 addr;
1377 u32 length;
1378 u32 lkey;
1379};
1380
/*
 * struct ib_cqe - holds a 'done' callback taking the CQ and a work
 * completion.  Work requests and completions can point at one through
 * their wr_cqe member, which shares storage with wr_id.
 */
struct ib_cqe {
	void (*done)(struct ib_cq *cq, struct ib_wc *wc);
};
1384
Linus Torvalds1da177e2005-04-16 15:20:36 -07001385struct ib_send_wr {
1386 struct ib_send_wr *next;
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001387 union {
1388 u64 wr_id;
1389 struct ib_cqe *wr_cqe;
1390 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07001391 struct ib_sge *sg_list;
1392 int num_sge;
1393 enum ib_wr_opcode opcode;
1394 int send_flags;
Roland Dreier0f39cf32008-04-16 21:09:32 -07001395 union {
1396 __be32 imm_data;
1397 u32 invalidate_rkey;
1398 } ex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001399};
1400
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001401struct ib_rdma_wr {
1402 struct ib_send_wr wr;
1403 u64 remote_addr;
1404 u32 rkey;
1405};
1406
Bart Van Asschef696bf62018-07-18 09:25:14 -07001407static inline const struct ib_rdma_wr *rdma_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001408{
1409 return container_of(wr, struct ib_rdma_wr, wr);
1410}
1411
1412struct ib_atomic_wr {
1413 struct ib_send_wr wr;
1414 u64 remote_addr;
1415 u64 compare_add;
1416 u64 swap;
1417 u64 compare_add_mask;
1418 u64 swap_mask;
1419 u32 rkey;
1420};
1421
Bart Van Asschef696bf62018-07-18 09:25:14 -07001422static inline const struct ib_atomic_wr *atomic_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001423{
1424 return container_of(wr, struct ib_atomic_wr, wr);
1425}
1426
1427struct ib_ud_wr {
1428 struct ib_send_wr wr;
1429 struct ib_ah *ah;
1430 void *header;
1431 int hlen;
1432 int mss;
1433 u32 remote_qpn;
1434 u32 remote_qkey;
1435 u16 pkey_index; /* valid for GSI only */
1436 u8 port_num; /* valid for DR SMPs on switch only */
1437};
1438
Bart Van Asschef696bf62018-07-18 09:25:14 -07001439static inline const struct ib_ud_wr *ud_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001440{
1441 return container_of(wr, struct ib_ud_wr, wr);
1442}
1443
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001444struct ib_reg_wr {
1445 struct ib_send_wr wr;
1446 struct ib_mr *mr;
1447 u32 key;
1448 int access;
1449};
1450
Bart Van Asschef696bf62018-07-18 09:25:14 -07001451static inline const struct ib_reg_wr *reg_wr(const struct ib_send_wr *wr)
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001452{
1453 return container_of(wr, struct ib_reg_wr, wr);
1454}
1455
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001456struct ib_sig_handover_wr {
1457 struct ib_send_wr wr;
1458 struct ib_sig_attrs *sig_attrs;
1459 struct ib_mr *sig_mr;
1460 int access_flags;
1461 struct ib_sge *prot;
1462};
1463
Bart Van Asschef696bf62018-07-18 09:25:14 -07001464static inline const struct ib_sig_handover_wr *
1465sig_handover_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001466{
1467 return container_of(wr, struct ib_sig_handover_wr, wr);
1468}
1469
Linus Torvalds1da177e2005-04-16 15:20:36 -07001470struct ib_recv_wr {
1471 struct ib_recv_wr *next;
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001472 union {
1473 u64 wr_id;
1474 struct ib_cqe *wr_cqe;
1475 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07001476 struct ib_sge *sg_list;
1477 int num_sge;
1478};
1479
1480enum ib_access_flags {
Jason Gunthorpe4fca0372018-07-11 16:20:44 -06001481 IB_ACCESS_LOCAL_WRITE = IB_UVERBS_ACCESS_LOCAL_WRITE,
1482 IB_ACCESS_REMOTE_WRITE = IB_UVERBS_ACCESS_REMOTE_WRITE,
1483 IB_ACCESS_REMOTE_READ = IB_UVERBS_ACCESS_REMOTE_READ,
1484 IB_ACCESS_REMOTE_ATOMIC = IB_UVERBS_ACCESS_REMOTE_ATOMIC,
1485 IB_ACCESS_MW_BIND = IB_UVERBS_ACCESS_MW_BIND,
1486 IB_ZERO_BASED = IB_UVERBS_ACCESS_ZERO_BASED,
1487 IB_ACCESS_ON_DEMAND = IB_UVERBS_ACCESS_ON_DEMAND,
1488 IB_ACCESS_HUGETLB = IB_UVERBS_ACCESS_HUGETLB,
1489
1490 IB_ACCESS_SUPPORTED = ((IB_ACCESS_HUGETLB << 1) - 1)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001491};
1492
/*
 * XXX: these are apparently used for ->rereg_user_mr, no idea why they
 * are hidden here instead of a uapi header!
 *
 * IB_MR_REREG_SUPPORTED is the OR of the three flag bits (value 7).
 */
enum ib_mr_rereg_flags {
	IB_MR_REREG_TRANS	= 1,
	IB_MR_REREG_PD		= (1<<1),
	IB_MR_REREG_ACCESS	= (1<<2),
	IB_MR_REREG_SUPPORTED	= ((IB_MR_REREG_ACCESS << 1) - 1)
};
1503
Linus Torvalds1da177e2005-04-16 15:20:36 -07001504struct ib_fmr_attr {
1505 int max_pages;
1506 int max_maps;
Or Gerlitzd36f34a2006-02-02 10:43:45 -08001507 u8 page_shift;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001508};
1509
/* Forward declaration only; struct ib_umem is not defined in this section. */
struct ib_umem;
1511
/* Why a uobject is being removed. */
enum rdma_remove_reason {
	/*
	 * Userspace requested uobject deletion or initial try
	 * to remove uobject via cleanup. Call could fail
	 */
	RDMA_REMOVE_DESTROY,
	/* Context deletion. This call should delete the actual object itself */
	RDMA_REMOVE_CLOSE,
	/* Driver is being hot-unplugged. This call should delete the actual object itself */
	RDMA_REMOVE_DRIVER_REMOVE,
	/* uobj is being cleaned-up before being committed */
	RDMA_REMOVE_ABORT,
};
1525
/*
 * RDMA cgroup bookkeeping for an object.  The structure has no members
 * unless CONFIG_CGROUP_RDMA is defined.
 */
struct ib_rdmacg_object {
#ifdef CONFIG_CGROUP_RDMA
	struct rdma_cgroup	*cg;		/* owner rdma cgroup */
#endif
};
1531
Roland Dreiere2773c02005-07-07 17:57:10 -07001532struct ib_ucontext {
1533 struct ib_device *device;
Matan Barak771addf2017-04-04 13:31:41 +03001534 struct ib_uverbs_file *ufile;
Jason Gunthorpee9517472018-07-10 20:55:19 -06001535 /*
1536 * 'closing' can be read by the driver only during a destroy callback,
1537 * it is set when we are closing the file descriptor and indicates
1538 * that mm_sem may be locked.
1539 */
Leon Romanovsky6ceb6332018-09-03 20:18:03 +03001540 bool closing;
Shachar Raindel8ada2c12014-12-11 17:04:17 +02001541
Yishai Hadas1c774832018-06-20 17:11:39 +03001542 bool cleanup_retryable;
Matan Barak38321252017-04-04 13:31:42 +03001543
Jason Gunthorpeb5231b02018-09-16 20:48:04 +03001544 void (*invalidate_range)(struct ib_umem_odp *umem_odp,
Haggai Eran882214e2014-12-11 17:04:18 +02001545 unsigned long start, unsigned long end);
Jason Gunthorpef27a0d52018-09-16 20:48:08 +03001546 struct mutex per_mm_list_lock;
1547 struct list_head per_mm_list;
Parav Pandit43579b52017-01-10 00:02:14 +00001548
1549 struct ib_rdmacg_object cg_obj;
Leon Romanovsky60615212018-11-28 13:16:43 +02001550 /*
1551 * Implementation details of the RDMA core, don't use in drivers:
1552 */
1553 struct rdma_restrack_entry res;
Roland Dreiere2773c02005-07-07 17:57:10 -07001554};
1555
1556struct ib_uobject {
1557 u64 user_handle; /* handle given to us by userspace */
Jason Gunthorpe6a5e9c82018-07-04 11:32:07 +03001558 /* ufile & ucontext owning this object */
1559 struct ib_uverbs_file *ufile;
1560 /* FIXME, save memory: ufile->context == context */
Roland Dreiere2773c02005-07-07 17:57:10 -07001561 struct ib_ucontext *context; /* associated user context */
Roland Dreier9ead1902006-06-17 20:44:49 -07001562 void *object; /* containing object */
Roland Dreiere2773c02005-07-07 17:57:10 -07001563 struct list_head list; /* link to context's list */
Parav Pandit43579b52017-01-10 00:02:14 +00001564 struct ib_rdmacg_object cg_obj; /* rdmacg object */
Roland Dreierb3d636b2008-04-16 21:01:06 -07001565 int id; /* index into kernel idr */
Roland Dreier9ead1902006-06-17 20:44:49 -07001566 struct kref ref;
Matan Barak38321252017-04-04 13:31:42 +03001567 atomic_t usecnt; /* protects exclusive access */
Mike Marciniszynd144da82015-11-02 12:13:25 -05001568 struct rcu_head rcu; /* kfree_rcu() overhead */
Matan Barak38321252017-04-04 13:31:42 +03001569
Jason Gunthorpe6b0d08f2018-08-09 20:14:37 -06001570 const struct uverbs_api_object *uapi_object;
Roland Dreiere2773c02005-07-07 17:57:10 -07001571};
1572
Roland Dreiere2773c02005-07-07 17:57:10 -07001573struct ib_udata {
Yann Droneaud309243e2013-12-11 23:01:44 +01001574 const void __user *inbuf;
Roland Dreiere2773c02005-07-07 17:57:10 -07001575 void __user *outbuf;
1576 size_t inlen;
1577 size_t outlen;
1578};
1579
Linus Torvalds1da177e2005-04-16 15:20:36 -07001580struct ib_pd {
Jason Gunthorpe96249d72015-08-05 14:14:45 -06001581 u32 local_dma_lkey;
Christoph Hellwiged082d32016-09-05 12:56:17 +02001582 u32 flags;
Roland Dreiere2773c02005-07-07 17:57:10 -07001583 struct ib_device *device;
1584 struct ib_uobject *uobject;
1585 atomic_t usecnt; /* count all resources */
Christoph Hellwig50d46332016-09-05 12:56:16 +02001586
Christoph Hellwiged082d32016-09-05 12:56:17 +02001587 u32 unsafe_global_rkey;
1588
Christoph Hellwig50d46332016-09-05 12:56:16 +02001589 /*
1590 * Implementation details of the RDMA core, don't use in drivers:
1591 */
1592 struct ib_mr *__internal_mr;
Leon Romanovsky02d88832018-01-28 11:17:20 +02001593 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001594};
1595
Sean Hefty59991f92011-05-23 17:52:46 -07001596struct ib_xrcd {
1597 struct ib_device *device;
Sean Heftyd3d72d92011-05-26 23:06:44 -07001598 atomic_t usecnt; /* count all exposed resources */
Sean Hefty53d0bd12011-05-24 08:33:46 -07001599 struct inode *inode;
Sean Heftyd3d72d92011-05-26 23:06:44 -07001600
1601 struct mutex tgt_qp_mutex;
1602 struct list_head tgt_qp_list;
Sean Hefty59991f92011-05-23 17:52:46 -07001603};
1604
Linus Torvalds1da177e2005-04-16 15:20:36 -07001605struct ib_ah {
1606 struct ib_device *device;
1607 struct ib_pd *pd;
Roland Dreiere2773c02005-07-07 17:57:10 -07001608 struct ib_uobject *uobject;
Jason Gunthorpe1a1f4602018-06-13 10:22:08 +03001609 const struct ib_gid_attr *sgid_attr;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04001610 enum rdma_ah_attr_type type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001611};
1612
/*
 * Callback type stored in ib_cq.comp_handler: receives the CQ and an
 * opaque context pointer, returns nothing.
 */
typedef void (*ib_comp_handler)(struct ib_cq *cq, void *cq_context);
1614
/* Context from which a CQ is polled; stored in ib_cq.poll_ctx. */
enum ib_poll_context {
	IB_POLL_DIRECT,			/* caller context, no hw completions */
	IB_POLL_SOFTIRQ,		/* poll from softirq context */
	IB_POLL_WORKQUEUE,		/* poll from workqueue */
	IB_POLL_UNBOUND_WORKQUEUE,	/* poll from unbound workqueue */
};
1621
Linus Torvalds1da177e2005-04-16 15:20:36 -07001622struct ib_cq {
Roland Dreiere2773c02005-07-07 17:57:10 -07001623 struct ib_device *device;
1624 struct ib_uobject *uobject;
1625 ib_comp_handler comp_handler;
1626 void (*event_handler)(struct ib_event *, void *);
Dotan Barak4deccd62008-07-14 23:48:44 -07001627 void *cq_context;
Roland Dreiere2773c02005-07-07 17:57:10 -07001628 int cqe;
1629 atomic_t usecnt; /* count number of work queues */
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001630 enum ib_poll_context poll_ctx;
1631 struct ib_wc *wc;
1632 union {
1633 struct irq_poll iop;
1634 struct work_struct work;
1635 };
Jack Morgensteinf7948092018-08-27 08:35:55 +03001636 struct workqueue_struct *comp_wq;
Leon Romanovsky02d88832018-01-28 11:17:20 +02001637 /*
1638 * Implementation details of the RDMA core, don't use in drivers:
1639 */
1640 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001641};
1642
1643struct ib_srq {
Roland Dreierd41fcc62005-08-18 12:23:08 -07001644 struct ib_device *device;
1645 struct ib_pd *pd;
1646 struct ib_uobject *uobject;
1647 void (*event_handler)(struct ib_event *, void *);
1648 void *srq_context;
Sean Hefty96104ed2011-05-23 16:31:36 -07001649 enum ib_srq_type srq_type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001650 atomic_t usecnt;
Sean Hefty418d5132011-05-23 19:42:29 -07001651
Artemy Kovalyov1a56ff62017-08-17 15:52:04 +03001652 struct {
1653 struct ib_cq *cq;
1654 union {
1655 struct {
1656 struct ib_xrcd *xrcd;
1657 u32 srq_num;
1658 } xrc;
1659 };
Sean Hefty418d5132011-05-23 19:42:29 -07001660 } ext;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001661};
1662
/* Raw packet capability bits; each enumerator is a distinct single bit. */
enum ib_raw_packet_caps {
	/* Strip cvlan from incoming packet and report it in the matching work
	 * completion is supported.
	 */
	IB_RAW_PACKET_CAP_CVLAN_STRIPPING = (1 << 0),
	/* Scatter FCS field of an incoming packet to host memory is supported.
	 */
	IB_RAW_PACKET_CAP_SCATTER_FCS = (1 << 1),
	/* Checksum offloads are supported (for both send and receive). */
	IB_RAW_PACKET_CAP_IP_CSUM = (1 << 2),
	/* When a packet is received for an RQ with no receive WQEs, the
	 * packet processing is delayed.
	 */
	IB_RAW_PACKET_CAP_DELAY_DROP = (1 << 3),
};
1678
/* Work queue type; IB_WQT_RQ is the only value defined. */
enum ib_wq_type {
	IB_WQT_RQ
};
1682
/* Work queue states; used by ib_wq.state and struct ib_wq_attr. */
enum ib_wq_state {
	IB_WQS_RESET,
	IB_WQS_RDY,
	IB_WQS_ERR
};
1688
1689struct ib_wq {
1690 struct ib_device *device;
1691 struct ib_uobject *uobject;
1692 void *wq_context;
1693 void (*event_handler)(struct ib_event *, void *);
1694 struct ib_pd *pd;
1695 struct ib_cq *cq;
1696 u32 wq_num;
1697 enum ib_wq_state state;
1698 enum ib_wq_type wq_type;
1699 atomic_t usecnt;
1700};
1701
/*
 * Work queue flag bits. Used for ib_wq_init_attr.create_flags and for
 * ib_wq_attr.flags / ib_wq_attr.flags_mask.
 */
enum ib_wq_flags {
	IB_WQ_FLAGS_CVLAN_STRIPPING = 1 << 0,
	IB_WQ_FLAGS_SCATTER_FCS = 1 << 1,
	IB_WQ_FLAGS_DELAY_DROP = 1 << 2,
	IB_WQ_FLAGS_PCI_WRITE_END_PADDING = 1 << 3,
};
1708
Yishai Hadas5fd251c2016-05-23 15:20:48 +03001709struct ib_wq_init_attr {
1710 void *wq_context;
1711 enum ib_wq_type wq_type;
1712 u32 max_wr;
1713 u32 max_sge;
1714 struct ib_cq *cq;
1715 void (*event_handler)(struct ib_event *, void *);
Noa Osherovich10bac722017-01-18 15:39:55 +02001716 u32 create_flags; /* Use enum ib_wq_flags */
Yishai Hadas5fd251c2016-05-23 15:20:48 +03001717};
1718
/*
 * Attribute-selection bits for a WQ.
 * NOTE(review): presumably each bit selects the matching group of fields
 * in struct ib_wq_attr - confirm against the modify path.
 */
enum ib_wq_attr_mask {
	IB_WQ_STATE = 1 << 0,
	IB_WQ_CUR_STATE = 1 << 1,
	IB_WQ_FLAGS = 1 << 2,
};
1724
1725struct ib_wq_attr {
1726 enum ib_wq_state wq_state;
1727 enum ib_wq_state curr_wq_state;
Noa Osherovich10bac722017-01-18 15:39:55 +02001728 u32 flags; /* Use enum ib_wq_flags */
1729 u32 flags_mask; /* Use enum ib_wq_flags */
Yishai Hadas5fd251c2016-05-23 15:20:48 +03001730};
1731
Yishai Hadas6d397862016-05-23 15:20:51 +03001732struct ib_rwq_ind_table {
1733 struct ib_device *device;
1734 struct ib_uobject *uobject;
1735 atomic_t usecnt;
1736 u32 ind_tbl_num;
1737 u32 log_ind_tbl_size;
1738 struct ib_wq **ind_tbl;
1739};
1740
1741struct ib_rwq_ind_table_init_attr {
1742 u32 log_ind_tbl_size;
1743 /* Each entry is a pointer to Receive Work Queue */
1744 struct ib_wq **ind_tbl;
1745};
1746
/* State of a port/pkey setting; stored in ib_port_pkey.state. */
enum port_pkey_state {
	IB_PORT_PKEY_NOT_VALID = 0,
	IB_PORT_PKEY_VALID = 1,
	IB_PORT_PKEY_LISTED = 2,
};
1752
1753struct ib_qp_security;
1754
1755struct ib_port_pkey {
1756 enum port_pkey_state state;
1757 u16 pkey_index;
1758 u8 port_num;
1759 struct list_head qp_list;
1760 struct list_head to_error_list;
1761 struct ib_qp_security *sec;
1762};
1763
1764struct ib_ports_pkeys {
1765 struct ib_port_pkey main;
1766 struct ib_port_pkey alt;
1767};
1768
1769struct ib_qp_security {
1770 struct ib_qp *qp;
1771 struct ib_device *dev;
1772 /* Hold this mutex when changing port and pkey settings. */
1773 struct mutex mutex;
1774 struct ib_ports_pkeys *ports_pkeys;
1775 /* A list of all open shared QP handles. Required to enforce security
1776 * properly for all users of a shared QP.
1777 */
1778 struct list_head shared_qp_list;
1779 void *security;
1780 bool destroying;
1781 atomic_t error_list_count;
1782 struct completion error_complete;
1783 int error_comps_pending;
1784};
1785
Bart Van Assche632bc3f2016-07-21 13:03:30 -07001786/*
1787 * @max_write_sge: Maximum SGE elements per RDMA WRITE request.
1788 * @max_read_sge: Maximum SGE elements per RDMA READ request.
1789 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001790struct ib_qp {
1791 struct ib_device *device;
1792 struct ib_pd *pd;
1793 struct ib_cq *send_cq;
1794 struct ib_cq *recv_cq;
Christoph Hellwigfffb0382016-05-03 18:01:07 +02001795 spinlock_t mr_lock;
1796 int mrs_used;
Christoph Hellwiga060b562016-05-03 18:01:09 +02001797 struct list_head rdma_mrs;
Christoph Hellwig0e353e32016-05-03 18:01:12 +02001798 struct list_head sig_mrs;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001799 struct ib_srq *srq;
Sean Heftyb42b63c2011-05-23 19:59:25 -07001800 struct ib_xrcd *xrcd; /* XRC TGT QPs only */
Sean Heftyd3d72d92011-05-26 23:06:44 -07001801 struct list_head xrcd_list;
Christoph Hellwigfffb0382016-05-03 18:01:07 +02001802
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001803 /* count times opened, mcast attaches, flow attaches */
1804 atomic_t usecnt;
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07001805 struct list_head open_list;
1806 struct ib_qp *real_qp;
Roland Dreiere2773c02005-07-07 17:57:10 -07001807 struct ib_uobject *uobject;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001808 void (*event_handler)(struct ib_event *, void *);
1809 void *qp_context;
Jason Gunthorpe1a1f4602018-06-13 10:22:08 +03001810 /* sgid_attrs associated with the AV's */
1811 const struct ib_gid_attr *av_sgid_attr;
1812 const struct ib_gid_attr *alt_path_sgid_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001813 u32 qp_num;
Bart Van Assche632bc3f2016-07-21 13:03:30 -07001814 u32 max_write_sge;
1815 u32 max_read_sge;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001816 enum ib_qp_type qp_type;
Yishai Hadasa9017e22016-05-23 15:20:54 +03001817 struct ib_rwq_ind_table *rwq_ind_tbl;
Daniel Jurgensd291f1a2017-05-19 15:48:52 +03001818 struct ib_qp_security *qp_sec;
Noa Osherovich498ca3c2017-08-23 08:35:40 +03001819 u8 port;
Leon Romanovsky02d88832018-01-28 11:17:20 +02001820
1821 /*
1822 * Implementation details of the RDMA core, don't use in drivers:
1823 */
1824 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001825};
1826
Ariel Levkovichbee76d72018-04-05 18:53:24 +03001827struct ib_dm {
1828 struct ib_device *device;
1829 u32 length;
1830 u32 flags;
1831 struct ib_uobject *uobject;
1832 atomic_t usecnt;
1833};
1834
Linus Torvalds1da177e2005-04-16 15:20:36 -07001835struct ib_mr {
Roland Dreiere2773c02005-07-07 17:57:10 -07001836 struct ib_device *device;
1837 struct ib_pd *pd;
Roland Dreiere2773c02005-07-07 17:57:10 -07001838 u32 lkey;
1839 u32 rkey;
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001840 u64 iova;
Parav Panditedd31552017-09-24 21:46:31 +03001841 u64 length;
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001842 unsigned int page_size;
Steve Wised4a85c32016-05-03 18:01:08 +02001843 bool need_inval;
Christoph Hellwigfffb0382016-05-03 18:01:07 +02001844 union {
1845 struct ib_uobject *uobject; /* user */
1846 struct list_head qp_entry; /* FR */
1847 };
Steve Wisefccec5b2018-03-01 13:58:13 -08001848
Ariel Levkovichbe934cc2018-04-05 18:53:25 +03001849 struct ib_dm *dm;
1850
Steve Wisefccec5b2018-03-01 13:58:13 -08001851 /*
1852 * Implementation details of the RDMA core, don't use in drivers:
1853 */
1854 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001855};
1856
1857struct ib_mw {
1858 struct ib_device *device;
1859 struct ib_pd *pd;
Roland Dreiere2773c02005-07-07 17:57:10 -07001860 struct ib_uobject *uobject;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001861 u32 rkey;
Shani Michaeli7083e422013-02-06 16:19:12 +00001862 enum ib_mw_type type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001863};
1864
1865struct ib_fmr {
1866 struct ib_device *device;
1867 struct ib_pd *pd;
1868 struct list_head list;
1869 u32 lkey;
1870 u32 rkey;
1871};
1872
/* Supported steering options; stored in ib_flow_attr.type. */
enum ib_flow_attr_type {
	/* steering according to rule specifications */
	IB_FLOW_ATTR_NORMAL = 0x0,
	/* default unicast and multicast rule -
	 * receive all Eth traffic which isn't steered to any QP
	 */
	IB_FLOW_ATTR_ALL_DEFAULT = 0x1,
	/* default multicast rule -
	 * receive all Eth multicast traffic which isn't steered to any QP
	 */
	IB_FLOW_ATTR_MC_DEFAULT = 0x2,
	/* sniffer rule - receive all port traffic */
	IB_FLOW_ATTR_SNIFFER = 0x3
};
1888
/*
 * Supported steering header types.
 *
 * For the header types below IB_FLOW_SPEC_INNER, bits 4-7 of the value
 * differ per group (0x2x, 0x3x, 0x4x, 0x5x, 0x6x); IB_FLOW_SPEC_LAYER_MASK
 * selects exactly those bits. IB_FLOW_SPEC_INNER is a separate bit
 * (0x100) and the action types start at 0x1000.
 */
enum ib_flow_spec_type {
	/* L2 headers */
	IB_FLOW_SPEC_ETH = 0x20,
	IB_FLOW_SPEC_IB = 0x22,
	/* L3 header */
	IB_FLOW_SPEC_IPV4 = 0x30,
	IB_FLOW_SPEC_IPV6 = 0x31,
	IB_FLOW_SPEC_ESP = 0x34,
	/* L4 headers */
	IB_FLOW_SPEC_TCP = 0x40,
	IB_FLOW_SPEC_UDP = 0x41,
	IB_FLOW_SPEC_VXLAN_TUNNEL = 0x50,
	IB_FLOW_SPEC_GRE = 0x51,
	IB_FLOW_SPEC_MPLS = 0x60,
	IB_FLOW_SPEC_INNER = 0x100,
	/* Actions */
	IB_FLOW_SPEC_ACTION_TAG = 0x1000,
	IB_FLOW_SPEC_ACTION_DROP = 0x1001,
	IB_FLOW_SPEC_ACTION_HANDLE = 0x1002,
	IB_FLOW_SPEC_ACTION_COUNT = 0x1003,
};
#define IB_FLOW_SPEC_LAYER_MASK	0xF0
#define IB_FLOW_SPEC_SUPPORT_LAYERS	10
Matan Barak22878db2013-09-01 18:39:52 +03001913
/* Flow steering rule priority is set according to its domain.
 * Lower domain value means higher priority.
 */
enum ib_flow_domain {
	IB_FLOW_DOMAIN_USER,
	IB_FLOW_DOMAIN_ETHTOOL,
	IB_FLOW_DOMAIN_RFS,
	IB_FLOW_DOMAIN_NIC,
	IB_FLOW_DOMAIN_NUM /* Must be last */
};
1924
/*
 * Flow attribute flag bits. Note that bit 0 is not assigned here: the
 * first flag is 1UL << 1.
 */
enum ib_flow_flags {
	IB_FLOW_ATTR_FLAGS_DONT_TRAP = 1UL << 1, /* Continue match, no steal */
	IB_FLOW_ATTR_FLAGS_EGRESS = 1UL << 2, /* Egress flow */
	IB_FLOW_ATTR_FLAGS_RESERVED = 1UL << 3 /* Must be last */
};
1930
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001931struct ib_flow_eth_filter {
1932 u8 dst_mac[6];
1933 u8 src_mac[6];
1934 __be16 ether_type;
1935 __be16 vlan_tag;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001936 /* Must be last */
1937 u8 real_sz[0];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001938};
1939
1940struct ib_flow_spec_eth {
Moses Reubenfbf46862016-11-14 19:04:51 +02001941 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001942 u16 size;
1943 struct ib_flow_eth_filter val;
1944 struct ib_flow_eth_filter mask;
1945};
1946
Matan Barak240ae002013-11-07 15:25:13 +02001947struct ib_flow_ib_filter {
1948 __be16 dlid;
1949 __u8 sl;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001950 /* Must be last */
1951 u8 real_sz[0];
Matan Barak240ae002013-11-07 15:25:13 +02001952};
1953
1954struct ib_flow_spec_ib {
Moses Reubenfbf46862016-11-14 19:04:51 +02001955 u32 type;
Matan Barak240ae002013-11-07 15:25:13 +02001956 u16 size;
1957 struct ib_flow_ib_filter val;
1958 struct ib_flow_ib_filter mask;
1959};
1960
/* IPv4 header flags */
enum ib_ipv4_flags {
	IB_IPV4_DONT_FRAG = 0x2, /* Don't enable packet fragmentation */
	IB_IPV4_MORE_FRAG = 0x4  /* Set on every fragment of a fragmented
				    packet except the last one */
};
1967
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001968struct ib_flow_ipv4_filter {
1969 __be32 src_ip;
1970 __be32 dst_ip;
Maor Gottlieb989a3a82016-08-30 16:58:33 +03001971 u8 proto;
1972 u8 tos;
1973 u8 ttl;
1974 u8 flags;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001975 /* Must be last */
1976 u8 real_sz[0];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001977};
1978
1979struct ib_flow_spec_ipv4 {
Moses Reubenfbf46862016-11-14 19:04:51 +02001980 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001981 u16 size;
1982 struct ib_flow_ipv4_filter val;
1983 struct ib_flow_ipv4_filter mask;
1984};
1985
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03001986struct ib_flow_ipv6_filter {
1987 u8 src_ip[16];
1988 u8 dst_ip[16];
Maor Gottlieba72c6a22016-08-30 16:58:34 +03001989 __be32 flow_label;
1990 u8 next_hdr;
1991 u8 traffic_class;
1992 u8 hop_limit;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001993 /* Must be last */
1994 u8 real_sz[0];
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03001995};
1996
1997struct ib_flow_spec_ipv6 {
Moses Reubenfbf46862016-11-14 19:04:51 +02001998 u32 type;
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03001999 u16 size;
2000 struct ib_flow_ipv6_filter val;
2001 struct ib_flow_ipv6_filter mask;
2002};
2003
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002004struct ib_flow_tcp_udp_filter {
2005 __be16 dst_port;
2006 __be16 src_port;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03002007 /* Must be last */
2008 u8 real_sz[0];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002009};
2010
2011struct ib_flow_spec_tcp_udp {
Moses Reubenfbf46862016-11-14 19:04:51 +02002012 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002013 u16 size;
2014 struct ib_flow_tcp_udp_filter val;
2015 struct ib_flow_tcp_udp_filter mask;
2016};
2017
Moses Reuben0dbf3332016-11-14 19:04:47 +02002018struct ib_flow_tunnel_filter {
2019 __be32 tunnel_id;
2020 u8 real_sz[0];
2021};
2022
2023/* ib_flow_spec_tunnel describes the Vxlan tunnel
2024 * the tunnel_id from val has the vni value
2025 */
2026struct ib_flow_spec_tunnel {
Moses Reubenfbf46862016-11-14 19:04:51 +02002027 u32 type;
Moses Reuben0dbf3332016-11-14 19:04:47 +02002028 u16 size;
2029 struct ib_flow_tunnel_filter val;
2030 struct ib_flow_tunnel_filter mask;
2031};
2032
Matan Barak56ab0b32018-03-28 09:27:49 +03002033struct ib_flow_esp_filter {
2034 __be32 spi;
2035 __be32 seq;
2036 /* Must be last */
2037 u8 real_sz[0];
2038};
2039
2040struct ib_flow_spec_esp {
2041 u32 type;
2042 u16 size;
2043 struct ib_flow_esp_filter val;
2044 struct ib_flow_esp_filter mask;
2045};
2046
Ariel Levkovichd90e5e52018-05-13 14:33:30 +03002047struct ib_flow_gre_filter {
2048 __be16 c_ks_res0_ver;
2049 __be16 protocol;
2050 __be32 key;
2051 /* Must be last */
2052 u8 real_sz[0];
2053};
2054
2055struct ib_flow_spec_gre {
2056 u32 type;
2057 u16 size;
2058 struct ib_flow_gre_filter val;
2059 struct ib_flow_gre_filter mask;
2060};
2061
Ariel Levkovichb04f0f02018-05-13 14:33:32 +03002062struct ib_flow_mpls_filter {
2063 __be32 tag;
2064 /* Must be last */
2065 u8 real_sz[0];
2066};
2067
2068struct ib_flow_spec_mpls {
2069 u32 type;
2070 u16 size;
2071 struct ib_flow_mpls_filter val;
2072 struct ib_flow_mpls_filter mask;
2073};
2074
Moses Reuben460d0192017-01-18 14:59:48 +02002075struct ib_flow_spec_action_tag {
2076 enum ib_flow_spec_type type;
2077 u16 size;
2078 u32 tag_id;
2079};
2080
Slava Shwartsman483a3962017-04-03 13:13:51 +03002081struct ib_flow_spec_action_drop {
2082 enum ib_flow_spec_type type;
2083 u16 size;
2084};
2085
Matan Barak9b828442018-03-28 09:27:46 +03002086struct ib_flow_spec_action_handle {
2087 enum ib_flow_spec_type type;
2088 u16 size;
2089 struct ib_flow_action *act;
2090};
2091
/* Counter descriptions: packets or bytes. */
enum ib_counters_description {
	IB_COUNTER_PACKETS,
	IB_COUNTER_BYTES,
};
2096
2097struct ib_flow_spec_action_count {
2098 enum ib_flow_spec_type type;
2099 u16 size;
2100 struct ib_counters *counters;
2101};
2102
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002103union ib_flow_spec {
2104 struct {
Moses Reubenfbf46862016-11-14 19:04:51 +02002105 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002106 u16 size;
2107 };
2108 struct ib_flow_spec_eth eth;
Matan Barak240ae002013-11-07 15:25:13 +02002109 struct ib_flow_spec_ib ib;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002110 struct ib_flow_spec_ipv4 ipv4;
2111 struct ib_flow_spec_tcp_udp tcp_udp;
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03002112 struct ib_flow_spec_ipv6 ipv6;
Moses Reuben0dbf3332016-11-14 19:04:47 +02002113 struct ib_flow_spec_tunnel tunnel;
Matan Barak56ab0b32018-03-28 09:27:49 +03002114 struct ib_flow_spec_esp esp;
Ariel Levkovichd90e5e52018-05-13 14:33:30 +03002115 struct ib_flow_spec_gre gre;
Ariel Levkovichb04f0f02018-05-13 14:33:32 +03002116 struct ib_flow_spec_mpls mpls;
Moses Reuben460d0192017-01-18 14:59:48 +02002117 struct ib_flow_spec_action_tag flow_tag;
Slava Shwartsman483a3962017-04-03 13:13:51 +03002118 struct ib_flow_spec_action_drop drop;
Matan Barak9b828442018-03-28 09:27:46 +03002119 struct ib_flow_spec_action_handle action;
Raed Salem7eea23a2018-05-31 16:43:36 +03002120 struct ib_flow_spec_action_count flow_count;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002121};
2122
2123struct ib_flow_attr {
2124 enum ib_flow_attr_type type;
2125 u16 size;
2126 u16 priority;
2127 u32 flags;
2128 u8 num_of_specs;
2129 u8 port;
Matthew Wilcox7654cb12018-06-07 07:57:16 -07002130 union ib_flow_spec flows[];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002131};
2132
/* Flow object: the QP and device it refers to and the bound user object. */
struct ib_flow {
	struct ib_qp *qp;
	struct ib_device *device;
	struct ib_uobject *uobject;
};
2138
/* Flow action types; stored in ib_flow_action.type. */
enum ib_flow_action_type {
	IB_FLOW_ACTION_UNSPECIFIED,
	IB_FLOW_ACTION_ESP = 1,
};
2143
2144struct ib_flow_action_attrs_esp_keymats {
2145 enum ib_uverbs_flow_action_esp_keymat protocol;
2146 union {
2147 struct ib_uverbs_flow_action_esp_keymat_aes_gcm aes_gcm;
2148 } keymat;
2149};
2150
2151struct ib_flow_action_attrs_esp_replays {
2152 enum ib_uverbs_flow_action_esp_replay protocol;
2153 union {
2154 struct ib_uverbs_flow_action_esp_replay_bmp bmp;
2155 } replay;
2156};
2157
/*
 * Flags for ib_flow_action_attrs_esp.flags (a u64).
 *
 * The kernel-only flags start at bit 32, so the enumerators do not fit
 * in an int; this relies on the compiler accepting enumerators wider
 * than int (a GNU extension before C23).
 */
enum ib_flow_action_attrs_esp_flags {
	/* All user-space flags at the top: Use enum ib_uverbs_flow_action_esp_flags
	 * This is done in order to share the same flags between user-space and
	 * kernel and spare an unnecessary translation.
	 */

	/* Kernel flags */
	IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED = 1ULL << 32,
	IB_FLOW_ACTION_ESP_FLAGS_MOD_ESP_ATTRS = 1ULL << 33,
};
2168
2169struct ib_flow_spec_list {
2170 struct ib_flow_spec_list *next;
2171 union ib_flow_spec spec;
2172};
2173
2174struct ib_flow_action_attrs_esp {
2175 struct ib_flow_action_attrs_esp_keymats *keymat;
2176 struct ib_flow_action_attrs_esp_replays *replay;
2177 struct ib_flow_spec_list *encap;
2178 /* Used only if IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED is enabled.
2179 * Value of 0 is a valid value.
2180 */
2181 u32 esn;
2182 u32 spi;
2183 u32 seq;
2184 u32 tfc_pad;
2185 /* Use enum ib_flow_action_attrs_esp_flags */
2186 u64 flags;
2187 u64 hard_limit_pkts;
2188};
2189
2190struct ib_flow_action {
2191 struct ib_device *device;
2192 struct ib_uobject *uobject;
2193 enum ib_flow_action_type type;
2194 atomic_t usecnt;
2195};
2196
/* Forward declarations: only pointers to these types are needed here. */
struct ib_mad_hdr;
struct ib_grh;
2199
/*
 * MAD processing flag bits; IB_MAD_IGNORE_ALL is the OR of the two
 * individual flags.
 */
enum ib_process_mad_flags {
	IB_MAD_IGNORE_MKEY = 1,
	IB_MAD_IGNORE_BKEY = 2,
	IB_MAD_IGNORE_ALL = IB_MAD_IGNORE_MKEY | IB_MAD_IGNORE_BKEY
};
2205
/*
 * MAD processing result. FAILURE is 0; the other values are independent
 * bits and can therefore be combined.
 */
enum ib_mad_result {
	IB_MAD_RESULT_FAILURE = 0, /* (!SUCCESS is the important flag) */
	IB_MAD_RESULT_SUCCESS = 1 << 0, /* MAD was successfully processed */
	IB_MAD_RESULT_REPLY = 1 << 1, /* Reply packet needs to be sent */
	IB_MAD_RESULT_CONSUMED = 1 << 2 /* Packet consumed: stop processing */
};
2212
Jack Wang21d64542017-01-17 10:11:12 +01002213struct ib_port_cache {
Daniel Jurgens883c71f2017-05-19 15:48:51 +03002214 u64 subnet_prefix;
Jack Wang21d64542017-01-17 10:11:12 +01002215 struct ib_pkey_cache *pkey;
2216 struct ib_gid_table *gid;
2217 u8 lmc;
2218 enum ib_port_state port_state;
2219};
2220
Linus Torvalds1da177e2005-04-16 15:20:36 -07002221struct ib_cache {
2222 rwlock_t lock;
2223 struct ib_event_handler event_handler;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002224};
2225
Ira Weiny77386132015-05-13 20:02:58 -04002226struct ib_port_immutable {
2227 int pkey_tbl_len;
2228 int gid_tbl_len;
Ira Weinyf9b22e32015-05-13 20:02:59 -04002229 u32 core_cap_flags;
Ira Weiny337877a2015-06-06 14:38:29 -04002230 u32 max_mad_size;
Ira Weiny77386132015-05-13 20:02:58 -04002231};
2232
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002233struct ib_port_data {
Jason Gunthorpe324e2272019-02-12 21:12:51 -07002234 struct ib_device *ib_dev;
2235
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002236 struct ib_port_immutable immutable;
2237
2238 spinlock_t pkey_list_lock;
2239 struct list_head pkey_list;
Jason Gunthorpe8faea9f2019-02-12 21:12:49 -07002240
2241 struct ib_port_cache cache;
Jason Gunthorpec2261dd2019-02-12 21:12:50 -07002242
2243 spinlock_t netdev_lock;
Jason Gunthorpe324e2272019-02-12 21:12:51 -07002244 struct net_device __rcu *netdev;
2245 struct hlist_node ndev_hash_link;
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002246};
2247
/* rdma netdev type - specifies protocol type */
enum rdma_netdev_t {
	RDMA_NETDEV_OPA_VNIC,
	RDMA_NETDEV_IPOIB,
};
2253
2254/**
2255 * struct rdma_netdev - rdma netdev
2256 * For cases where netstack interfacing is required.
2257 */
2258struct rdma_netdev {
2259 void *clnt_priv;
2260 struct ib_device *hca;
2261 u8 port_num;
2262
Jason Gunthorpe9f49a5b2018-07-29 11:34:56 +03002263 /*
2264 * cleanup function must be specified.
2265 * FIXME: This is only used for OPA_VNIC and that usage should be
2266 * removed too.
2267 */
Niranjana Vishwanathapura8e959602017-06-30 13:14:46 -07002268 void (*free_rdma_netdev)(struct net_device *netdev);
2269
Vishwanathapura, Niranjana2fc77572017-04-12 20:29:20 -07002270 /* control functions */
2271 void (*set_id)(struct net_device *netdev, int id);
Niranjana Vishwanathapuraf0ad83ac2017-04-10 11:22:25 +03002272 /* send packet */
2273 int (*send)(struct net_device *dev, struct sk_buff *skb,
2274 struct ib_ah *address, u32 dqpn);
2275 /* multicast */
2276 int (*attach_mcast)(struct net_device *dev, struct ib_device *hca,
2277 union ib_gid *gid, u16 mlid,
2278 int set_qkey, u32 qkey);
2279 int (*detach_mcast)(struct net_device *dev, struct ib_device *hca,
2280 union ib_gid *gid, u16 mlid);
Vishwanathapura, Niranjana2fc77572017-04-12 20:29:20 -07002281};
2282
Denis Drozdovf6a8a192018-08-14 14:08:51 +03002283struct rdma_netdev_alloc_params {
2284 size_t sizeof_priv;
2285 unsigned int txqs;
2286 unsigned int rxqs;
2287 void *param;
2288
2289 int (*initialize_rdma_netdev)(struct ib_device *device, u8 port_num,
2290 struct net_device *netdev, void *param);
2291};
2292
Raed Salemfa9b1802018-05-31 16:43:31 +03002293struct ib_counters {
2294 struct ib_device *device;
2295 struct ib_uobject *uobject;
2296 /* num of objects attached */
2297 atomic_t usecnt;
2298};
2299
Raed Salem51d7a532018-05-31 16:43:33 +03002300struct ib_counters_read_attr {
2301 u64 *counters_buff;
2302 u32 ncounters;
2303 u32 flags; /* use enum ib_read_counters_flags */
2304};
2305
/* Forward declarations: only pointers to these types are needed here. */
struct uverbs_attr_bundle;
struct iw_cm_id;
struct iw_cm_conn_param;
Matan Barak2eb9bea2018-03-28 09:27:45 +03002309
/*
 * INIT_RDMA_OBJ_SIZE - designated initializer for a size_<ib_struct> field.
 *
 * Evaluates to sizeof(struct drv_struct). The two BUILD_BUG_ON_ZERO terms
 * add compile-time checks (BUILD_BUG_ON_ZERO is defined elsewhere and is
 * expected to break the build for a non-zero argument): @member must sit
 * at offset 0 of struct drv_struct and must have type struct ib_struct.
 */
#define INIT_RDMA_OBJ_SIZE(ib_struct, drv_struct, member)                      \
	.size_##ib_struct =                                                    \
		(sizeof(struct drv_struct) +                                   \
		 BUILD_BUG_ON_ZERO(offsetof(struct drv_struct, member)) +      \
		 BUILD_BUG_ON_ZERO(                                            \
			 !__same_type(((struct drv_struct *)NULL)->member,     \
				      struct ib_struct)))

/*
 * Allocate a zeroed object of (ib_dev)->ops.size_<ib_type> bytes with the
 * given gfp flags and return it as a struct ib_type pointer.
 * @ib_dev is parenthesized so that any pointer expression (e.g. *pp or
 * a ? b : c) can be passed.
 */
#define rdma_zalloc_drv_obj_gfp(ib_dev, ib_type, gfp)                          \
	((struct ib_type *)kzalloc((ib_dev)->ops.size_##ib_type, gfp))

/* Same as rdma_zalloc_drv_obj_gfp() with GFP_KERNEL. */
#define rdma_zalloc_drv_obj(ib_dev, ib_type)                                   \
	rdma_zalloc_drv_obj_gfp(ib_dev, ib_type, GFP_KERNEL)

/* Declare the size_<ib_struct> field that INIT_RDMA_OBJ_SIZE() initializes. */
#define DECLARE_RDMA_OBJ_SIZE(ib_struct) size_t size_##ib_struct
2325
Kamal Heib521ed0d2018-12-10 21:09:30 +02002326/**
2327 * struct ib_device_ops - InfiniBand device operations
2328 * This structure defines all the InfiniBand device operations, providers will
2329 * need to define the supported operations, otherwise they will be set to null.
2330 */
2331struct ib_device_ops {
2332 int (*post_send)(struct ib_qp *qp, const struct ib_send_wr *send_wr,
2333 const struct ib_send_wr **bad_send_wr);
2334 int (*post_recv)(struct ib_qp *qp, const struct ib_recv_wr *recv_wr,
2335 const struct ib_recv_wr **bad_recv_wr);
2336 void (*drain_rq)(struct ib_qp *qp);
2337 void (*drain_sq)(struct ib_qp *qp);
2338 int (*poll_cq)(struct ib_cq *cq, int num_entries, struct ib_wc *wc);
2339 int (*peek_cq)(struct ib_cq *cq, int wc_cnt);
2340 int (*req_notify_cq)(struct ib_cq *cq, enum ib_cq_notify_flags flags);
2341 int (*req_ncomp_notif)(struct ib_cq *cq, int wc_cnt);
2342 int (*post_srq_recv)(struct ib_srq *srq,
2343 const struct ib_recv_wr *recv_wr,
2344 const struct ib_recv_wr **bad_recv_wr);
2345 int (*process_mad)(struct ib_device *device, int process_mad_flags,
2346 u8 port_num, const struct ib_wc *in_wc,
2347 const struct ib_grh *in_grh,
2348 const struct ib_mad_hdr *in_mad, size_t in_mad_size,
2349 struct ib_mad_hdr *out_mad, size_t *out_mad_size,
2350 u16 *out_mad_pkey_index);
2351 int (*query_device)(struct ib_device *device,
2352 struct ib_device_attr *device_attr,
2353 struct ib_udata *udata);
2354 int (*modify_device)(struct ib_device *device, int device_modify_mask,
2355 struct ib_device_modify *device_modify);
2356 void (*get_dev_fw_str)(struct ib_device *device, char *str);
2357 const struct cpumask *(*get_vector_affinity)(struct ib_device *ibdev,
2358 int comp_vector);
2359 int (*query_port)(struct ib_device *device, u8 port_num,
2360 struct ib_port_attr *port_attr);
2361 int (*modify_port)(struct ib_device *device, u8 port_num,
2362 int port_modify_mask,
2363 struct ib_port_modify *port_modify);
2364 /**
2365 * The following mandatory functions are used only at device
2366 * registration. Keep functions such as these at the end of this
2367 * structure to avoid cache line misses when accessing struct ib_device
2368 * in fast paths.
2369 */
2370 int (*get_port_immutable)(struct ib_device *device, u8 port_num,
2371 struct ib_port_immutable *immutable);
2372 enum rdma_link_layer (*get_link_layer)(struct ib_device *device,
2373 u8 port_num);
2374 /**
2375 * When calling get_netdev, the HW vendor's driver should return the
2376 * net device of device @device at port @port_num or NULL if such
2377 * a net device doesn't exist. The vendor driver should call dev_hold
2378 * on this net device. The HW vendor's device driver must guarantee
2379 * that this function returns NULL before the net device has finished
2380 * NETDEV_UNREGISTER state.
2381 */
2382 struct net_device *(*get_netdev)(struct ib_device *device, u8 port_num);
2383 /**
2384 * rdma netdev operation
2385 *
2386 * Driver implementing alloc_rdma_netdev or rdma_netdev_get_params
2387 * must return -EOPNOTSUPP if it doesn't support the specified type.
2388 */
2389 struct net_device *(*alloc_rdma_netdev)(
2390 struct ib_device *device, u8 port_num, enum rdma_netdev_t type,
2391 const char *name, unsigned char name_assign_type,
2392 void (*setup)(struct net_device *));
2393
2394 int (*rdma_netdev_get_params)(struct ib_device *device, u8 port_num,
2395 enum rdma_netdev_t type,
2396 struct rdma_netdev_alloc_params *params);
	/**
	 * query_gid should return the GID value for @device, when @port_num
	 * link layer is either IB or iWarp. It is a no-op if @port_num port
	 * is RoCE link layer.
	 */
2402 int (*query_gid)(struct ib_device *device, u8 port_num, int index,
2403 union ib_gid *gid);
2404 /**
2405 * When calling add_gid, the HW vendor's driver should add the gid
2406 * of device of port at gid index available at @attr. Meta-info of
2407 * that gid (for example, the network device related to this gid) is
2408 * available at @attr. @context allows the HW vendor driver to store
2409 * extra information together with a GID entry. The HW vendor driver may
2410 * allocate memory to contain this information and store it in @context
2411 * when a new GID entry is written to. Params are consistent until the
2412 * next call of add_gid or delete_gid. The function should return 0 on
2413 * success or error otherwise. The function could be called
2414 * concurrently for different ports. This function is only called when
2415 * roce_gid_table is used.
2416 */
2417 int (*add_gid)(const struct ib_gid_attr *attr, void **context);
2418 /**
2419 * When calling del_gid, the HW vendor's driver should delete the
2420 * gid of device @device at gid index gid_index of port port_num
2421 * available in @attr.
2422 * Upon the deletion of a GID entry, the HW vendor must free any
2423 * allocated memory. The caller will clear @context afterwards.
2424 * This function is only called when roce_gid_table is used.
2425 */
2426 int (*del_gid)(const struct ib_gid_attr *attr, void **context);
2427 int (*query_pkey)(struct ib_device *device, u8 port_num, u16 index,
2428 u16 *pkey);
Leon Romanovskya2a074e2019-02-12 20:39:16 +02002429 int (*alloc_ucontext)(struct ib_ucontext *context,
2430 struct ib_udata *udata);
2431 void (*dealloc_ucontext)(struct ib_ucontext *context);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002432 int (*mmap)(struct ib_ucontext *context, struct vm_area_struct *vma);
2433 void (*disassociate_ucontext)(struct ib_ucontext *ibcontext);
Shamir Rabinovitchff23dfa2019-03-31 19:10:07 +03002434 int (*alloc_pd)(struct ib_pd *pd, struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002435 void (*dealloc_pd)(struct ib_pd *pd, struct ib_udata *udata);
Leon Romanovskyd3456912019-04-03 16:42:42 +03002436 int (*create_ah)(struct ib_ah *ah, struct rdma_ah_attr *ah_attr,
2437 u32 flags, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002438 int (*modify_ah)(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
2439 int (*query_ah)(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
Leon Romanovskyd3456912019-04-03 16:42:42 +03002440 void (*destroy_ah)(struct ib_ah *ah, u32 flags);
Leon Romanovsky68e326d2019-04-03 16:42:43 +03002441 int (*create_srq)(struct ib_srq *srq,
2442 struct ib_srq_init_attr *srq_init_attr,
2443 struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002444 int (*modify_srq)(struct ib_srq *srq, struct ib_srq_attr *srq_attr,
2445 enum ib_srq_attr_mask srq_attr_mask,
2446 struct ib_udata *udata);
2447 int (*query_srq)(struct ib_srq *srq, struct ib_srq_attr *srq_attr);
Leon Romanovsky68e326d2019-04-03 16:42:43 +03002448 void (*destroy_srq)(struct ib_srq *srq, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002449 struct ib_qp *(*create_qp)(struct ib_pd *pd,
2450 struct ib_qp_init_attr *qp_init_attr,
2451 struct ib_udata *udata);
2452 int (*modify_qp)(struct ib_qp *qp, struct ib_qp_attr *qp_attr,
2453 int qp_attr_mask, struct ib_udata *udata);
2454 int (*query_qp)(struct ib_qp *qp, struct ib_qp_attr *qp_attr,
2455 int qp_attr_mask, struct ib_qp_init_attr *qp_init_attr);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002456 int (*destroy_qp)(struct ib_qp *qp, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002457 struct ib_cq *(*create_cq)(struct ib_device *device,
2458 const struct ib_cq_init_attr *attr,
Kamal Heib521ed0d2018-12-10 21:09:30 +02002459 struct ib_udata *udata);
2460 int (*modify_cq)(struct ib_cq *cq, u16 cq_count, u16 cq_period);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002461 int (*destroy_cq)(struct ib_cq *cq, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002462 int (*resize_cq)(struct ib_cq *cq, int cqe, struct ib_udata *udata);
2463 struct ib_mr *(*get_dma_mr)(struct ib_pd *pd, int mr_access_flags);
2464 struct ib_mr *(*reg_user_mr)(struct ib_pd *pd, u64 start, u64 length,
2465 u64 virt_addr, int mr_access_flags,
2466 struct ib_udata *udata);
2467 int (*rereg_user_mr)(struct ib_mr *mr, int flags, u64 start, u64 length,
2468 u64 virt_addr, int mr_access_flags,
2469 struct ib_pd *pd, struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002470 int (*dereg_mr)(struct ib_mr *mr, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002471 struct ib_mr *(*alloc_mr)(struct ib_pd *pd, enum ib_mr_type mr_type,
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002472 u32 max_num_sg, struct ib_udata *udata);
Moni Shouaad8a4492018-12-11 13:37:52 +02002473 int (*advise_mr)(struct ib_pd *pd,
2474 enum ib_uverbs_advise_mr_advice advice, u32 flags,
2475 struct ib_sge *sg_list, u32 num_sge,
2476 struct uverbs_attr_bundle *attrs);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002477 int (*map_mr_sg)(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
2478 unsigned int *sg_offset);
2479 int (*check_mr_status)(struct ib_mr *mr, u32 check_mask,
2480 struct ib_mr_status *mr_status);
2481 struct ib_mw *(*alloc_mw)(struct ib_pd *pd, enum ib_mw_type type,
2482 struct ib_udata *udata);
2483 int (*dealloc_mw)(struct ib_mw *mw);
2484 struct ib_fmr *(*alloc_fmr)(struct ib_pd *pd, int mr_access_flags,
2485 struct ib_fmr_attr *fmr_attr);
2486 int (*map_phys_fmr)(struct ib_fmr *fmr, u64 *page_list, int list_len,
2487 u64 iova);
2488 int (*unmap_fmr)(struct list_head *fmr_list);
2489 int (*dealloc_fmr)(struct ib_fmr *fmr);
2490 int (*attach_mcast)(struct ib_qp *qp, union ib_gid *gid, u16 lid);
2491 int (*detach_mcast)(struct ib_qp *qp, union ib_gid *gid, u16 lid);
2492 struct ib_xrcd *(*alloc_xrcd)(struct ib_device *device,
Kamal Heib521ed0d2018-12-10 21:09:30 +02002493 struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002494 int (*dealloc_xrcd)(struct ib_xrcd *xrcd, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002495 struct ib_flow *(*create_flow)(struct ib_qp *qp,
2496 struct ib_flow_attr *flow_attr,
2497 int domain, struct ib_udata *udata);
2498 int (*destroy_flow)(struct ib_flow *flow_id);
2499 struct ib_flow_action *(*create_flow_action_esp)(
2500 struct ib_device *device,
2501 const struct ib_flow_action_attrs_esp *attr,
2502 struct uverbs_attr_bundle *attrs);
2503 int (*destroy_flow_action)(struct ib_flow_action *action);
2504 int (*modify_flow_action_esp)(
2505 struct ib_flow_action *action,
2506 const struct ib_flow_action_attrs_esp *attr,
2507 struct uverbs_attr_bundle *attrs);
2508 int (*set_vf_link_state)(struct ib_device *device, int vf, u8 port,
2509 int state);
2510 int (*get_vf_config)(struct ib_device *device, int vf, u8 port,
2511 struct ifla_vf_info *ivf);
2512 int (*get_vf_stats)(struct ib_device *device, int vf, u8 port,
2513 struct ifla_vf_stats *stats);
2514 int (*set_vf_guid)(struct ib_device *device, int vf, u8 port, u64 guid,
2515 int type);
2516 struct ib_wq *(*create_wq)(struct ib_pd *pd,
2517 struct ib_wq_init_attr *init_attr,
2518 struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002519 int (*destroy_wq)(struct ib_wq *wq, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002520 int (*modify_wq)(struct ib_wq *wq, struct ib_wq_attr *attr,
2521 u32 wq_attr_mask, struct ib_udata *udata);
2522 struct ib_rwq_ind_table *(*create_rwq_ind_table)(
2523 struct ib_device *device,
2524 struct ib_rwq_ind_table_init_attr *init_attr,
2525 struct ib_udata *udata);
2526 int (*destroy_rwq_ind_table)(struct ib_rwq_ind_table *wq_ind_table);
2527 struct ib_dm *(*alloc_dm)(struct ib_device *device,
2528 struct ib_ucontext *context,
2529 struct ib_dm_alloc_attr *attr,
2530 struct uverbs_attr_bundle *attrs);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002531 int (*dealloc_dm)(struct ib_dm *dm, struct uverbs_attr_bundle *attrs);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002532 struct ib_mr *(*reg_dm_mr)(struct ib_pd *pd, struct ib_dm *dm,
2533 struct ib_dm_mr_attr *attr,
2534 struct uverbs_attr_bundle *attrs);
2535 struct ib_counters *(*create_counters)(
2536 struct ib_device *device, struct uverbs_attr_bundle *attrs);
2537 int (*destroy_counters)(struct ib_counters *counters);
2538 int (*read_counters)(struct ib_counters *counters,
2539 struct ib_counters_read_attr *counters_read_attr,
2540 struct uverbs_attr_bundle *attrs);
2541 /**
2542 * alloc_hw_stats - Allocate a struct rdma_hw_stats and fill in the
2543 * driver initialized data. The struct is kfree()'ed by the sysfs
2544 * core when the device is removed. A lifespan of -1 in the return
2545 * struct tells the core to set a default lifespan.
2546 */
2547 struct rdma_hw_stats *(*alloc_hw_stats)(struct ib_device *device,
2548 u8 port_num);
2549 /**
2550 * get_hw_stats - Fill in the counter value(s) in the stats struct.
2551 * @index - The index in the value array we wish to have updated, or
2552 * num_counters if we want all stats updated
2553 * Return codes -
2554 * < 0 - Error, no counters updated
2555 * index - Updated the single counter pointed to by index
2556 * num_counters - Updated all counters (will reset the timestamp
2557 * and prevent further calls for lifespan milliseconds)
	 * Drivers are allowed to update all counters in lieu of just the
	 * one given in index at their option
2560 */
2561 int (*get_hw_stats)(struct ib_device *device,
2562 struct rdma_hw_stats *stats, u8 port, int index);
Parav Panditea4baf72018-12-18 14:28:30 +02002563 /*
	 * This function is called once for each port when an ib device is
2565 * registered.
2566 */
2567 int (*init_port)(struct ib_device *device, u8 port_num,
2568 struct kobject *port_sysfs);
Leon Romanovsky02da3752019-01-30 12:49:02 +02002569 /**
2570 * Allows rdma drivers to add their own restrack attributes.
2571 */
2572 int (*fill_res_entry)(struct sk_buff *msg,
2573 struct rdma_restrack_entry *entry);
Leon Romanovsky21a428a2019-02-03 14:55:51 +02002574
Jason Gunthorped0899892019-02-12 21:12:53 -07002575 /* Device lifecycle callbacks */
2576 /*
Jason Gunthorpeca223542019-02-12 21:12:56 -07002577 * Called after the device becomes registered, before clients are
2578 * attached
2579 */
2580 int (*enable_driver)(struct ib_device *dev);
2581 /*
Jason Gunthorped0899892019-02-12 21:12:53 -07002582 * This is called as part of ib_dealloc_device().
2583 */
2584 void (*dealloc_driver)(struct ib_device *dev);
2585
Kamal Heibdd05cb82019-04-29 14:59:06 +03002586 /* iWarp CM callbacks */
2587 void (*iw_add_ref)(struct ib_qp *qp);
2588 void (*iw_rem_ref)(struct ib_qp *qp);
2589 struct ib_qp *(*iw_get_qp)(struct ib_device *device, int qpn);
2590 int (*iw_connect)(struct iw_cm_id *cm_id,
2591 struct iw_cm_conn_param *conn_param);
2592 int (*iw_accept)(struct iw_cm_id *cm_id,
2593 struct iw_cm_conn_param *conn_param);
2594 int (*iw_reject)(struct iw_cm_id *cm_id, const void *pdata,
2595 u8 pdata_len);
2596 int (*iw_create_listen)(struct iw_cm_id *cm_id, int backlog);
2597 int (*iw_destroy_listen)(struct iw_cm_id *cm_id);
2598
Leon Romanovskyd3456912019-04-03 16:42:42 +03002599 DECLARE_RDMA_OBJ_SIZE(ib_ah);
Leon Romanovsky21a428a2019-02-03 14:55:51 +02002600 DECLARE_RDMA_OBJ_SIZE(ib_pd);
Leon Romanovsky68e326d2019-04-03 16:42:43 +03002601 DECLARE_RDMA_OBJ_SIZE(ib_srq);
Leon Romanovskya2a074e2019-02-12 20:39:16 +02002602 DECLARE_RDMA_OBJ_SIZE(ib_ucontext);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002603};
2604
Parav Panditcebe5562019-02-26 13:56:11 +02002605struct ib_core_device {
2606 /* device must be the first element in structure until,
2607 * union of ib_core_device and device exists in ib_device.
2608 */
2609 struct device dev;
Parav Pandit4e0f7b92019-02-26 13:56:13 +02002610 possible_net_t rdma_net;
Parav Panditcebe5562019-02-26 13:56:11 +02002611 struct kobject *ports_kobj;
2612 struct list_head port_list;
2613 struct ib_device *owner; /* reach back to owner ib_device */
2614};
Leon Romanovsky41eda652019-02-18 22:25:47 +02002615
Parav Panditcebe5562019-02-26 13:56:11 +02002616struct rdma_restrack_root;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002617struct ib_device {
Bart Van Assche0957c292017-03-07 22:56:53 +00002618 /* Do not access @dma_device directly from ULP nor from HW drivers. */
2619 struct device *dma_device;
Kamal Heib3023a1e2018-12-10 21:09:48 +02002620 struct ib_device_ops ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002621 char name[IB_DEVICE_NAME_MAX];
Jason Gunthorpe324e2272019-02-12 21:12:51 -07002622 struct rcu_head rcu_head;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002623
2624 struct list_head event_handler_list;
2625 spinlock_t event_handler_lock;
2626
Jason Gunthorpe921eab12019-02-06 22:41:54 -07002627 struct rw_semaphore client_data_rwsem;
Jason Gunthorpe0df91bb2019-02-06 22:41:53 -07002628 struct xarray client_data;
Jason Gunthorped0899892019-02-12 21:12:53 -07002629 struct mutex unregistration_lock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002630
2631 struct ib_cache cache;
Ira Weiny77386132015-05-13 20:02:58 -04002632 /**
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002633 * port_data is indexed by port number
Ira Weiny77386132015-05-13 20:02:58 -04002634 */
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002635 struct ib_port_data *port_data;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002636
Michael S. Tsirkinf4fd0b22007-05-03 13:48:47 +03002637 int num_comp_vectors;
2638
Roland Dreiere2773c02005-07-07 17:57:10 -07002639 struct module *owner;
Parav Panditcebe5562019-02-26 13:56:11 +02002640 union {
2641 struct device dev;
2642 struct ib_core_device coredev;
2643 };
2644
Parav Panditd4122f52018-10-11 22:31:53 +03002645 /* First group for device attributes,
2646 * Second group for driver provided attributes (optional).
2647 * It is NULL terminated array.
2648 */
2649 const struct attribute_group *groups[3];
Parav Panditadee9f32018-09-05 09:47:58 +03002650
Roland Dreier274c0892005-09-29 14:17:48 -07002651 int uverbs_abi_ver;
Alexander Chiang17a55f72010-02-02 19:09:16 +00002652 u64 uverbs_cmd_mask;
Yann Droneaudf21519b2013-11-06 23:21:49 +01002653 u64 uverbs_ex_cmd_mask;
Roland Dreier274c0892005-09-29 14:17:48 -07002654
Yuval Shaiabd99fde2016-08-25 10:57:07 -07002655 char node_desc[IB_DEVICE_NODE_DESC_MAX];
Sean Heftycf311cd2006-01-10 07:39:34 -08002656 __be64 node_guid;
Steve Wise96f15c02008-07-14 23:48:53 -07002657 u32 local_dma_lkey;
Hal Rosenstock41390322015-06-29 09:57:00 -04002658 u16 is_switch:1;
Gal Pressman6780c4f2019-01-22 10:08:22 +02002659 /* Indicates kernel verbs support, should not be used in drivers */
2660 u16 kverbs_provider:1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002661 u8 node_type;
2662 u8 phys_port_cnt;
Ira Weiny3e153a92015-12-18 10:59:44 +02002663 struct ib_device_attr attrs;
Christoph Lameterb40f4752016-05-16 12:49:33 -05002664 struct attribute_group *hw_stats_ag;
2665 struct rdma_hw_stats *hw_stats;
Ira Weiny77386132015-05-13 20:02:58 -04002666
Parav Pandit43579b52017-01-10 00:02:14 +00002667#ifdef CONFIG_CGROUP_RDMA
2668 struct rdmacg_device cg_device;
2669#endif
2670
Leon Romanovskyecc82c52017-06-18 14:39:59 +03002671 u32 index;
Leon Romanovsky41eda652019-02-18 22:25:47 +02002672 struct rdma_restrack_root *res;
Leon Romanovskyecc82c52017-06-18 14:39:59 +03002673
Jason Gunthorpe0cbf4322018-11-12 22:59:50 +02002674 const struct uapi_definition *driver_def;
Matan Barak0ede73b2018-03-19 15:02:34 +02002675 enum rdma_driver_id driver_id;
Jason Gunthorped79af722019-01-10 14:02:24 -07002676
Parav Pandit01b67112018-11-16 03:50:57 +02002677 /*
Jason Gunthorped79af722019-01-10 14:02:24 -07002678 * Positive refcount indicates that the device is currently
2679 * registered and cannot be unregistered.
Parav Pandit01b67112018-11-16 03:50:57 +02002680 */
2681 refcount_t refcount;
2682 struct completion unreg_completion;
Jason Gunthorped0899892019-02-12 21:12:53 -07002683 struct work_struct unregistration_work;
Steve Wise3856ec42019-02-15 11:03:53 -08002684
2685 const struct rdma_link_ops *link_ops;
Parav Pandit4e0f7b92019-02-26 13:56:13 +02002686
2687 /* Protects compat_devs xarray modifications */
2688 struct mutex compat_devs_mutex;
2689 /* Maintains compat devices for each net namespace */
2690 struct xarray compat_devs;
Kamal Heibdd05cb82019-04-29 14:59:06 +03002691
2692 /* Used by iWarp CM */
2693 char iw_ifname[IFNAMSIZ];
2694 u32 iw_driver_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002695};
2696
2697struct ib_client {
Jason Gunthorpee59178d2019-02-06 22:41:52 -07002698 const char *name;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002699 void (*add) (struct ib_device *);
Haggai Eran7c1eb452015-07-30 17:50:14 +03002700 void (*remove)(struct ib_device *, void *client_data);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002701
Yotam Kenneth9268f722015-07-30 17:50:15 +03002702 /* Returns the net_dev belonging to this ib_client and matching the
2703 * given parameters.
2704 * @dev: An RDMA device that the net_dev use for communication.
2705 * @port: A physical port number on the RDMA device.
2706 * @pkey: P_Key that the net_dev uses if applicable.
2707 * @gid: A GID that the net_dev uses to communicate.
2708 * @addr: An IP address the net_dev is configured with.
2709 * @client_data: The device's client data set by ib_set_client_data().
2710 *
2711 * An ib_client that implements a net_dev on top of RDMA devices
2712 * (such as IP over IB) should implement this callback, allowing the
2713 * rdma_cm module to find the right net_dev for a given request.
2714 *
2715 * The caller is responsible for calling dev_put on the returned
2716 * netdev. */
2717 struct net_device *(*get_net_dev_by_params)(
2718 struct ib_device *dev,
2719 u8 port,
2720 u16 pkey,
2721 const union ib_gid *gid,
2722 const struct sockaddr *addr,
2723 void *client_data);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002724 struct list_head list;
Jason Gunthorpee59178d2019-02-06 22:41:52 -07002725 u32 client_id;
Gal Pressman6780c4f2019-01-22 10:08:22 +02002726
2727 /* kverbs are not required by the client */
2728 u8 no_kverbs_req:1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002729};
2730
Shiraz Saleema8082732019-05-06 08:53:33 -05002731/*
2732 * IB block DMA iterator
2733 *
2734 * Iterates the DMA-mapped SGL in contiguous memory blocks aligned
2735 * to a HW supported page size.
2736 */
2737struct ib_block_iter {
2738 /* internal states */
2739 struct scatterlist *__sg; /* sg holding the current aligned block */
2740 dma_addr_t __dma_addr; /* unaligned DMA address of this block */
2741 unsigned int __sg_nents; /* number of SG entries */
2742 unsigned int __sg_advance; /* number of bytes to advance in sg in next step */
2743 unsigned int __pg_bit; /* alignment of current block */
2744};
2745
struct ib_device *_ib_alloc_device(size_t size);

/**
 * ib_alloc_device - allocate a driver structure that embeds an ib_device
 * @drv_struct: driver structure tag (written without the "struct" keyword)
 * @member: name of the struct ib_device member inside @drv_struct
 *
 * Passes sizeof(struct drv_struct) to _ib_alloc_device() and converts the
 * returned ib_device pointer to the enclosing driver structure with
 * container_of(). BUILD_BUG_ON_ZERO() breaks the build unless @member sits
 * at offset 0 of @drv_struct, so the conversion does not move the pointer.
 */
#define ib_alloc_device(drv_struct, member)                                    \
	container_of(_ib_alloc_device(sizeof(struct drv_struct) +              \
				      BUILD_BUG_ON_ZERO(offsetof(              \
					      struct drv_struct, member))),    \
		     struct drv_struct, member)
2752
/* Device allocation counterpart and firmware string query. */
void ib_dealloc_device(struct ib_device *device);

void ib_get_device_fw_str(struct ib_device *device, char *str);

/* Device registration and the available unregistration variants. */
int ib_register_device(struct ib_device *device, const char *name);
void ib_unregister_device(struct ib_device *device);
void ib_unregister_driver(enum rdma_driver_id driver_id);
void ib_unregister_device_and_put(struct ib_device *device);
void ib_unregister_device_queued(struct ib_device *ib_dev);

/* Client registration. */
int ib_register_client(struct ib_client *client);
void ib_unregister_client(struct ib_client *client);
2765
/* Iterator primitives used by the rdma_for_each_block() loop macro. */
void __rdma_block_iter_start(struct ib_block_iter *biter,
			     struct scatterlist *sglist,
			     unsigned int nents,
			     unsigned long pgsz);
bool __rdma_block_iter_next(struct ib_block_iter *biter);
2771
2772/**
2773 * rdma_block_iter_dma_address - get the aligned dma address of the current
2774 * block held by the block iterator.
2775 * @biter: block iterator holding the memory block
2776 */
2777static inline dma_addr_t
2778rdma_block_iter_dma_address(struct ib_block_iter *biter)
2779{
2780 return biter->__dma_addr & ~(BIT_ULL(biter->__pg_bit) - 1);
2781}
2782
/**
 * rdma_for_each_block - iterate over contiguous memory blocks of the sg list
 * @sglist: sglist to iterate over
 * @biter: block iterator holding the memory block
 * @nents: maximum number of sg entries to iterate over
 * @pgsz: best HW supported page size to use
 *
 * Callers may use rdma_block_iter_dma_address() to get each
 * block's aligned DMA address.
 */
#define rdma_for_each_block(sglist, biter, nents, pgsz)		\
	for (__rdma_block_iter_start(biter, sglist, nents,	\
				     pgsz);			\
	     __rdma_block_iter_next(biter);)
2797
Jason Gunthorpe0df91bb2019-02-06 22:41:53 -07002798/**
2799 * ib_get_client_data - Get IB client context
2800 * @device:Device to get context for
2801 * @client:Client to get context for
2802 *
2803 * ib_get_client_data() returns the client context data set with
2804 * ib_set_client_data(). This can only be called while the client is
2805 * registered to the device, once the ib_client remove() callback returns this
2806 * cannot be called.
2807 */
2808static inline void *ib_get_client_data(struct ib_device *device,
2809 struct ib_client *client)
2810{
2811 return xa_load(&device->client_data, client->client_id);
2812}
/* Setters for per-client context data and for the device's ops table. */
void ib_set_client_data(struct ib_device *device, struct ib_client *client,
			void *data);
void ib_set_device_ops(struct ib_device *device,
		       const struct ib_device_ops *ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002817
Jason Gunthorpe5f9794d2018-09-16 20:43:08 +03002818#if IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS)
2819int rdma_user_mmap_io(struct ib_ucontext *ucontext, struct vm_area_struct *vma,
2820 unsigned long pfn, unsigned long size, pgprot_t prot);
Jason Gunthorpe5f9794d2018-09-16 20:43:08 +03002821#else
2822static inline int rdma_user_mmap_io(struct ib_ucontext *ucontext,
2823 struct vm_area_struct *vma,
2824 unsigned long pfn, unsigned long size,
2825 pgprot_t prot)
2826{
2827 return -EINVAL;
2828}
Jason Gunthorpe5f9794d2018-09-16 20:43:08 +03002829#endif
2830
Roland Dreiere2773c02005-07-07 17:57:10 -07002831static inline int ib_copy_from_udata(void *dest, struct ib_udata *udata, size_t len)
2832{
2833 return copy_from_user(dest, udata->inbuf, len) ? -EFAULT : 0;
2834}
2835
2836static inline int ib_copy_to_udata(struct ib_udata *udata, void *src, size_t len)
2837{
Yann Droneaud43c611652015-02-05 22:10:18 +01002838 return copy_to_user(udata->outbuf, src, len) ? -EFAULT : 0;
Roland Dreiere2773c02005-07-07 17:57:10 -07002839}
2840
Matan Barakc66db312018-03-19 15:02:36 +02002841static inline bool ib_is_buffer_cleared(const void __user *p,
2842 size_t len)
Matan Barak301a7212015-12-15 20:30:10 +02002843{
Markus Elfring92d27ae2016-08-22 18:23:24 +02002844 bool ret;
Matan Barak301a7212015-12-15 20:30:10 +02002845 u8 *buf;
2846
2847 if (len > USHRT_MAX)
2848 return false;
2849
Markus Elfring92d27ae2016-08-22 18:23:24 +02002850 buf = memdup_user(p, len);
2851 if (IS_ERR(buf))
Matan Barak301a7212015-12-15 20:30:10 +02002852 return false;
2853
Matan Barak301a7212015-12-15 20:30:10 +02002854 ret = !memchr_inv(buf, 0, len);
Matan Barak301a7212015-12-15 20:30:10 +02002855 kfree(buf);
2856 return ret;
2857}
2858
Matan Barakc66db312018-03-19 15:02:36 +02002859static inline bool ib_is_udata_cleared(struct ib_udata *udata,
2860 size_t offset,
2861 size_t len)
2862{
2863 return ib_is_buffer_cleared(udata->inbuf + offset, len);
2864}
2865
Roland Dreier8a518662006-02-13 12:48:12 -08002866/**
Yishai Hadas1c774832018-06-20 17:11:39 +03002867 * ib_is_destroy_retryable - Check whether the uobject destruction
2868 * is retryable.
2869 * @ret: The initial destruction return code
2870 * @why: remove reason
2871 * @uobj: The uobject that is destroyed
2872 *
2873 * This function is a helper function that IB layer and low-level drivers
2874 * can use to consider whether the destruction of the given uobject is
2875 * retry-able.
2876 * It checks the original return code, if it wasn't success the destruction
2877 * is retryable according to the ucontext state (i.e. cleanup_retryable) and
2878 * the remove reason. (i.e. why).
2879 * Must be called with the object locked for destroy.
2880 */
2881static inline bool ib_is_destroy_retryable(int ret, enum rdma_remove_reason why,
2882 struct ib_uobject *uobj)
2883{
2884 return ret && (why == RDMA_REMOVE_DESTROY ||
2885 uobj->context->cleanup_retryable);
2886}
2887
2888/**
2889 * ib_destroy_usecnt - Called during destruction to check the usecnt
2890 * @usecnt: The usecnt atomic
2891 * @why: remove reason
2892 * @uobj: The uobject that is destroyed
2893 *
2894 * Non-zero usecnts will block destruction unless destruction was triggered by
2895 * a ucontext cleanup.
2896 */
2897static inline int ib_destroy_usecnt(atomic_t *usecnt,
2898 enum rdma_remove_reason why,
2899 struct ib_uobject *uobj)
2900{
2901 if (atomic_read(usecnt) && ib_is_destroy_retryable(-EBUSY, why, uobj))
2902 return -EBUSY;
2903 return 0;
2904}
2905
/**
 * ib_modify_qp_is_ok - Check that the supplied attribute mask
 * contains all required attributes and no attributes not allowed for
 * the given QP state transition.
 * @cur_state: Current QP state
 * @next_state: Next QP state
 * @type: QP type
 * @mask: Mask of supplied QP attributes
 *
 * This function is a helper function that a low-level driver's
 * modify_qp method can use to validate the consumer's input.  It
 * checks that cur_state and next_state are valid QP states, that a
 * transition from cur_state to next_state is allowed by the IB spec,
 * and that the attribute mask supplied is allowed for the transition.
 */
bool ib_modify_qp_is_ok(enum ib_qp_state cur_state, enum ib_qp_state next_state,
			enum ib_qp_type type, enum ib_qp_attr_mask mask);
Roland Dreier8a518662006-02-13 12:48:12 -08002923
Leon Romanovskydcc98812017-08-17 15:50:36 +03002924void ib_register_event_handler(struct ib_event_handler *event_handler);
2925void ib_unregister_event_handler(struct ib_event_handler *event_handler);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002926void ib_dispatch_event(struct ib_event *event);
2927
Linus Torvalds1da177e2005-04-16 15:20:36 -07002928int ib_query_port(struct ib_device *device,
2929 u8 port_num, struct ib_port_attr *port_attr);
2930
Eli Cohena3f5ada2010-09-27 17:51:10 -07002931enum rdma_link_layer rdma_port_get_link_layer(struct ib_device *device,
2932 u8 port_num);
2933
Ira Weiny0cf18d72015-05-13 20:02:55 -04002934/**
Hal Rosenstock41390322015-06-29 09:57:00 -04002935 * rdma_cap_ib_switch - Check if the device is IB switch
2936 * @device: Device to check
2937 *
2938 * Device driver is responsible for setting is_switch bit on
2939 * in ib_device structure at init time.
2940 *
2941 * Return: true if the device is IB switch.
2942 */
2943static inline bool rdma_cap_ib_switch(const struct ib_device *device)
2944{
2945 return device->is_switch;
2946}
2947
2948/**
Ira Weiny0cf18d72015-05-13 20:02:55 -04002949 * rdma_start_port - Return the first valid port number for the device
2950 * specified
2951 *
2952 * @device: Device to be checked
2953 *
2954 * Return start port number
2955 */
2956static inline u8 rdma_start_port(const struct ib_device *device)
2957{
Hal Rosenstock41390322015-06-29 09:57:00 -04002958 return rdma_cap_ib_switch(device) ? 0 : 1;
Ira Weiny0cf18d72015-05-13 20:02:55 -04002959}
2960
/**
 * rdma_for_each_port - Iterate over all valid port numbers of the IB device
 * @device: The struct ib_device * to iterate over
 * @iter: The unsigned int to store the port number
 *
 * Runs @iter from rdma_start_port(@device) to rdma_end_port(@device)
 * inclusive. BUILD_BUG_ON_ZERO() breaks the build unless @iter has type
 * unsigned int.
 */
#define rdma_for_each_port(device, iter)                                       \
	for (iter = rdma_start_port((device) +                                 \
				    BUILD_BUG_ON_ZERO(!__same_type(            \
					    unsigned int, iter)));             \
	     iter <= rdma_end_port(device); (iter)++)
2970
2971/**
Ira Weiny0cf18d72015-05-13 20:02:55 -04002972 * rdma_end_port - Return the last valid port number for the device
2973 * specified
2974 *
2975 * @device: Device to be checked
2976 *
2977 * Return last port number
2978 */
2979static inline u8 rdma_end_port(const struct ib_device *device)
2980{
Hal Rosenstock41390322015-06-29 09:57:00 -04002981 return rdma_cap_ib_switch(device) ? 0 : device->phys_port_cnt;
Ira Weiny0cf18d72015-05-13 20:02:55 -04002982}
2983
/**
 * rdma_is_port_valid - Check that a port number is in range for the device
 * @device: Device to check against
 * @port: Port number to validate
 *
 * Return: non-zero if @port lies between rdma_start_port() and
 * rdma_end_port() of @device inclusive, 0 otherwise.
 */
static inline int rdma_is_port_valid(const struct ib_device *device,
				     unsigned int port)
{
	return (port >= rdma_start_port(device) &&
		port <= rdma_end_port(device));
}
2990
Artemy Kovalyovb02289b2018-07-04 15:57:50 +03002991static inline bool rdma_is_grh_required(const struct ib_device *device,
2992 u8 port_num)
2993{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002994 return device->port_data[port_num].immutable.core_cap_flags &
2995 RDMA_CORE_PORT_IB_GRH_REQUIRED;
Artemy Kovalyovb02289b2018-07-04 15:57:50 +03002996}
2997
Ira Weiny5ede9282015-05-31 17:15:29 -04002998static inline bool rdma_protocol_ib(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02002999{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003000 return device->port_data[port_num].immutable.core_cap_flags &
3001 RDMA_CORE_CAP_PROT_IB;
Michael Wangde66be92015-05-05 14:50:19 +02003002}
3003
Ira Weiny5ede9282015-05-31 17:15:29 -04003004static inline bool rdma_protocol_roce(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02003005{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003006 return device->port_data[port_num].immutable.core_cap_flags &
3007 (RDMA_CORE_CAP_PROT_ROCE | RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP);
Matan Barak7766a992015-12-23 14:56:50 +02003008}
3009
3010static inline bool rdma_protocol_roce_udp_encap(const struct ib_device *device, u8 port_num)
3011{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003012 return device->port_data[port_num].immutable.core_cap_flags &
3013 RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP;
Matan Barak7766a992015-12-23 14:56:50 +02003014}
3015
3016static inline bool rdma_protocol_roce_eth_encap(const struct ib_device *device, u8 port_num)
3017{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003018 return device->port_data[port_num].immutable.core_cap_flags &
3019 RDMA_CORE_CAP_PROT_ROCE;
Michael Wangde66be92015-05-05 14:50:19 +02003020}
3021
Ira Weiny5ede9282015-05-31 17:15:29 -04003022static inline bool rdma_protocol_iwarp(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02003023{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003024 return device->port_data[port_num].immutable.core_cap_flags &
3025 RDMA_CORE_CAP_PROT_IWARP;
Michael Wangde66be92015-05-05 14:50:19 +02003026}
3027
Ira Weiny5ede9282015-05-31 17:15:29 -04003028static inline bool rdma_ib_or_roce(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02003029{
Matan Barak7766a992015-12-23 14:56:50 +02003030 return rdma_protocol_ib(device, port_num) ||
3031 rdma_protocol_roce(device, port_num);
Michael Wangde66be92015-05-05 14:50:19 +02003032}
3033
Or Gerlitzaa773bd2017-01-24 13:02:35 +02003034static inline bool rdma_protocol_raw_packet(const struct ib_device *device, u8 port_num)
3035{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003036 return device->port_data[port_num].immutable.core_cap_flags &
3037 RDMA_CORE_CAP_PROT_RAW_PACKET;
Or Gerlitzaa773bd2017-01-24 13:02:35 +02003038}
3039
Or Gerlitzce1e0552017-01-24 13:02:38 +02003040static inline bool rdma_protocol_usnic(const struct ib_device *device, u8 port_num)
3041{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003042 return device->port_data[port_num].immutable.core_cap_flags &
3043 RDMA_CORE_CAP_PROT_USNIC;
Or Gerlitzce1e0552017-01-24 13:02:38 +02003044}
3045
Michael Wangc757dea2015-05-05 14:50:32 +02003046/**
Michael Wang296ec002015-05-18 10:41:45 +02003047 * rdma_cap_ib_mad - Check if the port of a device supports Infiniband
Michael Wangc757dea2015-05-05 14:50:32 +02003048 * Management Datagrams.
Michael Wang296ec002015-05-18 10:41:45 +02003049 * @device: Device to check
3050 * @port_num: Port number to check
Michael Wangc757dea2015-05-05 14:50:32 +02003051 *
Michael Wang296ec002015-05-18 10:41:45 +02003052 * Management Datagrams (MAD) are a required part of the InfiniBand
3053 * specification and are supported on all InfiniBand devices. A slightly
3054 * extended version are also supported on OPA interfaces.
Michael Wangc757dea2015-05-05 14:50:32 +02003055 *
Michael Wang296ec002015-05-18 10:41:45 +02003056 * Return: true if the port supports sending/receiving of MAD packets.
Michael Wangc757dea2015-05-05 14:50:32 +02003057 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003058static inline bool rdma_cap_ib_mad(const struct ib_device *device, u8 port_num)
Michael Wangc757dea2015-05-05 14:50:32 +02003059{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003060 return device->port_data[port_num].immutable.core_cap_flags &
3061 RDMA_CORE_CAP_IB_MAD;
Michael Wangc757dea2015-05-05 14:50:32 +02003062}
3063
Michael Wang29541e32015-05-05 14:50:33 +02003064/**
Ira Weiny65995fe2015-06-06 14:38:32 -04003065 * rdma_cap_opa_mad - Check if the port of device provides support for OPA
3066 * Management Datagrams.
3067 * @device: Device to check
3068 * @port_num: Port number to check
3069 *
3070 * Intel OmniPath devices extend and/or replace the InfiniBand Management
3071 * datagrams with their own versions. These OPA MADs share many but not all of
3072 * the characteristics of InfiniBand MADs.
3073 *
3074 * OPA MADs differ in the following ways:
3075 *
3076 * 1) MADs are variable size up to 2K
3077 * IBTA defined MADs remain fixed at 256 bytes
3078 * 2) OPA SMPs must carry valid PKeys
3079 * 3) OPA SMP packets are a different format
3080 *
3081 * Return: true if the port supports OPA MAD packet formats.
3082 */
3083static inline bool rdma_cap_opa_mad(struct ib_device *device, u8 port_num)
3084{
Leon Romanovskyd3243da2019-03-10 17:27:46 +02003085 return device->port_data[port_num].immutable.core_cap_flags &
3086 RDMA_CORE_CAP_OPA_MAD;
Ira Weiny65995fe2015-06-06 14:38:32 -04003087}
3088
3089/**
Michael Wang296ec002015-05-18 10:41:45 +02003090 * rdma_cap_ib_smi - Check if the port of a device provides an Infiniband
3091 * Subnet Management Agent (SMA) on the Subnet Management Interface (SMI).
3092 * @device: Device to check
3093 * @port_num: Port number to check
Michael Wang29541e32015-05-05 14:50:33 +02003094 *
Michael Wang296ec002015-05-18 10:41:45 +02003095 * Each InfiniBand node is required to provide a Subnet Management Agent
3096 * that the subnet manager can access. Prior to the fabric being fully
3097 * configured by the subnet manager, the SMA is accessed via a well known
3098 * interface called the Subnet Management Interface (SMI). This interface
3099 * uses directed route packets to communicate with the SM to get around the
3100 * chicken and egg problem of the SM needing to know what's on the fabric
3101 * in order to configure the fabric, and needing to configure the fabric in
3102 * order to send packets to the devices on the fabric. These directed
3103 * route packets do not need the fabric fully configured in order to reach
3104 * their destination. The SMI is the only method allowed to send
3105 * directed route packets on an InfiniBand fabric.
Michael Wang29541e32015-05-05 14:50:33 +02003106 *
Michael Wang296ec002015-05-18 10:41:45 +02003107 * Return: true if the port provides an SMI.
Michael Wang29541e32015-05-05 14:50:33 +02003108 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003109static inline bool rdma_cap_ib_smi(const struct ib_device *device, u8 port_num)
Michael Wang29541e32015-05-05 14:50:33 +02003110{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003111 return device->port_data[port_num].immutable.core_cap_flags &
3112 RDMA_CORE_CAP_IB_SMI;
Michael Wang29541e32015-05-05 14:50:33 +02003113}
3114
Michael Wang72219cea2015-05-05 14:50:34 +02003115/**
3116 * rdma_cap_ib_cm - Check if the port of device has the capability Infiniband
3117 * Communication Manager.
Michael Wang296ec002015-05-18 10:41:45 +02003118 * @device: Device to check
3119 * @port_num: Port number to check
Michael Wang72219cea2015-05-05 14:50:34 +02003120 *
Michael Wang296ec002015-05-18 10:41:45 +02003121 * The InfiniBand Communication Manager is one of many pre-defined General
3122 * Service Agents (GSA) that are accessed via the General Service
3123 * Interface (GSI). It's role is to facilitate establishment of connections
3124 * between nodes as well as other management related tasks for established
3125 * connections.
Michael Wang72219cea2015-05-05 14:50:34 +02003126 *
Michael Wang296ec002015-05-18 10:41:45 +02003127 * Return: true if the port supports an IB CM (this does not guarantee that
3128 * a CM is actually running however).
Michael Wang72219cea2015-05-05 14:50:34 +02003129 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003130static inline bool rdma_cap_ib_cm(const struct ib_device *device, u8 port_num)
Michael Wang72219cea2015-05-05 14:50:34 +02003131{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003132 return device->port_data[port_num].immutable.core_cap_flags &
3133 RDMA_CORE_CAP_IB_CM;
Michael Wang72219cea2015-05-05 14:50:34 +02003134}
3135
Michael Wang04215332015-05-05 14:50:35 +02003136/**
3137 * rdma_cap_iw_cm - Check if the port of device has the capability IWARP
3138 * Communication Manager.
Michael Wang296ec002015-05-18 10:41:45 +02003139 * @device: Device to check
3140 * @port_num: Port number to check
Michael Wang04215332015-05-05 14:50:35 +02003141 *
Michael Wang296ec002015-05-18 10:41:45 +02003142 * Similar to above, but specific to iWARP connections which have a different
3143 * managment protocol than InfiniBand.
Michael Wang04215332015-05-05 14:50:35 +02003144 *
Michael Wang296ec002015-05-18 10:41:45 +02003145 * Return: true if the port supports an iWARP CM (this does not guarantee that
3146 * a CM is actually running however).
Michael Wang04215332015-05-05 14:50:35 +02003147 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003148static inline bool rdma_cap_iw_cm(const struct ib_device *device, u8 port_num)
Michael Wang04215332015-05-05 14:50:35 +02003149{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003150 return device->port_data[port_num].immutable.core_cap_flags &
3151 RDMA_CORE_CAP_IW_CM;
Michael Wang04215332015-05-05 14:50:35 +02003152}
3153
Michael Wangfe53ba22015-05-05 14:50:36 +02003154/**
3155 * rdma_cap_ib_sa - Check if the port of device has the capability Infiniband
3156 * Subnet Administration.
Michael Wang296ec002015-05-18 10:41:45 +02003157 * @device: Device to check
3158 * @port_num: Port number to check
Michael Wangfe53ba22015-05-05 14:50:36 +02003159 *
Michael Wang296ec002015-05-18 10:41:45 +02003160 * An InfiniBand Subnet Administration (SA) service is a pre-defined General
3161 * Service Agent (GSA) provided by the Subnet Manager (SM). On InfiniBand
3162 * fabrics, devices should resolve routes to other hosts by contacting the
3163 * SA to query the proper route.
Michael Wangfe53ba22015-05-05 14:50:36 +02003164 *
Michael Wang296ec002015-05-18 10:41:45 +02003165 * Return: true if the port should act as a client to the fabric Subnet
3166 * Administration interface. This does not imply that the SA service is
3167 * running locally.
Michael Wangfe53ba22015-05-05 14:50:36 +02003168 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003169static inline bool rdma_cap_ib_sa(const struct ib_device *device, u8 port_num)
Michael Wangfe53ba22015-05-05 14:50:36 +02003170{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003171 return device->port_data[port_num].immutable.core_cap_flags &
3172 RDMA_CORE_CAP_IB_SA;
Michael Wangfe53ba22015-05-05 14:50:36 +02003173}
3174
Michael Wanga31ad3b2015-05-05 14:50:37 +02003175/**
3176 * rdma_cap_ib_mcast - Check if the port of device has the capability Infiniband
3177 * Multicast.
Michael Wang296ec002015-05-18 10:41:45 +02003178 * @device: Device to check
3179 * @port_num: Port number to check
Michael Wanga31ad3b2015-05-05 14:50:37 +02003180 *
Michael Wang296ec002015-05-18 10:41:45 +02003181 * InfiniBand multicast registration is more complex than normal IPv4 or
3182 * IPv6 multicast registration. Each Host Channel Adapter must register
3183 * with the Subnet Manager when it wishes to join a multicast group. It
3184 * should do so only once regardless of how many queue pairs it subscribes
3185 * to this group. And it should leave the group only after all queue pairs
3186 * attached to the group have been detached.
Michael Wanga31ad3b2015-05-05 14:50:37 +02003187 *
Michael Wang296ec002015-05-18 10:41:45 +02003188 * Return: true if the port must undertake the additional adminstrative
3189 * overhead of registering/unregistering with the SM and tracking of the
3190 * total number of queue pairs attached to the multicast group.
Michael Wanga31ad3b2015-05-05 14:50:37 +02003191 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003192static inline bool rdma_cap_ib_mcast(const struct ib_device *device, u8 port_num)
Michael Wanga31ad3b2015-05-05 14:50:37 +02003193{
3194 return rdma_cap_ib_sa(device, port_num);
3195}
3196
Michael Wangbc0f1d72015-05-05 14:50:38 +02003197/**
Michael Wang30a74ef2015-05-05 14:50:39 +02003198 * rdma_cap_af_ib - Check if the port of device has the capability
3199 * Native Infiniband Address.
Michael Wang296ec002015-05-18 10:41:45 +02003200 * @device: Device to check
3201 * @port_num: Port number to check
Michael Wang30a74ef2015-05-05 14:50:39 +02003202 *
Michael Wang296ec002015-05-18 10:41:45 +02003203 * InfiniBand addressing uses a port's GUID + Subnet Prefix to make a default
3204 * GID. RoCE uses a different mechanism, but still generates a GID via
3205 * a prescribed mechanism and port specific data.
Michael Wang30a74ef2015-05-05 14:50:39 +02003206 *
Michael Wang296ec002015-05-18 10:41:45 +02003207 * Return: true if the port uses a GID address to identify devices on the
3208 * network.
Michael Wang30a74ef2015-05-05 14:50:39 +02003209 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003210static inline bool rdma_cap_af_ib(const struct ib_device *device, u8 port_num)
Michael Wang30a74ef2015-05-05 14:50:39 +02003211{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003212 return device->port_data[port_num].immutable.core_cap_flags &
3213 RDMA_CORE_CAP_AF_IB;
Michael Wang30a74ef2015-05-05 14:50:39 +02003214}
3215
3216/**
Michael Wang227128f2015-05-05 14:50:40 +02003217 * rdma_cap_eth_ah - Check if the port of device has the capability
Michael Wang296ec002015-05-18 10:41:45 +02003218 * Ethernet Address Handle.
3219 * @device: Device to check
3220 * @port_num: Port number to check
Michael Wang227128f2015-05-05 14:50:40 +02003221 *
Michael Wang296ec002015-05-18 10:41:45 +02003222 * RoCE is InfiniBand over Ethernet, and it uses a well defined technique
3223 * to fabricate GIDs over Ethernet/IP specific addresses native to the
3224 * port. Normally, packet headers are generated by the sending host
3225 * adapter, but when sending connectionless datagrams, we must manually
3226 * inject the proper headers for the fabric we are communicating over.
Michael Wang227128f2015-05-05 14:50:40 +02003227 *
Michael Wang296ec002015-05-18 10:41:45 +02003228 * Return: true if we are running as a RoCE port and must force the
3229 * addition of a Global Route Header built from our Ethernet Address
3230 * Handle into our header list for connectionless packets.
Michael Wang227128f2015-05-05 14:50:40 +02003231 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003232static inline bool rdma_cap_eth_ah(const struct ib_device *device, u8 port_num)
Michael Wang227128f2015-05-05 14:50:40 +02003233{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003234 return device->port_data[port_num].immutable.core_cap_flags &
3235 RDMA_CORE_CAP_ETH_AH;
Michael Wang227128f2015-05-05 14:50:40 +02003236}
3237
3238/**
Dasaratharaman Chandramouli94d595c2017-03-20 19:38:09 -04003239 * rdma_cap_opa_ah - Check if the port of device supports
3240 * OPA Address handles
3241 * @device: Device to check
3242 * @port_num: Port number to check
3243 *
3244 * Return: true if we are running on an OPA device which supports
3245 * the extended OPA addressing.
3246 */
3247static inline bool rdma_cap_opa_ah(struct ib_device *device, u8 port_num)
3248{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003249 return (device->port_data[port_num].immutable.core_cap_flags &
Dasaratharaman Chandramouli94d595c2017-03-20 19:38:09 -04003250 RDMA_CORE_CAP_OPA_AH) == RDMA_CORE_CAP_OPA_AH;
3251}
3252
3253/**
Ira Weiny337877a2015-06-06 14:38:29 -04003254 * rdma_max_mad_size - Return the max MAD size required by this RDMA Port.
3255 *
3256 * @device: Device
3257 * @port_num: Port number
3258 *
3259 * This MAD size includes the MAD headers and MAD payload. No other headers
3260 * are included.
3261 *
3262 * Return the max MAD size required by the Port. Will return 0 if the port
3263 * does not support MADs
3264 */
3265static inline size_t rdma_max_mad_size(const struct ib_device *device, u8 port_num)
3266{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003267 return device->port_data[port_num].immutable.max_mad_size;
Ira Weiny337877a2015-06-06 14:38:29 -04003268}
3269
Matan Barak03db3a22015-07-30 18:33:26 +03003270/**
3271 * rdma_cap_roce_gid_table - Check if the port of device uses roce_gid_table
3272 * @device: Device to check
3273 * @port_num: Port number to check
3274 *
3275 * RoCE GID table mechanism manages the various GIDs for a device.
3276 *
3277 * NOTE: if allocating the port's GID table has failed, this call will still
3278 * return true, but any RoCE GID table API will fail.
3279 *
3280 * Return: true if the port uses RoCE GID table mechanism in order to manage
3281 * its GIDs.
3282 */
3283static inline bool rdma_cap_roce_gid_table(const struct ib_device *device,
3284 u8 port_num)
3285{
3286 return rdma_protocol_roce(device, port_num) &&
Kamal Heib3023a1e2018-12-10 21:09:48 +02003287 device->ops.add_gid && device->ops.del_gid;
Matan Barak03db3a22015-07-30 18:33:26 +03003288}
3289
Christoph Hellwig002516e2016-05-03 18:01:05 +02003290/*
3291 * Check if the device supports READ W/ INVALIDATE.
3292 */
3293static inline bool rdma_cap_read_inv(struct ib_device *dev, u32 port_num)
3294{
3295 /*
3296 * iWarp drivers must support READ W/ INVALIDATE. No other protocol
3297 * has support for it yet.
3298 */
3299 return rdma_protocol_iwarp(dev, port_num);
3300}
3301
/**
 * rdma_find_pg_bit - Find page bit given address and HW supported page sizes
 *
 * @addr: address
 * @pgsz_bitmap: bitmap of HW supported page sizes
 *
 * Return: the bit number of the largest supported page size that @addr is
 * aligned to.  If @addr is not aligned to any supported page size, the bit
 * number of the smallest supported page size is returned instead.
 */
static inline unsigned int rdma_find_pg_bit(unsigned long addr,
					    unsigned long pgsz_bitmap)
{
	/* Lowest set bit of addr, i.e. its natural alignment (0 if addr is 0) */
	unsigned long lowest_bit = addr & -addr;

	/*
	 * Drop every page size above that alignment; what is left are the
	 * supported sizes addr is aligned to.  For addr == 0 nothing is
	 * dropped, so every supported size qualifies.
	 */
	unsigned long aligned_sizes = pgsz_bitmap & ~(-lowest_bit << 1);

	return aligned_sizes ? __fls(aligned_sizes) : __ffs(pgsz_bitmap);
}
3325
Eli Cohen50174a72016-03-11 22:58:38 +02003326int ib_set_vf_link_state(struct ib_device *device, int vf, u8 port,
3327 int state);
3328int ib_get_vf_config(struct ib_device *device, int vf, u8 port,
3329 struct ifla_vf_info *info);
3330int ib_get_vf_stats(struct ib_device *device, int vf, u8 port,
3331 struct ifla_vf_stats *stats);
3332int ib_set_vf_guid(struct ib_device *device, int vf, u8 port, u64 guid,
3333 int type);
3334
Linus Torvalds1da177e2005-04-16 15:20:36 -07003335int ib_query_pkey(struct ib_device *device,
3336 u8 port_num, u16 index, u16 *pkey);
3337
3338int ib_modify_device(struct ib_device *device,
3339 int device_modify_mask,
3340 struct ib_device_modify *device_modify);
3341
3342int ib_modify_port(struct ib_device *device,
3343 u8 port_num, int port_modify_mask,
3344 struct ib_port_modify *port_modify);
3345
Yosef Etigin5eb620c2007-05-14 07:26:51 +03003346int ib_find_gid(struct ib_device *device, union ib_gid *gid,
Parav Panditb26c4a12018-03-13 16:06:12 +02003347 u8 *port_num, u16 *index);
Yosef Etigin5eb620c2007-05-14 07:26:51 +03003348
3349int ib_find_pkey(struct ib_device *device,
3350 u8 port_num, u16 pkey, u16 *index);
3351
enum ib_pd_flags {
	/*
	 * Register all memory in the system with a single memory
	 * registration and store its rkey in pd->unsafe_global_rkey.  ULPs
	 * can use this to avoid the overhead of dynamic MRs.
	 *
	 * This flag is generally considered unsafe and must only be used in
	 * extremely trusted environments.  Every use of it will log a warning
	 * in the kernel log.
	 */
	IB_PD_UNSAFE_GLOBAL_RKEY	= 0x01,
};
Linus Torvalds1da177e2005-04-16 15:20:36 -07003364
Christoph Hellwiged082d32016-09-05 12:56:17 +02003365struct ib_pd *__ib_alloc_pd(struct ib_device *device, unsigned int flags,
3366 const char *caller);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003367
Christoph Hellwiged082d32016-09-05 12:56:17 +02003368#define ib_alloc_pd(device, flags) \
Leon Romanovskye4496442018-01-28 11:17:18 +02003369 __ib_alloc_pd((device), (flags), KBUILD_MODNAME)
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003370
3371/**
3372 * ib_dealloc_pd_user - Deallocate kernel/user PD
3373 * @pd: The protection domain
3374 * @udata: Valid user data or NULL for kernel objects
3375 */
3376void ib_dealloc_pd_user(struct ib_pd *pd, struct ib_udata *udata);
3377
/**
 * ib_dealloc_pd - Deallocate kernel PD
 * @pd: The protection domain
 *
 * Thin wrapper that calls ib_dealloc_pd_user() with NULL udata.
 *
 * NOTE: for user PD use ib_dealloc_pd_user with valid udata!
 */
static inline void ib_dealloc_pd(struct ib_pd *pd)
{
	/* Kernel object: there is no user data to pass along. */
	struct ib_udata *no_udata = NULL;

	ib_dealloc_pd_user(pd, no_udata);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003388
Gal Pressmanb090c4e2018-12-12 11:09:05 +02003389enum rdma_create_ah_flags {
3390 /* In a sleepable context */
3391 RDMA_CREATE_AH_SLEEPABLE = BIT(0),
3392};
3393
Linus Torvalds1da177e2005-04-16 15:20:36 -07003394/**
Dasaratharaman Chandramouli0a18cfe2017-04-29 14:41:19 -04003395 * rdma_create_ah - Creates an address handle for the given address vector.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003396 * @pd: The protection domain associated with the address handle.
3397 * @ah_attr: The attributes of the address vector.
Gal Pressmanb090c4e2018-12-12 11:09:05 +02003398 * @flags: Create address handle flags (see enum rdma_create_ah_flags).
Linus Torvalds1da177e2005-04-16 15:20:36 -07003399 *
3400 * The address handle is used to reference a local or global destination
3401 * in all UD QP post sends.
3402 */
Gal Pressmanb090c4e2018-12-12 11:09:05 +02003403struct ib_ah *rdma_create_ah(struct ib_pd *pd, struct rdma_ah_attr *ah_attr,
3404 u32 flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003405
3406/**
Parav Pandit5cda6582017-10-16 08:45:12 +03003407 * rdma_create_user_ah - Creates an address handle for the given address vector.
3408 * It resolves destination mac address for ah attribute of RoCE type.
3409 * @pd: The protection domain associated with the address handle.
3410 * @ah_attr: The attributes of the address vector.
3411 * @udata: pointer to user's input output buffer information need by
3412 * provider driver.
3413 *
 * It returns the new address handle on success and an error pointer
 * (ERR_PTR) on failure.
3415 * The address handle is used to reference a local or global destination
3416 * in all UD QP post sends.
3417 */
3418struct ib_ah *rdma_create_user_ah(struct ib_pd *pd,
3419 struct rdma_ah_attr *ah_attr,
3420 struct ib_udata *udata);
3421/**
Moni Shoua850d8fd2016-11-10 11:30:56 +02003422 * ib_get_gids_from_rdma_hdr - Get sgid and dgid from GRH or IPv4 header
3423 * work completion.
3424 * @hdr: the L3 header to parse
3425 * @net_type: type of header to parse
3426 * @sgid: place to store source gid
3427 * @dgid: place to store destination gid
3428 */
3429int ib_get_gids_from_rdma_hdr(const union rdma_network_hdr *hdr,
3430 enum rdma_network_type net_type,
3431 union ib_gid *sgid, union ib_gid *dgid);
3432
3433/**
3434 * ib_get_rdma_header_version - Get the header version
3435 * @hdr: the L3 header to parse
3436 */
3437int ib_get_rdma_header_version(const union rdma_network_hdr *hdr);
3438
3439/**
Parav Panditf6bdb142017-11-14 14:52:17 +02003440 * ib_init_ah_attr_from_wc - Initializes address handle attributes from a
Sean Hefty4e00d692006-06-17 20:37:39 -07003441 * work completion.
3442 * @device: Device on which the received message arrived.
3443 * @port_num: Port on which the received message arrived.
3444 * @wc: Work completion associated with the received message.
3445 * @grh: References the received global route header. This parameter is
3446 * ignored unless the work completion indicates that the GRH is valid.
3447 * @ah_attr: Returned attributes that can be used when creating an address
3448 * handle for replying to the message.
Parav Panditb7403212018-06-19 10:59:14 +03003449 * When ib_init_ah_attr_from_wc() returns success,
3450 * (a) for IB link layer it optionally contains a reference to SGID attribute
3451 * when GRH is present for IB link layer.
3452 * (b) for RoCE link layer it contains a reference to SGID attribute.
3453 * User must invoke rdma_cleanup_ah_attr_gid_attr() to release reference to SGID
3454 * attributes which are initialized using ib_init_ah_attr_from_wc().
3455 *
Sean Hefty4e00d692006-06-17 20:37:39 -07003456 */
Parav Panditf6bdb142017-11-14 14:52:17 +02003457int ib_init_ah_attr_from_wc(struct ib_device *device, u8 port_num,
3458 const struct ib_wc *wc, const struct ib_grh *grh,
3459 struct rdma_ah_attr *ah_attr);
Sean Hefty4e00d692006-06-17 20:37:39 -07003460
3461/**
Hal Rosenstock513789e2005-07-27 11:45:34 -07003462 * ib_create_ah_from_wc - Creates an address handle associated with the
3463 * sender of the specified work completion.
3464 * @pd: The protection domain associated with the address handle.
3465 * @wc: Work completion information associated with a received message.
3466 * @grh: References the received global route header. This parameter is
3467 * ignored unless the work completion indicates that the GRH is valid.
3468 * @port_num: The outbound port number to associate with the address.
3469 *
3470 * The address handle is used to reference a local or global destination
3471 * in all UD QP post sends.
3472 */
Ira Weiny73cdaae2015-05-31 17:15:31 -04003473struct ib_ah *ib_create_ah_from_wc(struct ib_pd *pd, const struct ib_wc *wc,
3474 const struct ib_grh *grh, u8 port_num);
Hal Rosenstock513789e2005-07-27 11:45:34 -07003475
3476/**
Dasaratharaman Chandramouli67b985b2017-04-29 14:41:20 -04003477 * rdma_modify_ah - Modifies the address vector associated with an address
Linus Torvalds1da177e2005-04-16 15:20:36 -07003478 * handle.
3479 * @ah: The address handle to modify.
3480 * @ah_attr: The new address vector attributes to associate with the
3481 * address handle.
3482 */
Dasaratharaman Chandramouli67b985b2017-04-29 14:41:20 -04003483int rdma_modify_ah(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003484
3485/**
Dasaratharaman Chandramoulibfbfd662017-04-29 14:41:21 -04003486 * rdma_query_ah - Queries the address vector associated with an address
Linus Torvalds1da177e2005-04-16 15:20:36 -07003487 * handle.
3488 * @ah: The address handle to query.
3489 * @ah_attr: The address vector attributes associated with the address
3490 * handle.
3491 */
Dasaratharaman Chandramoulibfbfd662017-04-29 14:41:21 -04003492int rdma_query_ah(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003493
Gal Pressman2553ba22018-12-12 11:09:06 +02003494enum rdma_destroy_ah_flags {
3495 /* In a sleepable context */
3496 RDMA_DESTROY_AH_SLEEPABLE = BIT(0),
3497};
3498
Linus Torvalds1da177e2005-04-16 15:20:36 -07003499/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003500 * rdma_destroy_ah_user - Destroys an address handle.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003501 * @ah: The address handle to destroy.
Gal Pressman2553ba22018-12-12 11:09:06 +02003502 * @flags: Destroy address handle flags (see enum rdma_destroy_ah_flags).
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003503 * @udata: Valid user data or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003504 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003505int rdma_destroy_ah_user(struct ib_ah *ah, u32 flags, struct ib_udata *udata);
3506
3507/**
3508 * rdma_destroy_ah - Destroys an kernel address handle.
3509 * @ah: The address handle to destroy.
3510 * @flags: Destroy address handle flags (see enum rdma_destroy_ah_flags).
3511 *
3512 * NOTE: for user ah use rdma_destroy_ah_user with valid udata!
3513 */
3514static inline int rdma_destroy_ah(struct ib_ah *ah, u32 flags)
3515{
3516 return rdma_destroy_ah_user(ah, flags, NULL);
3517}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003518
3519/**
Roland Dreierd41fcc62005-08-18 12:23:08 -07003520 * ib_create_srq - Creates a SRQ associated with the specified protection
3521 * domain.
3522 * @pd: The protection domain associated with the SRQ.
Dotan Barakabb6e9b2006-02-23 12:13:51 -08003523 * @srq_init_attr: A list of initial attributes required to create the
3524 * SRQ. If SRQ creation succeeds, then the attributes are updated to
3525 * the actual capabilities of the created SRQ.
Roland Dreierd41fcc62005-08-18 12:23:08 -07003526 *
 * srq_attr->max_wr and srq_attr->max_sge are read to determine the
3528 * requested size of the SRQ, and set to the actual values allocated
3529 * on return. If ib_create_srq() succeeds, then max_wr and max_sge
3530 * will always be at least as large as the requested values.
3531 */
3532struct ib_srq *ib_create_srq(struct ib_pd *pd,
3533 struct ib_srq_init_attr *srq_init_attr);
3534
3535/**
3536 * ib_modify_srq - Modifies the attributes for the specified SRQ.
3537 * @srq: The SRQ to modify.
3538 * @srq_attr: On input, specifies the SRQ attributes to modify. On output,
3539 * the current values of selected SRQ attributes are returned.
3540 * @srq_attr_mask: A bit-mask used to specify which attributes of the SRQ
3541 * are being modified.
3542 *
3543 * The mask may contain IB_SRQ_MAX_WR to resize the SRQ and/or
3544 * IB_SRQ_LIMIT to set the SRQ's limit and request notification when
3545 * the number of receives queued drops below the limit.
3546 */
3547int ib_modify_srq(struct ib_srq *srq,
3548 struct ib_srq_attr *srq_attr,
3549 enum ib_srq_attr_mask srq_attr_mask);
3550
3551/**
3552 * ib_query_srq - Returns the attribute list and current values for the
3553 * specified SRQ.
3554 * @srq: The SRQ to query.
3555 * @srq_attr: The attributes of the specified SRQ.
3556 */
3557int ib_query_srq(struct ib_srq *srq,
3558 struct ib_srq_attr *srq_attr);
3559
3560/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003561 * ib_destroy_srq_user - Destroys the specified SRQ.
Roland Dreierd41fcc62005-08-18 12:23:08 -07003562 * @srq: The SRQ to destroy.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003563 * @udata: Valid user data or NULL for kernel objects
Roland Dreierd41fcc62005-08-18 12:23:08 -07003564 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003565int ib_destroy_srq_user(struct ib_srq *srq, struct ib_udata *udata);
3566
/**
 * ib_destroy_srq - Destroys the specified kernel SRQ.
 * @srq: The SRQ to destroy.
 *
 * Thin wrapper that calls ib_destroy_srq_user() with NULL udata and hands
 * back its return value unchanged.
 *
 * NOTE: for user srq use ib_destroy_srq_user with valid udata!
 */
static inline int ib_destroy_srq(struct ib_srq *srq)
{
	/* Kernel object: there is no user data to pass along. */
	struct ib_udata *no_udata = NULL;

	return ib_destroy_srq_user(srq, no_udata);
}
Roland Dreierd41fcc62005-08-18 12:23:08 -07003577
3578/**
3579 * ib_post_srq_recv - Posts a list of work requests to the specified SRQ.
3580 * @srq: The SRQ to post the work request on.
3581 * @recv_wr: A list of work requests to post on the receive queue.
3582 * @bad_recv_wr: On an immediate failure, this parameter will reference
3583 * the work request that failed to be posted on the QP.
3584 */
3585static inline int ib_post_srq_recv(struct ib_srq *srq,
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003586 const struct ib_recv_wr *recv_wr,
3587 const struct ib_recv_wr **bad_recv_wr)
Roland Dreierd41fcc62005-08-18 12:23:08 -07003588{
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003589 const struct ib_recv_wr *dummy;
Bart Van Asschebb039a82018-07-18 09:25:16 -07003590
Kamal Heib3023a1e2018-12-10 21:09:48 +02003591 return srq->device->ops.post_srq_recv(srq, recv_wr,
3592 bad_recv_wr ? : &dummy);
Roland Dreierd41fcc62005-08-18 12:23:08 -07003593}
3594
3595/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003596 * ib_create_qp_user - Creates a QP associated with the specified protection
Linus Torvalds1da177e2005-04-16 15:20:36 -07003597 * domain.
3598 * @pd: The protection domain associated with the QP.
Dotan Barakabb6e9b2006-02-23 12:13:51 -08003599 * @qp_init_attr: A list of initial attributes required to create the
3600 * QP. If QP creation succeeds, then the attributes are updated to
3601 * the actual capabilities of the created QP.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003602 * @udata: Valid user data or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003603 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003604struct ib_qp *ib_create_qp_user(struct ib_pd *pd,
3605 struct ib_qp_init_attr *qp_init_attr,
3606 struct ib_udata *udata);
3607
/**
 * ib_create_qp - Creates a kernel QP associated with the specified protection
 *   domain.
 * @pd: The protection domain associated with the QP.
 * @qp_init_attr: A list of initial attributes required to create the
 *   QP.  If QP creation succeeds, then the attributes are updated to
 *   the actual capabilities of the created QP.
 *
 * Thin wrapper that calls ib_create_qp_user() with NULL udata and hands back
 * its result unchanged.
 *
 * NOTE: for user qp use ib_create_qp_user with valid udata!
 */
static inline struct ib_qp *ib_create_qp(struct ib_pd *pd,
					 struct ib_qp_init_attr *qp_init_attr)
{
	/* Kernel object: there is no user data to pass along. */
	struct ib_udata *no_udata = NULL;

	return ib_create_qp_user(pd, qp_init_attr, no_udata);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003624
3625/**
Parav Pandita512c2f2017-05-23 11:26:08 +03003626 * ib_modify_qp_with_udata - Modifies the attributes for the specified QP.
3627 * @qp: The QP to modify.
3628 * @attr: On input, specifies the QP attributes to modify. On output,
3629 * the current values of selected QP attributes are returned.
3630 * @attr_mask: A bit-mask used to specify which attributes of the QP
3631 * are being modified.
 * @udata: pointer to user's input output buffer information
 *
 * It returns 0 on success and returns appropriate error code on error.
3635 */
3636int ib_modify_qp_with_udata(struct ib_qp *qp,
3637 struct ib_qp_attr *attr,
3638 int attr_mask,
3639 struct ib_udata *udata);
3640
3641/**
Linus Torvalds1da177e2005-04-16 15:20:36 -07003642 * ib_modify_qp - Modifies the attributes for the specified QP and then
3643 * transitions the QP to the given state.
3644 * @qp: The QP to modify.
3645 * @qp_attr: On input, specifies the QP attributes to modify. On output,
3646 * the current values of selected QP attributes are returned.
3647 * @qp_attr_mask: A bit-mask used to specify which attributes of the QP
3648 * are being modified.
3649 */
3650int ib_modify_qp(struct ib_qp *qp,
3651 struct ib_qp_attr *qp_attr,
3652 int qp_attr_mask);
3653
3654/**
3655 * ib_query_qp - Returns the attribute list and current values for the
3656 * specified QP.
3657 * @qp: The QP to query.
3658 * @qp_attr: The attributes of the specified QP.
3659 * @qp_attr_mask: A bit-mask used to select specific attributes to query.
3660 * @qp_init_attr: Additional attributes of the selected QP.
3661 *
3662 * The qp_attr_mask may be used to limit the query to gathering only the
3663 * selected attributes.
3664 */
3665int ib_query_qp(struct ib_qp *qp,
3666 struct ib_qp_attr *qp_attr,
3667 int qp_attr_mask,
3668 struct ib_qp_init_attr *qp_init_attr);
3669
3670/**
 * ib_destroy_qp_user - Destroys the specified QP.
3672 * @qp: The QP to destroy.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003673 * @udata: Valid udata or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003674 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003675int ib_destroy_qp_user(struct ib_qp *qp, struct ib_udata *udata);
3676
3677/**
3678 * ib_destroy_qp - Destroys the specified kernel QP.
3679 * @qp: The QP to destroy.
3680 *
3681 * NOTE: for user qp use ib_destroy_qp_user with valid udata!
3682 */
3683static inline int ib_destroy_qp(struct ib_qp *qp)
3684{
3685 return ib_destroy_qp_user(qp, NULL);
3686}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003687
3688/**
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07003689 * ib_open_qp - Obtain a reference to an existing sharable QP.
 * @xrcd: XRC domain
3691 * @qp_open_attr: Attributes identifying the QP to open.
3692 *
3693 * Returns a reference to a sharable QP.
3694 */
3695struct ib_qp *ib_open_qp(struct ib_xrcd *xrcd,
3696 struct ib_qp_open_attr *qp_open_attr);
3697
3698/**
3699 * ib_close_qp - Release an external reference to a QP.
Sean Heftyd3d72d92011-05-26 23:06:44 -07003700 * @qp: The QP handle to release
3701 *
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07003702 * The opened QP handle is released by the caller. The underlying
3703 * shared QP is not destroyed until all internal references are released.
Sean Heftyd3d72d92011-05-26 23:06:44 -07003704 */
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07003705int ib_close_qp(struct ib_qp *qp);
Sean Heftyd3d72d92011-05-26 23:06:44 -07003706
3707/**
Linus Torvalds1da177e2005-04-16 15:20:36 -07003708 * ib_post_send - Posts a list of work requests to the send queue of
3709 * the specified QP.
3710 * @qp: The QP to post the work request on.
3711 * @send_wr: A list of work requests to post on the send queue.
3712 * @bad_send_wr: On an immediate failure, this parameter will reference
3713 * the work request that failed to be posted on the QP.
Bart Van Assche55464d42009-12-09 14:20:04 -08003714 *
3715 * While IBA Vol. 1 section 11.4.1.1 specifies that if an immediate
3716 * error is returned, the QP state shall not be affected,
3717 * ib_post_send() will return an immediate error after queueing any
3718 * earlier work requests in the list.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003719 */
3720static inline int ib_post_send(struct ib_qp *qp,
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003721 const struct ib_send_wr *send_wr,
3722 const struct ib_send_wr **bad_send_wr)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003723{
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003724 const struct ib_send_wr *dummy;
Bart Van Asschebb039a82018-07-18 09:25:16 -07003725
Kamal Heib3023a1e2018-12-10 21:09:48 +02003726 return qp->device->ops.post_send(qp, send_wr, bad_send_wr ? : &dummy);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003727}
3728
3729/**
3730 * ib_post_recv - Posts a list of work requests to the receive queue of
3731 * the specified QP.
3732 * @qp: The QP to post the work request on.
3733 * @recv_wr: A list of work requests to post on the receive queue.
3734 * @bad_recv_wr: On an immediate failure, this parameter will reference
3735 * the work request that failed to be posted on the QP.
3736 */
3737static inline int ib_post_recv(struct ib_qp *qp,
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003738 const struct ib_recv_wr *recv_wr,
3739 const struct ib_recv_wr **bad_recv_wr)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003740{
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003741 const struct ib_recv_wr *dummy;
Bart Van Asschebb039a82018-07-18 09:25:16 -07003742
Kamal Heib3023a1e2018-12-10 21:09:48 +02003743 return qp->device->ops.post_recv(qp, recv_wr, bad_recv_wr ? : &dummy);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003744}
3745
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003746struct ib_cq *__ib_alloc_cq_user(struct ib_device *dev, void *private,
3747 int nr_cqe, int comp_vector,
3748 enum ib_poll_context poll_ctx,
3749 const char *caller, struct ib_udata *udata);
Leon Romanovskyf66c8ba2018-01-28 11:17:19 +02003750
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003751/**
3752 * ib_alloc_cq_user: Allocate kernel/user CQ
3753 * @dev: The IB device
3754 * @private: Private data attached to the CQE
3755 * @nr_cqe: Number of CQEs in the CQ
3756 * @comp_vector: Completion vector used for the IRQs
3757 * @poll_ctx: Context used for polling the CQ
3758 * @udata: Valid user data or NULL for kernel objects
3759 */
3760static inline struct ib_cq *ib_alloc_cq_user(struct ib_device *dev,
3761 void *private, int nr_cqe,
3762 int comp_vector,
3763 enum ib_poll_context poll_ctx,
3764 struct ib_udata *udata)
3765{
3766 return __ib_alloc_cq_user(dev, private, nr_cqe, comp_vector, poll_ctx,
3767 KBUILD_MODNAME, udata);
3768}
3769
3770/**
3771 * ib_alloc_cq: Allocate kernel CQ
3772 * @dev: The IB device
3773 * @private: Private data attached to the CQE
3774 * @nr_cqe: Number of CQEs in the CQ
3775 * @comp_vector: Completion vector used for the IRQs
3776 * @poll_ctx: Context used for polling the CQ
3777 *
3778 * NOTE: for user cq use ib_alloc_cq_user with valid udata!
3779 */
3780static inline struct ib_cq *ib_alloc_cq(struct ib_device *dev, void *private,
3781 int nr_cqe, int comp_vector,
3782 enum ib_poll_context poll_ctx)
3783{
3784 return ib_alloc_cq_user(dev, private, nr_cqe, comp_vector, poll_ctx,
3785 NULL);
3786}
3787
3788/**
3789 * ib_free_cq_user - Free kernel/user CQ
3790 * @cq: The CQ to free
3791 * @udata: Valid user data or NULL for kernel objects
3792 */
3793void ib_free_cq_user(struct ib_cq *cq, struct ib_udata *udata);
3794
3795/**
3796 * ib_free_cq - Free kernel CQ
3797 * @cq: The CQ to free
3798 *
3799 * NOTE: for user cq use ib_free_cq_user with valid udata!
3800 */
3801static inline void ib_free_cq(struct ib_cq *cq)
3802{
3803 ib_free_cq_user(cq, NULL);
3804}
3805
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08003806int ib_process_cq_direct(struct ib_cq *cq, int budget);
3807
Linus Torvalds1da177e2005-04-16 15:20:36 -07003808/**
3809 * ib_create_cq - Creates a CQ on the specified device.
3810 * @device: The device on which to create the CQ.
3811 * @comp_handler: A user-specified callback that is invoked when a
3812 * completion event occurs on the CQ.
3813 * @event_handler: A user-specified callback that is invoked when an
3814 * asynchronous event not associated with a completion occurs on the CQ.
3815 * @cq_context: Context associated with the CQ returned to the user via
3816 * the associated completion and event handlers.
Matan Barak8e372102015-06-11 16:35:21 +03003817 * @cq_attr: The attributes the CQ should be created upon.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003818 *
3819 * Users can examine the cq structure to determine the actual CQ size.
3820 */
Bharat Potnuri7350cdd2018-06-15 20:52:33 +05303821struct ib_cq *__ib_create_cq(struct ib_device *device,
3822 ib_comp_handler comp_handler,
3823 void (*event_handler)(struct ib_event *, void *),
3824 void *cq_context,
3825 const struct ib_cq_init_attr *cq_attr,
3826 const char *caller);
3827#define ib_create_cq(device, cmp_hndlr, evt_hndlr, cq_ctxt, cq_attr) \
3828 __ib_create_cq((device), (cmp_hndlr), (evt_hndlr), (cq_ctxt), (cq_attr), KBUILD_MODNAME)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003829
3830/**
3831 * ib_resize_cq - Modifies the capacity of the CQ.
3832 * @cq: The CQ to resize.
3833 * @cqe: The minimum size of the CQ.
3834 *
3835 * Users can examine the cq structure to determine the actual CQ size.
3836 */
3837int ib_resize_cq(struct ib_cq *cq, int cqe);
3838
3839/**
Leon Romanovsky4190b4e2017-11-13 10:51:19 +02003840 * rdma_set_cq_moderation - Modifies moderation params of the CQ
Eli Cohen2dd57162008-04-16 21:09:33 -07003841 * @cq: The CQ to modify.
3842 * @cq_count: number of CQEs that will trigger an event
3843 * @cq_period: max period of time in usec before triggering an event
3844 *
3845 */
Leon Romanovsky4190b4e2017-11-13 10:51:19 +02003846int rdma_set_cq_moderation(struct ib_cq *cq, u16 cq_count, u16 cq_period);
Eli Cohen2dd57162008-04-16 21:09:33 -07003847
3848/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003849 * ib_destroy_cq_user - Destroys the specified CQ.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003850 * @cq: The CQ to destroy.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003851 * @udata: Valid user data or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003852 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003853int ib_destroy_cq_user(struct ib_cq *cq, struct ib_udata *udata);
3854
3855/**
3856 * ib_destroy_cq - Destroys the specified kernel CQ.
3857 * @cq: The CQ to destroy.
3858 *
3859 * NOTE: for user cq use ib_destroy_cq_user with valid udata!
3860 */
Leon Romanovsky890ac8d2019-05-20 09:54:21 +03003861static inline void ib_destroy_cq(struct ib_cq *cq)
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003862{
Leon Romanovsky890ac8d2019-05-20 09:54:21 +03003863 ib_destroy_cq_user(cq, NULL);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003864}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003865
3866/**
3867 * ib_poll_cq - poll a CQ for completion(s)
3868 * @cq:the CQ being polled
3869 * @num_entries:maximum number of completions to return
3870 * @wc:array of at least @num_entries &struct ib_wc where completions
3871 * will be returned
3872 *
3873 * Poll a CQ for (possibly multiple) completions. If the return value
3874 * is < 0, an error occurred. If the return value is >= 0, it is the
3875 * number of completions returned. If the return value is
3876 * non-negative and < num_entries, then the CQ was emptied.
3877 */
3878static inline int ib_poll_cq(struct ib_cq *cq, int num_entries,
3879 struct ib_wc *wc)
3880{
Kamal Heib3023a1e2018-12-10 21:09:48 +02003881 return cq->device->ops.poll_cq(cq, num_entries, wc);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003882}
3883
3884/**
Linus Torvalds1da177e2005-04-16 15:20:36 -07003885 * ib_req_notify_cq - Request completion notification on a CQ.
3886 * @cq: The CQ to generate an event for.
Roland Dreiered23a722007-05-06 21:02:48 -07003887 * @flags:
3888 * Must contain exactly one of %IB_CQ_SOLICITED or %IB_CQ_NEXT_COMP
3889 * to request an event on the next solicited event or next work
3890 * completion at any type, respectively. %IB_CQ_REPORT_MISSED_EVENTS
3891 * may also be |ed in to request a hint about missed events, as
3892 * described below.
3893 *
3894 * Return Value:
3895 * < 0 means an error occurred while requesting notification
3896 * == 0 means notification was requested successfully, and if
3897 * IB_CQ_REPORT_MISSED_EVENTS was passed in, then no events
3898 * were missed and it is safe to wait for another event. In
3899 * this case is it guaranteed that any work completions added
3900 * to the CQ since the last CQ poll will trigger a completion
3901 * notification event.
3902 * > 0 is only returned if IB_CQ_REPORT_MISSED_EVENTS was passed
3903 * in. It means that the consumer must poll the CQ again to
3904 * make sure it is empty to avoid missing an event because of a
3905 * race between requesting notification and an entry being
3906 * added to the CQ. This return value means it is possible
3907 * (but not guaranteed) that a work completion has been added
3908 * to the CQ since the last poll without triggering a
3909 * completion notification event.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003910 */
3911static inline int ib_req_notify_cq(struct ib_cq *cq,
Roland Dreiered23a722007-05-06 21:02:48 -07003912 enum ib_cq_notify_flags flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003913{
Kamal Heib3023a1e2018-12-10 21:09:48 +02003914 return cq->device->ops.req_notify_cq(cq, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003915}
3916
3917/**
3918 * ib_req_ncomp_notif - Request completion notification when there are
3919 * at least the specified number of unreaped completions on the CQ.
3920 * @cq: The CQ to generate an event for.
3921 * @wc_cnt: The number of unreaped completions that should be on the
3922 * CQ before an event is generated.
3923 */
3924static inline int ib_req_ncomp_notif(struct ib_cq *cq, int wc_cnt)
3925{
Kamal Heib3023a1e2018-12-10 21:09:48 +02003926 return cq->device->ops.req_ncomp_notif ?
3927 cq->device->ops.req_ncomp_notif(cq, wc_cnt) :
Linus Torvalds1da177e2005-04-16 15:20:36 -07003928 -ENOSYS;
3929}
3930
3931/**
Ralph Campbell9b513092006-12-12 14:27:41 -08003932 * ib_dma_mapping_error - check a DMA addr for error
3933 * @dev: The device for which the dma_addr was created
3934 * @dma_addr: The DMA address to check
3935 */
3936static inline int ib_dma_mapping_error(struct ib_device *dev, u64 dma_addr)
3937{
Bart Van Assche0957c292017-03-07 22:56:53 +00003938 return dma_mapping_error(dev->dma_device, dma_addr);
Ralph Campbell9b513092006-12-12 14:27:41 -08003939}
3940
3941/**
3942 * ib_dma_map_single - Map a kernel virtual address to DMA address
3943 * @dev: The device for which the dma_addr is to be created
3944 * @cpu_addr: The kernel virtual address
3945 * @size: The size of the region in bytes
3946 * @direction: The direction of the DMA
3947 */
3948static inline u64 ib_dma_map_single(struct ib_device *dev,
3949 void *cpu_addr, size_t size,
3950 enum dma_data_direction direction)
3951{
Bart Van Assche0957c292017-03-07 22:56:53 +00003952 return dma_map_single(dev->dma_device, cpu_addr, size, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08003953}
3954
3955/**
3956 * ib_dma_unmap_single - Destroy a mapping created by ib_dma_map_single()
3957 * @dev: The device for which the DMA address was created
3958 * @addr: The DMA address
3959 * @size: The size of the region in bytes
3960 * @direction: The direction of the DMA
3961 */
3962static inline void ib_dma_unmap_single(struct ib_device *dev,
3963 u64 addr, size_t size,
3964 enum dma_data_direction direction)
3965{
Bart Van Assche0957c292017-03-07 22:56:53 +00003966 dma_unmap_single(dev->dma_device, addr, size, direction);
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07003967}
3968
Ralph Campbell9b513092006-12-12 14:27:41 -08003969/**
3970 * ib_dma_map_page - Map a physical page to DMA address
3971 * @dev: The device for which the dma_addr is to be created
3972 * @page: The page to be mapped
3973 * @offset: The offset within the page
3974 * @size: The size of the region in bytes
3975 * @direction: The direction of the DMA
3976 */
3977static inline u64 ib_dma_map_page(struct ib_device *dev,
3978 struct page *page,
3979 unsigned long offset,
3980 size_t size,
3981 enum dma_data_direction direction)
3982{
Bart Van Assche0957c292017-03-07 22:56:53 +00003983 return dma_map_page(dev->dma_device, page, offset, size, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08003984}
3985
3986/**
3987 * ib_dma_unmap_page - Destroy a mapping created by ib_dma_map_page()
3988 * @dev: The device for which the DMA address was created
3989 * @addr: The DMA address
3990 * @size: The size of the region in bytes
3991 * @direction: The direction of the DMA
3992 */
3993static inline void ib_dma_unmap_page(struct ib_device *dev,
3994 u64 addr, size_t size,
3995 enum dma_data_direction direction)
3996{
Bart Van Assche0957c292017-03-07 22:56:53 +00003997 dma_unmap_page(dev->dma_device, addr, size, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08003998}
3999
4000/**
4001 * ib_dma_map_sg - Map a scatter/gather list to DMA addresses
4002 * @dev: The device for which the DMA addresses are to be created
4003 * @sg: The array of scatter/gather entries
4004 * @nents: The number of scatter/gather entries
4005 * @direction: The direction of the DMA
4006 */
4007static inline int ib_dma_map_sg(struct ib_device *dev,
4008 struct scatterlist *sg, int nents,
4009 enum dma_data_direction direction)
4010{
Bart Van Assche0957c292017-03-07 22:56:53 +00004011 return dma_map_sg(dev->dma_device, sg, nents, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08004012}
4013
4014/**
4015 * ib_dma_unmap_sg - Unmap a scatter/gather list of DMA addresses
4016 * @dev: The device for which the DMA addresses were created
4017 * @sg: The array of scatter/gather entries
4018 * @nents: The number of scatter/gather entries
4019 * @direction: The direction of the DMA
4020 */
4021static inline void ib_dma_unmap_sg(struct ib_device *dev,
4022 struct scatterlist *sg, int nents,
4023 enum dma_data_direction direction)
4024{
Bart Van Assche0957c292017-03-07 22:56:53 +00004025 dma_unmap_sg(dev->dma_device, sg, nents, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08004026}
4027
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004028static inline int ib_dma_map_sg_attrs(struct ib_device *dev,
4029 struct scatterlist *sg, int nents,
4030 enum dma_data_direction direction,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07004031 unsigned long dma_attrs)
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004032{
Bart Van Assche0957c292017-03-07 22:56:53 +00004033 return dma_map_sg_attrs(dev->dma_device, sg, nents, direction,
4034 dma_attrs);
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004035}
4036
4037static inline void ib_dma_unmap_sg_attrs(struct ib_device *dev,
4038 struct scatterlist *sg, int nents,
4039 enum dma_data_direction direction,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07004040 unsigned long dma_attrs)
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004041{
Bart Van Assche0957c292017-03-07 22:56:53 +00004042 dma_unmap_sg_attrs(dev->dma_device, sg, nents, direction, dma_attrs);
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004043}
Ralph Campbell9b513092006-12-12 14:27:41 -08004044
4045/**
Bart Van Assche0b5cb332019-01-22 10:25:20 -08004046 * ib_dma_max_seg_size - Return the size limit of a single DMA transfer
4047 * @dev: The device to query
4048 *
4049 * The returned value represents a size in bytes.
4050 */
4051static inline unsigned int ib_dma_max_seg_size(struct ib_device *dev)
4052{
4053 struct device_dma_parameters *p = dev->dma_device->dma_parms;
4054
4055 return p ? p->max_segment_size : UINT_MAX;
4056}
4057
4058/**
Ralph Campbell9b513092006-12-12 14:27:41 -08004059 * ib_dma_sync_single_for_cpu - Prepare DMA region to be accessed by CPU
4060 * @dev: The device for which the DMA address was created
4061 * @addr: The DMA address
4062 * @size: The size of the region in bytes
4063 * @dir: The direction of the DMA
4064 */
4065static inline void ib_dma_sync_single_for_cpu(struct ib_device *dev,
4066 u64 addr,
4067 size_t size,
4068 enum dma_data_direction dir)
4069{
Bart Van Assche0957c292017-03-07 22:56:53 +00004070 dma_sync_single_for_cpu(dev->dma_device, addr, size, dir);
Ralph Campbell9b513092006-12-12 14:27:41 -08004071}
4072
4073/**
4074 * ib_dma_sync_single_for_device - Prepare DMA region to be accessed by device
4075 * @dev: The device for which the DMA address was created
4076 * @addr: The DMA address
4077 * @size: The size of the region in bytes
4078 * @dir: The direction of the DMA
4079 */
4080static inline void ib_dma_sync_single_for_device(struct ib_device *dev,
4081 u64 addr,
4082 size_t size,
4083 enum dma_data_direction dir)
4084{
Bart Van Assche0957c292017-03-07 22:56:53 +00004085 dma_sync_single_for_device(dev->dma_device, addr, size, dir);
Ralph Campbell9b513092006-12-12 14:27:41 -08004086}
4087
4088/**
4089 * ib_dma_alloc_coherent - Allocate memory and map it for DMA
4090 * @dev: The device for which the DMA address is requested
4091 * @size: The size of the region to allocate in bytes
4092 * @dma_handle: A pointer for returning the DMA address of the region
4093 * @flag: memory allocator flags
4094 */
4095static inline void *ib_dma_alloc_coherent(struct ib_device *dev,
4096 size_t size,
Bart Van Assched43dbac2017-01-20 13:04:10 -08004097 dma_addr_t *dma_handle,
Ralph Campbell9b513092006-12-12 14:27:41 -08004098 gfp_t flag)
4099{
Bart Van Assche0957c292017-03-07 22:56:53 +00004100 return dma_alloc_coherent(dev->dma_device, size, dma_handle, flag);
Ralph Campbell9b513092006-12-12 14:27:41 -08004101}
4102
4103/**
4104 * ib_dma_free_coherent - Free memory allocated by ib_dma_alloc_coherent()
4105 * @dev: The device for which the DMA addresses were allocated
4106 * @size: The size of the region
4107 * @cpu_addr: the address returned by ib_dma_alloc_coherent()
4108 * @dma_handle: the DMA address returned by ib_dma_alloc_coherent()
4109 */
4110static inline void ib_dma_free_coherent(struct ib_device *dev,
4111 size_t size, void *cpu_addr,
Bart Van Assched43dbac2017-01-20 13:04:10 -08004112 dma_addr_t dma_handle)
Ralph Campbell9b513092006-12-12 14:27:41 -08004113{
Bart Van Assche0957c292017-03-07 22:56:53 +00004114 dma_free_coherent(dev->dma_device, size, cpu_addr, dma_handle);
Ralph Campbell9b513092006-12-12 14:27:41 -08004115}
4116
4117/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004118 * ib_dereg_mr_user - Deregisters a memory region and removes it from the
4119 * HCA translation table.
4120 * @mr: The memory region to deregister.
4121 * @udata: Valid user data or NULL for kernel object
4122 *
4123 * This function can fail, if the memory region has memory windows bound to it.
4124 */
4125int ib_dereg_mr_user(struct ib_mr *mr, struct ib_udata *udata);
4126
4127/**
4128 * ib_dereg_mr - Deregisters a kernel memory region and removes it from the
Linus Torvalds1da177e2005-04-16 15:20:36 -07004129 * HCA translation table.
4130 * @mr: The memory region to deregister.
Shani Michaeli7083e422013-02-06 16:19:12 +00004131 *
4132 * This function can fail, if the memory region has memory windows bound to it.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004133 *
4134 * NOTE: for user mr use ib_dereg_mr_user with valid udata!
Linus Torvalds1da177e2005-04-16 15:20:36 -07004135 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004136static inline int ib_dereg_mr(struct ib_mr *mr)
4137{
4138 return ib_dereg_mr_user(mr, NULL);
4139}
Linus Torvalds1da177e2005-04-16 15:20:36 -07004140
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004141struct ib_mr *ib_alloc_mr_user(struct ib_pd *pd, enum ib_mr_type mr_type,
4142 u32 max_num_sg, struct ib_udata *udata);
4143
4144static inline struct ib_mr *ib_alloc_mr(struct ib_pd *pd,
4145 enum ib_mr_type mr_type, u32 max_num_sg)
4146{
4147 return ib_alloc_mr_user(pd, mr_type, max_num_sg, NULL);
4148}
Steve Wise00f7ec32008-07-14 23:48:45 -07004149
4150/**
Steve Wise00f7ec32008-07-14 23:48:45 -07004151 * ib_update_fast_reg_key - updates the key portion of the fast_reg MR
4152 * R_Key and L_Key.
4153 * @mr - struct ib_mr pointer to be updated.
4154 * @newkey - new key to be used.
4155 */
4156static inline void ib_update_fast_reg_key(struct ib_mr *mr, u8 newkey)
4157{
4158 mr->lkey = (mr->lkey & 0xffffff00) | newkey;
4159 mr->rkey = (mr->rkey & 0xffffff00) | newkey;
4160}
4161
/**
 * ib_inc_rkey - increments the key portion of the given rkey. Can be used
 *   for calculating a new rkey for type 2 memory windows.
 * @rkey: the rkey to increment.
 *
 * Only the low 8 bits are incremented, wrapping from 0xff back to 0x00;
 * the upper 24 bits are returned unchanged.
 */
static inline u32 ib_inc_rkey(u32 rkey)
{
	const u32 key_mask = 0x000000ff;
	u32 upper = rkey & ~key_mask;
	u32 key = (rkey + 1) & key_mask;

	return upper | key;
}
4172
4173/**
 * ib_alloc_fmr - Allocates an unmapped fast memory region.
4175 * @pd: The protection domain associated with the unmapped region.
4176 * @mr_access_flags: Specifies the memory access rights.
4177 * @fmr_attr: Attributes of the unmapped region.
4178 *
4179 * A fast memory region must be mapped before it can be used as part of
4180 * a work request.
4181 */
4182struct ib_fmr *ib_alloc_fmr(struct ib_pd *pd,
4183 int mr_access_flags,
4184 struct ib_fmr_attr *fmr_attr);
4185
4186/**
4187 * ib_map_phys_fmr - Maps a list of physical pages to a fast memory region.
4188 * @fmr: The fast memory region to associate with the pages.
4189 * @page_list: An array of physical pages to map to the fast memory region.
4190 * @list_len: The number of pages in page_list.
4191 * @iova: The I/O virtual address to use with the mapped region.
4192 */
4193static inline int ib_map_phys_fmr(struct ib_fmr *fmr,
4194 u64 *page_list, int list_len,
4195 u64 iova)
4196{
Kamal Heib3023a1e2018-12-10 21:09:48 +02004197 return fmr->device->ops.map_phys_fmr(fmr, page_list, list_len, iova);
Linus Torvalds1da177e2005-04-16 15:20:36 -07004198}
4199
4200/**
4201 * ib_unmap_fmr - Removes the mapping from a list of fast memory regions.
4202 * @fmr_list: A linked list of fast memory regions to unmap.
4203 */
4204int ib_unmap_fmr(struct list_head *fmr_list);
4205
4206/**
4207 * ib_dealloc_fmr - Deallocates a fast memory region.
4208 * @fmr: The fast memory region to deallocate.
4209 */
4210int ib_dealloc_fmr(struct ib_fmr *fmr);
4211
4212/**
4213 * ib_attach_mcast - Attaches the specified QP to a multicast group.
4214 * @qp: QP to attach to the multicast group. The QP must be type
4215 * IB_QPT_UD.
4216 * @gid: Multicast group GID.
4217 * @lid: Multicast group LID in host byte order.
4218 *
4219 * In order to send and receive multicast packets, subnet
4220 * administration must have created the multicast group and configured
4221 * the fabric appropriately. The port associated with the specified
4222 * QP must also be a member of the multicast group.
4223 */
4224int ib_attach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);
4225
4226/**
4227 * ib_detach_mcast - Detaches the specified QP from a multicast group.
4228 * @qp: QP to detach from the multicast group.
4229 * @gid: Multicast group GID.
4230 * @lid: Multicast group LID in host byte order.
4231 */
4232int ib_detach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);
4233
Sean Hefty59991f92011-05-23 17:52:46 -07004234/**
4235 * ib_alloc_xrcd - Allocates an XRC domain.
4236 * @device: The device on which to allocate the XRC domain.
Leon Romanovskyf66c8ba2018-01-28 11:17:19 +02004237 * @caller: Module name for kernel consumers
Sean Hefty59991f92011-05-23 17:52:46 -07004238 */
Leon Romanovskyf66c8ba2018-01-28 11:17:19 +02004239struct ib_xrcd *__ib_alloc_xrcd(struct ib_device *device, const char *caller);
4240#define ib_alloc_xrcd(device) \
4241 __ib_alloc_xrcd((device), KBUILD_MODNAME)
Sean Hefty59991f92011-05-23 17:52:46 -07004242
4243/**
4244 * ib_dealloc_xrcd - Deallocates an XRC domain.
4245 * @xrcd: The XRC domain to deallocate.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004246 * @udata: Valid user data or NULL for kernel object
Sean Hefty59991f92011-05-23 17:52:46 -07004247 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004248int ib_dealloc_xrcd(struct ib_xrcd *xrcd, struct ib_udata *udata);
Sean Hefty59991f92011-05-23 17:52:46 -07004249
Eli Cohen1c636f82013-10-31 15:26:32 +02004250static inline int ib_check_mr_access(int flags)
4251{
4252 /*
4253 * Local write permission is required if remote write or
4254 * remote atomic permission is also requested.
4255 */
4256 if (flags & (IB_ACCESS_REMOTE_ATOMIC | IB_ACCESS_REMOTE_WRITE) &&
4257 !(flags & IB_ACCESS_LOCAL_WRITE))
4258 return -EINVAL;
4259
4260 return 0;
4261}
4262
Jack Morgenstein08bb5582018-05-23 15:30:30 +03004263static inline bool ib_access_writable(int access_flags)
4264{
4265 /*
4266 * We have writable memory backing the MR if any of the following
4267 * access flags are set. "Local write" and "remote write" obviously
4268 * require write access. "Remote atomic" can do things like fetch and
4269 * add, which will modify memory, and "MW bind" can change permissions
4270 * by binding a window.
4271 */
4272 return access_flags &
4273 (IB_ACCESS_LOCAL_WRITE | IB_ACCESS_REMOTE_WRITE |
4274 IB_ACCESS_REMOTE_ATOMIC | IB_ACCESS_MW_BIND);
4275}
4276
Sagi Grimberg1b01d332014-02-23 14:19:05 +02004277/**
4278 * ib_check_mr_status: lightweight check of MR status.
4279 * This routine may provide status checks on a selected
4280 * ib_mr. first use is for signature status check.
4281 *
4282 * @mr: A memory region.
4283 * @check_mask: Bitmask of which checks to perform from
4284 * ib_mr_status_check enumeration.
4285 * @mr_status: The container of relevant status checks.
4286 * failed checks will be indicated in the status bitmask
4287 * and the relevant info shall be in the error item.
4288 */
4289int ib_check_mr_status(struct ib_mr *mr, u32 check_mask,
4290 struct ib_mr_status *mr_status);
4291
Jason Gunthorped79af722019-01-10 14:02:24 -07004292/**
4293 * ib_device_try_get: Hold a registration lock
4294 * device: The device to lock
4295 *
4296 * A device under an active registration lock cannot become unregistered. It
4297 * is only possible to obtain a registration lock on a device that is fully
4298 * registered, otherwise this function returns false.
4299 *
4300 * The registration lock is only necessary for actions which require the
4301 * device to still be registered. Uses that only require the device pointer to
4302 * be valid should use get_device(&ibdev->dev) to hold the memory.
4303 *
4304 */
4305static inline bool ib_device_try_get(struct ib_device *dev)
4306{
4307 return refcount_inc_not_zero(&dev->refcount);
4308}
4309
4310void ib_device_put(struct ib_device *device);
Jason Gunthorpe324e2272019-02-12 21:12:51 -07004311struct ib_device *ib_device_get_by_netdev(struct net_device *ndev,
4312 enum rdma_driver_id driver_id);
4313struct ib_device *ib_device_get_by_name(const char *name,
4314 enum rdma_driver_id driver_id);
Yotam Kenneth9268f722015-07-30 17:50:15 +03004315struct net_device *ib_get_net_dev_by_params(struct ib_device *dev, u8 port,
4316 u16 pkey, const union ib_gid *gid,
4317 const struct sockaddr *addr);
Jason Gunthorpec2261dd2019-02-12 21:12:50 -07004318int ib_device_set_netdev(struct ib_device *ib_dev, struct net_device *ndev,
4319 unsigned int port);
4320struct net_device *ib_device_netdev(struct ib_device *dev, u8 port);
4321
Yishai Hadas5fd251c2016-05-23 15:20:48 +03004322struct ib_wq *ib_create_wq(struct ib_pd *pd,
4323 struct ib_wq_init_attr *init_attr);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004324int ib_destroy_wq(struct ib_wq *wq, struct ib_udata *udata);
Yishai Hadas5fd251c2016-05-23 15:20:48 +03004325int ib_modify_wq(struct ib_wq *wq, struct ib_wq_attr *attr,
4326 u32 wq_attr_mask);
Yishai Hadas6d397862016-05-23 15:20:51 +03004327struct ib_rwq_ind_table *ib_create_rwq_ind_table(struct ib_device *device,
4328 struct ib_rwq_ind_table_init_attr*
4329 wq_ind_table_init_attr);
4330int ib_destroy_rwq_ind_table(struct ib_rwq_ind_table *wq_ind_table);
Yotam Kenneth9268f722015-07-30 17:50:15 +03004331
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004332int ib_map_mr_sg(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
Bart Van Assche9aa8b322016-05-12 10:49:15 -07004333 unsigned int *sg_offset, unsigned int page_size);
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004334
4335static inline int
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004336ib_map_mr_sg_zbva(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
Bart Van Assche9aa8b322016-05-12 10:49:15 -07004337 unsigned int *sg_offset, unsigned int page_size)
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004338{
4339 int n;
4340
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004341 n = ib_map_mr_sg(mr, sg, sg_nents, sg_offset, page_size);
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004342 mr->iova = 0;
4343
4344 return n;
4345}
4346
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004347int ib_sg_to_pages(struct ib_mr *mr, struct scatterlist *sgl, int sg_nents,
Bart Van Assche9aa8b322016-05-12 10:49:15 -07004348 unsigned int *sg_offset, int (*set_page)(struct ib_mr *, u64));
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004349
Steve Wise765d6772016-02-17 08:15:41 -08004350void ib_drain_rq(struct ib_qp *qp);
4351void ib_drain_sq(struct ib_qp *qp);
4352void ib_drain_qp(struct ib_qp *qp);
Moni Shoua850d8fd2016-11-10 11:30:56 +02004353
Yuval Shaiad4186192017-06-14 23:13:34 +03004354int ib_get_eth_speed(struct ib_device *dev, u8 port_num, u8 *speed, u8 *width);
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004355
4356static inline u8 *rdma_ah_retrieve_dmac(struct rdma_ah_attr *attr)
4357{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004358 if (attr->type == RDMA_AH_ATTR_TYPE_ROCE)
4359 return attr->roce.dmac;
4360 return NULL;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004361}
4362
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004363static inline void rdma_ah_set_dlid(struct rdma_ah_attr *attr, u32 dlid)
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004364{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004365 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004366 attr->ib.dlid = (u16)dlid;
4367 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4368 attr->opa.dlid = dlid;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004369}
4370
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004371static inline u32 rdma_ah_get_dlid(const struct rdma_ah_attr *attr)
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004372{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004373 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
4374 return attr->ib.dlid;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004375 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4376 return attr->opa.dlid;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004377 return 0;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004378}
4379
4380static inline void rdma_ah_set_sl(struct rdma_ah_attr *attr, u8 sl)
4381{
4382 attr->sl = sl;
4383}
4384
4385static inline u8 rdma_ah_get_sl(const struct rdma_ah_attr *attr)
4386{
4387 return attr->sl;
4388}
4389
4390static inline void rdma_ah_set_path_bits(struct rdma_ah_attr *attr,
4391 u8 src_path_bits)
4392{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004393 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
4394 attr->ib.src_path_bits = src_path_bits;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004395 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4396 attr->opa.src_path_bits = src_path_bits;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004397}
4398
4399static inline u8 rdma_ah_get_path_bits(const struct rdma_ah_attr *attr)
4400{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004401 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
4402 return attr->ib.src_path_bits;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004403 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4404 return attr->opa.src_path_bits;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004405 return 0;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004406}
4407
Don Hiattd98bb7f2017-08-04 13:54:16 -07004408static inline void rdma_ah_set_make_grd(struct rdma_ah_attr *attr,
4409 bool make_grd)
4410{
4411 if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4412 attr->opa.make_grd = make_grd;
4413}
4414
4415static inline bool rdma_ah_get_make_grd(const struct rdma_ah_attr *attr)
4416{
4417 if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4418 return attr->opa.make_grd;
4419 return false;
4420}
4421
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004422static inline void rdma_ah_set_port_num(struct rdma_ah_attr *attr, u8 port_num)
4423{
4424 attr->port_num = port_num;
4425}
4426
4427static inline u8 rdma_ah_get_port_num(const struct rdma_ah_attr *attr)
4428{
4429 return attr->port_num;
4430}
4431
4432static inline void rdma_ah_set_static_rate(struct rdma_ah_attr *attr,
4433 u8 static_rate)
4434{
4435 attr->static_rate = static_rate;
4436}
4437
4438static inline u8 rdma_ah_get_static_rate(const struct rdma_ah_attr *attr)
4439{
4440 return attr->static_rate;
4441}
4442
4443static inline void rdma_ah_set_ah_flags(struct rdma_ah_attr *attr,
4444 enum ib_ah_flags flag)
4445{
4446 attr->ah_flags = flag;
4447}
4448
4449static inline enum ib_ah_flags
4450 rdma_ah_get_ah_flags(const struct rdma_ah_attr *attr)
4451{
4452 return attr->ah_flags;
4453}
4454
4455static inline const struct ib_global_route
4456 *rdma_ah_read_grh(const struct rdma_ah_attr *attr)
4457{
4458 return &attr->grh;
4459}
4460
4461/*To retrieve and modify the grh */
4462static inline struct ib_global_route
4463 *rdma_ah_retrieve_grh(struct rdma_ah_attr *attr)
4464{
4465 return &attr->grh;
4466}
4467
4468static inline void rdma_ah_set_dgid_raw(struct rdma_ah_attr *attr, void *dgid)
4469{
4470 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4471
4472 memcpy(grh->dgid.raw, dgid, sizeof(grh->dgid));
4473}
4474
4475static inline void rdma_ah_set_subnet_prefix(struct rdma_ah_attr *attr,
4476 __be64 prefix)
4477{
4478 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4479
4480 grh->dgid.global.subnet_prefix = prefix;
4481}
4482
4483static inline void rdma_ah_set_interface_id(struct rdma_ah_attr *attr,
4484 __be64 if_id)
4485{
4486 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4487
4488 grh->dgid.global.interface_id = if_id;
4489}
4490
4491static inline void rdma_ah_set_grh(struct rdma_ah_attr *attr,
4492 union ib_gid *dgid, u32 flow_label,
4493 u8 sgid_index, u8 hop_limit,
4494 u8 traffic_class)
4495{
4496 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4497
4498 attr->ah_flags = IB_AH_GRH;
4499 if (dgid)
4500 grh->dgid = *dgid;
4501 grh->flow_label = flow_label;
4502 grh->sgid_index = sgid_index;
4503 grh->hop_limit = hop_limit;
4504 grh->traffic_class = traffic_class;
Jason Gunthorpe8d9ec9a2018-06-13 10:22:03 +03004505 grh->sgid_attr = NULL;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004506}
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004507
Jason Gunthorpe8d9ec9a2018-06-13 10:22:03 +03004508void rdma_destroy_ah_attr(struct rdma_ah_attr *ah_attr);
4509void rdma_move_grh_sgid_attr(struct rdma_ah_attr *attr, union ib_gid *dgid,
4510 u32 flow_label, u8 hop_limit, u8 traffic_class,
4511 const struct ib_gid_attr *sgid_attr);
Jason Gunthorped97099f2018-06-13 10:22:05 +03004512void rdma_copy_ah_attr(struct rdma_ah_attr *dest,
4513 const struct rdma_ah_attr *src);
4514void rdma_replace_ah_attr(struct rdma_ah_attr *old,
4515 const struct rdma_ah_attr *new);
4516void rdma_move_ah_attr(struct rdma_ah_attr *dest, struct rdma_ah_attr *src);
Jason Gunthorpe8d9ec9a2018-06-13 10:22:03 +03004517
Don Hiatt87daac62018-02-01 10:57:03 -08004518/**
4519 * rdma_ah_find_type - Return address handle type.
4520 *
4521 * @dev: Device to be checked
4522 * @port_num: Port number
4523 */
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004524static inline enum rdma_ah_attr_type rdma_ah_find_type(struct ib_device *dev,
Don Hiatt87daac62018-02-01 10:57:03 -08004525 u8 port_num)
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004526{
Parav Pandita6532e72018-01-12 07:58:42 +02004527 if (rdma_protocol_roce(dev, port_num))
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004528 return RDMA_AH_ATTR_TYPE_ROCE;
Don Hiatt87daac62018-02-01 10:57:03 -08004529 if (rdma_protocol_ib(dev, port_num)) {
4530 if (rdma_cap_opa_ah(dev, port_num))
4531 return RDMA_AH_ATTR_TYPE_OPA;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004532 return RDMA_AH_ATTR_TYPE_IB;
Don Hiatt87daac62018-02-01 10:57:03 -08004533 }
4534
4535 return RDMA_AH_ATTR_TYPE_UNDEFINED;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004536}
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004537
Hiatt, Don62ede772017-08-14 14:17:43 -04004538/**
4539 * ib_lid_cpu16 - Return lid in 16bit CPU encoding.
4540 * In the current implementation the only way to get
4541 * get the 32bit lid is from other sources for OPA.
4542 * For IB, lids will always be 16bits so cast the
4543 * value accordingly.
4544 *
4545 * @lid: A 32bit LID
4546 */
4547static inline u16 ib_lid_cpu16(u32 lid)
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004548{
Hiatt, Don62ede772017-08-14 14:17:43 -04004549 WARN_ON_ONCE(lid & 0xFFFF0000);
4550 return (u16)lid;
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004551}
4552
Hiatt, Don62ede772017-08-14 14:17:43 -04004553/**
4554 * ib_lid_be16 - Return lid in 16bit BE encoding.
4555 *
4556 * @lid: A 32bit LID
4557 */
4558static inline __be16 ib_lid_be16(u32 lid)
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004559{
Hiatt, Don62ede772017-08-14 14:17:43 -04004560 WARN_ON_ONCE(lid & 0xFFFF0000);
4561 return cpu_to_be16((u16)lid);
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004562}
Doug Ledford32043832017-08-10 14:31:29 -04004563
Sagi Grimbergc66cd352017-07-13 11:09:41 +03004564/**
4565 * ib_get_vector_affinity - Get the affinity mappings of a given completion
4566 * vector
4567 * @device: the rdma device
4568 * @comp_vector: index of completion vector
4569 *
4570 * Returns NULL on failure, otherwise a corresponding cpu map of the
4571 * completion vector (returns all-cpus map if the device driver doesn't
4572 * implement get_vector_affinity).
4573 */
4574static inline const struct cpumask *
4575ib_get_vector_affinity(struct ib_device *device, int comp_vector)
4576{
4577 if (comp_vector < 0 || comp_vector >= device->num_comp_vectors ||
Kamal Heib3023a1e2018-12-10 21:09:48 +02004578 !device->ops.get_vector_affinity)
Sagi Grimbergc66cd352017-07-13 11:09:41 +03004579 return NULL;
4580
Kamal Heib3023a1e2018-12-10 21:09:48 +02004581 return device->ops.get_vector_affinity(device, comp_vector);
Sagi Grimbergc66cd352017-07-13 11:09:41 +03004582
4583}
4584
/**
 * rdma_roce_rescan_device - Rescan all of the network devices in the system
 * and add their gids, as needed, to the relevant RoCE devices.
 *
 * @ibdev:         the rdma device
 */
void rdma_roce_rescan_device(struct ib_device *ibdev);
4592
Jason Gunthorpe8313c102018-11-25 20:51:13 +02004593struct ib_ucontext *ib_uverbs_get_ucontext_file(struct ib_uverbs_file *ufile);
Yishai Hadas7dc08dc2018-06-17 12:59:59 +03004594
Jason Gunthorpe15a1b4b2018-11-25 20:51:15 +02004595int uverbs_destroy_def_handler(struct uverbs_attr_bundle *attrs);
Denis Drozdovf6a8a192018-08-14 14:08:51 +03004596
4597struct net_device *rdma_alloc_netdev(struct ib_device *device, u8 port_num,
4598 enum rdma_netdev_t type, const char *name,
4599 unsigned char name_assign_type,
4600 void (*setup)(struct net_device *));
Denis Drozdov5d6b0cb2018-08-14 14:22:35 +03004601
4602int rdma_init_netdev(struct ib_device *device, u8 port_num,
4603 enum rdma_netdev_t type, const char *name,
4604 unsigned char name_assign_type,
4605 void (*setup)(struct net_device *),
4606 struct net_device *netdev);
4607
Parav Panditd4122f52018-10-11 22:31:53 +03004608/**
4609 * rdma_set_device_sysfs_group - Set device attributes group to have
4610 * driver specific sysfs entries at
4611 * for infiniband class.
4612 *
4613 * @device: device pointer for which attributes to be created
4614 * @group: Pointer to group which should be added when device
4615 * is registered with sysfs.
4616 * rdma_set_device_sysfs_group() allows existing drivers to expose one
4617 * group per device to have sysfs attributes.
4618 *
4619 * NOTE: New drivers should not make use of this API; instead new device
4620 * parameter should be exposed via netlink command. This API and mechanism
4621 * exist only for existing drivers.
4622 */
4623static inline void
4624rdma_set_device_sysfs_group(struct ib_device *dev,
4625 const struct attribute_group *group)
4626{
4627 dev->groups[1] = group;
4628}
4629
Parav Pandit54747232018-12-18 14:15:56 +02004630/**
4631 * rdma_device_to_ibdev - Get ib_device pointer from device pointer
4632 *
4633 * @device: device pointer for which ib_device pointer to retrieve
4634 *
4635 * rdma_device_to_ibdev() retrieves ib_device pointer from device.
4636 *
4637 */
4638static inline struct ib_device *rdma_device_to_ibdev(struct device *device)
4639{
Parav Panditcebe5562019-02-26 13:56:11 +02004640 struct ib_core_device *coredev =
4641 container_of(device, struct ib_core_device, dev);
4642
4643 return coredev->owner;
Parav Pandit54747232018-12-18 14:15:56 +02004644}
4645
/**
 * rdma_device_to_drv_device - Helper macro to reach back to driver's
 *			       ib_device holder structure from device pointer.
 *
 * @dev:		device pointer, passed to rdma_device_to_ibdev()
 * @drv_dev_struct:	type of the driver structure embedding the ib_device
 * @ibdev_member:	name of the ib_device member inside @drv_dev_struct
 *
 * Expands to container_of() applied to the ib_device obtained from @dev.
 *
 * NOTE: New drivers should not make use of this API; This API is only for
 * existing drivers who have exposed sysfs entries using
 * rdma_set_device_sysfs_group().
 */
#define rdma_device_to_drv_device(dev, drv_dev_struct, ibdev_member)           \
	container_of(rdma_device_to_ibdev(dev), drv_dev_struct, ibdev_member)
Parav Pandit41c61402019-02-26 14:01:46 +02004656
/*
 * Prototype only; the body is not part of this header section.
 * NOTE(review): presumably reports whether @device may be accessed from
 * net namespace @net - confirm against the implementation.
 */
bool rdma_dev_access_netns(const struct ib_device *device,
			   const struct net *net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07004659#endif /* IB_VERBS_H */