blob: dacf2b5ad8629de0233ed9f4e4b563fe28ef2d29 [file] [log] [blame]
/*
 * Copyright (c) 2004 Mellanox Technologies Ltd. All rights reserved.
 * Copyright (c) 2004 Infinicon Corporation. All rights reserved.
 * Copyright (c) 2004 Intel Corporation. All rights reserved.
 * Copyright (c) 2004 Topspin Corporation. All rights reserved.
 * Copyright (c) 2004 Voltaire Corporation. All rights reserved.
 * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
 * Copyright (c) 2005, 2006, 2007 Cisco Systems. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses. You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 * Redistribution and use in source and binary forms, with or
 * without modification, are permitted provided that the following
 * conditions are met:
 *
 * - Redistributions of source code must retain the above
 * copyright notice, this list of conditions and the following
 * disclaimer.
 *
 * - Redistributions in binary form must reproduce the above
 * copyright notice, this list of conditions and the following
 * disclaimer in the documentation and/or other materials
 * provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
38
39#if !defined(IB_VERBS_H)
40#define IB_VERBS_H
41
42#include <linux/types.h>
43#include <linux/device.h>
Ralph Campbell9b513092006-12-12 14:27:41 -080044#include <linux/dma-mapping.h>
Michael S. Tsirkin459d6e22007-02-04 14:11:55 -080045#include <linux/kref.h>
Dotan Barakbfb3ea12007-07-31 16:49:15 +030046#include <linux/list.h>
47#include <linux/rwsem.h>
Tejun Heof0626712010-10-19 15:24:36 +000048#include <linux/workqueue.h>
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -080049#include <linux/irq_poll.h>
Matan Barakdd5f03b2013-12-12 18:03:11 +020050#include <uapi/linux/if_ether.h>
Somnath Koturc865f242015-12-23 14:56:51 +020051#include <net/ipv6.h>
52#include <net/ip.h>
Matan Barak301a7212015-12-15 20:30:10 +020053#include <linux/string.h>
54#include <linux/slab.h>
Vishwanathapura, Niranjana2fc77572017-04-12 20:29:20 -070055#include <linux/netdevice.h>
Parav Pandit01b67112018-11-16 03:50:57 +020056#include <linux/refcount.h>
Eli Cohen50174a72016-03-11 22:58:38 +020057#include <linux/if_link.h>
Arun Sharma600634972011-07-26 16:09:06 -070058#include <linux/atomic.h>
Haggai Eran882214e2014-12-11 17:04:18 +020059#include <linux/mmu_notifier.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080060#include <linux/uaccess.h>
Parav Pandit43579b52017-01-10 00:02:14 +000061#include <linux/cgroup_rdma.h>
Leon Romanovskyf6316032019-03-28 15:12:58 +020062#include <linux/irqflags.h>
63#include <linux/preempt.h>
Nicolas Dichtelea6819e2017-03-27 14:20:14 +020064#include <uapi/rdma/ib_user_verbs.h>
Leon Romanovsky02d88832018-01-28 11:17:20 +020065#include <rdma/restrack.h>
Matan Barak0ede73b2018-03-19 15:02:34 +020066#include <uapi/rdma/rdma_user_ioctl.h>
Matan Barak2eb9bea2018-03-28 09:27:45 +030067#include <uapi/rdma/ib_user_ioctl_verbs.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Leon Romanovsky9abb0d12017-06-27 16:49:53 +030069#define IB_FW_VERSION_NAME_MAX ETHTOOL_FWVERS_LEN
70
Jason Gunthorpeb5231b02018-09-16 20:48:04 +030071struct ib_umem_odp;
72
Tejun Heof0626712010-10-19 15:24:36 +000073extern struct workqueue_struct *ib_wq;
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -080074extern struct workqueue_struct *ib_comp_wq;
Jack Morgensteinf7948092018-08-27 08:35:55 +030075extern struct workqueue_struct *ib_comp_unbound_wq;
Tejun Heof0626712010-10-19 15:24:36 +000076
Gal Pressman923abb92019-05-01 13:48:13 +030077__printf(3, 4) __cold
78void ibdev_printk(const char *level, const struct ib_device *ibdev,
79 const char *format, ...);
80__printf(2, 3) __cold
81void ibdev_emerg(const struct ib_device *ibdev, const char *format, ...);
82__printf(2, 3) __cold
83void ibdev_alert(const struct ib_device *ibdev, const char *format, ...);
84__printf(2, 3) __cold
85void ibdev_crit(const struct ib_device *ibdev, const char *format, ...);
86__printf(2, 3) __cold
87void ibdev_err(const struct ib_device *ibdev, const char *format, ...);
88__printf(2, 3) __cold
89void ibdev_warn(const struct ib_device *ibdev, const char *format, ...);
90__printf(2, 3) __cold
91void ibdev_notice(const struct ib_device *ibdev, const char *format, ...);
92__printf(2, 3) __cold
93void ibdev_info(const struct ib_device *ibdev, const char *format, ...);
94
95#if defined(CONFIG_DYNAMIC_DEBUG)
96#define ibdev_dbg(__dev, format, args...) \
97 dynamic_ibdev_dbg(__dev, format, ##args)
98#elif defined(DEBUG)
99#define ibdev_dbg(__dev, format, args...) \
100 ibdev_printk(KERN_DEBUG, __dev, format, ##args)
101#else
102__printf(2, 3) __cold
103static inline
104void ibdev_dbg(const struct ib_device *ibdev, const char *format, ...) {}
105#endif
106
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107union ib_gid {
108 u8 raw[16];
109 struct {
Sean Hefty97f52eb2005-08-13 21:05:57 -0700110 __be64 subnet_prefix;
111 __be64 interface_id;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 } global;
113};
114
Moni Shouae26be1b2015-07-30 18:33:29 +0300115extern union ib_gid zgid;
116
/*
 * GID types. IB_GID_TYPE_IB and IB_GID_TYPE_ROCE deliberately share the
 * value 0; IB_GID_TYPE_SIZE is the number of distinct values.
 */
enum ib_gid_type {
	/* If link layer is Ethernet, this is RoCE V1 */
	IB_GID_TYPE_IB			= 0,
	IB_GID_TYPE_ROCE		= 0,
	IB_GID_TYPE_ROCE_UDP_ENCAP	= 1,
	IB_GID_TYPE_SIZE
};
124
Moni Shoua7ead4bc2016-01-14 17:50:38 +0200125#define ROCE_V2_UDP_DPORT 4791
Matan Barak03db3a22015-07-30 18:33:26 +0300126struct ib_gid_attr {
Parav Pandit943bd982019-05-02 10:48:07 +0300127 struct net_device __rcu *ndev;
Parav Pandit598ff6b2018-04-01 15:08:21 +0300128 struct ib_device *device;
Parav Panditb150c382018-06-05 08:40:15 +0300129 union ib_gid gid;
Parav Pandit598ff6b2018-04-01 15:08:21 +0300130 enum ib_gid_type gid_type;
131 u16 index;
132 u8 port_num;
Matan Barak03db3a22015-07-30 18:33:26 +0300133};
134
/* RDMA node types; numbering starts at 1. */
enum rdma_node_type {
	/* IB values map to NodeInfo:NodeType. */
	RDMA_NODE_IB_CA		= 1,
	RDMA_NODE_IB_SWITCH,
	RDMA_NODE_IB_ROUTER,
	RDMA_NODE_RNIC,
	RDMA_NODE_USNIC,
	RDMA_NODE_USNIC_UDP,
	RDMA_NODE_UNSPECIFIED,
};
145
Eli Cohena0c1b2a2016-03-11 22:58:37 +0200146enum {
147 /* set the local administered indication */
148 IB_SA_WELL_KNOWN_GUID = BIT_ULL(57) | 2,
149};
150
/* RDMA transport types; implicit numbering from 0. */
enum rdma_transport_type {
	RDMA_TRANSPORT_IB,
	RDMA_TRANSPORT_IWARP,
	RDMA_TRANSPORT_USNIC,
	RDMA_TRANSPORT_USNIC_UDP,
	RDMA_TRANSPORT_UNSPECIFIED,
};
158
/* RDMA protocol types; implicit numbering from 0. */
enum rdma_protocol_type {
	RDMA_PROTOCOL_IB,
	RDMA_PROTOCOL_IBOE,
	RDMA_PROTOCOL_IWARP,
	RDMA_PROTOCOL_USNIC_UDP
};
165
Roland Dreier8385fd82014-06-04 10:00:16 -0700166__attribute_const__ enum rdma_transport_type
167rdma_node_get_transport(enum rdma_node_type node_type);
Tom Tucker07ebafb2006-08-03 16:02:42 -0500168
/*
 * Network types. RDMA_NETWORK_ROCE_V1 is an alias of RDMA_NETWORK_IB, so
 * the two cannot be told apart by value.
 */
enum rdma_network_type {
	RDMA_NETWORK_IB,
	RDMA_NETWORK_ROCE_V1 = RDMA_NETWORK_IB,
	RDMA_NETWORK_IPV4,
	RDMA_NETWORK_IPV6
};
175
176static inline enum ib_gid_type ib_network_to_gid_type(enum rdma_network_type network_type)
177{
178 if (network_type == RDMA_NETWORK_IPV4 ||
179 network_type == RDMA_NETWORK_IPV6)
180 return IB_GID_TYPE_ROCE_UDP_ENCAP;
181
182 /* IB_GID_TYPE_IB same as RDMA_NETWORK_ROCE_V1 */
183 return IB_GID_TYPE_IB;
184}
185
Parav Pandit47ec3862018-06-13 10:22:06 +0300186static inline enum rdma_network_type
187rdma_gid_attr_network_type(const struct ib_gid_attr *attr)
Somnath Koturc865f242015-12-23 14:56:51 +0200188{
Parav Pandit47ec3862018-06-13 10:22:06 +0300189 if (attr->gid_type == IB_GID_TYPE_IB)
Somnath Koturc865f242015-12-23 14:56:51 +0200190 return RDMA_NETWORK_IB;
191
Parav Pandit47ec3862018-06-13 10:22:06 +0300192 if (ipv6_addr_v4mapped((struct in6_addr *)&attr->gid))
Somnath Koturc865f242015-12-23 14:56:51 +0200193 return RDMA_NETWORK_IPV4;
194 else
195 return RDMA_NETWORK_IPV6;
196}
197
/* Link layer of a port; implicit numbering from 0. */
enum rdma_link_layer {
	IB_LINK_LAYER_UNSPECIFIED,
	IB_LINK_LAYER_INFINIBAND,
	IB_LINK_LAYER_ETHERNET,
};
203
/*
 * Device capability bit flags. Bits 31 and above are built from 1ULL, so
 * the enumerators do not all fit in an int; struct ib_device_attr stores
 * its device_cap_flags in a u64. Bits 9 and 16 are retired (see the notes
 * below) and bit 28 is not assigned here.
 */
enum ib_device_cap_flags {
	IB_DEVICE_RESIZE_MAX_WR			= (1 << 0),
	IB_DEVICE_BAD_PKEY_CNTR			= (1 << 1),
	IB_DEVICE_BAD_QKEY_CNTR			= (1 << 2),
	IB_DEVICE_RAW_MULTI			= (1 << 3),
	IB_DEVICE_AUTO_PATH_MIG			= (1 << 4),
	IB_DEVICE_CHANGE_PHY_PORT		= (1 << 5),
	IB_DEVICE_UD_AV_PORT_ENFORCE		= (1 << 6),
	IB_DEVICE_CURR_QP_STATE_MOD		= (1 << 7),
	IB_DEVICE_SHUTDOWN_PORT			= (1 << 8),
	/* Not in use, former INIT_TYPE		= (1 << 9),*/
	IB_DEVICE_PORT_ACTIVE_EVENT		= (1 << 10),
	IB_DEVICE_SYS_IMAGE_GUID		= (1 << 11),
	IB_DEVICE_RC_RNR_NAK_GEN		= (1 << 12),
	IB_DEVICE_SRQ_RESIZE			= (1 << 13),
	IB_DEVICE_N_NOTIFY_CQ			= (1 << 14),

	/*
	 * This device supports a per-device lkey or stag that can be
	 * used without performing a memory registration for the local
	 * memory.  Note that ULPs should never check this flag, but
	 * instead use the local_dma_lkey flag in the ib_pd structure,
	 * which will always contain a usable lkey.
	 */
	IB_DEVICE_LOCAL_DMA_LKEY		= (1 << 15),
	/* Reserved, old SEND_W_INV		= (1 << 16),*/
	IB_DEVICE_MEM_WINDOW			= (1 << 17),
	/*
	 * Devices should set IB_DEVICE_UD_IP_CSUM if they support
	 * insertion of UDP and TCP checksum on outgoing UD IPoIB
	 * messages and can verify the validity of checksum for
	 * incoming messages.  Setting this flag implies that the
	 * IPoIB driver may set NETIF_F_IP_CSUM for datagram mode.
	 */
	IB_DEVICE_UD_IP_CSUM			= (1 << 18),
	IB_DEVICE_UD_TSO			= (1 << 19),
	IB_DEVICE_XRC				= (1 << 20),

	/*
	 * This device supports the IB "base memory management extension",
	 * which includes support for fast registrations (IB_WR_REG_MR,
	 * IB_WR_LOCAL_INV and IB_WR_SEND_WITH_INV verbs).  This flag should
	 * also be set by any iWarp device which must support FRs to comply
	 * to the iWarp verbs spec.  iWarp devices also support the
	 * IB_WR_RDMA_READ_WITH_INV verb for RDMA READs that invalidate the
	 * stag.
	 */
	IB_DEVICE_MEM_MGT_EXTENSIONS		= (1 << 21),
	IB_DEVICE_BLOCK_MULTICAST_LOOPBACK	= (1 << 22),
	IB_DEVICE_MEM_WINDOW_TYPE_2A		= (1 << 23),
	IB_DEVICE_MEM_WINDOW_TYPE_2B		= (1 << 24),
	IB_DEVICE_RC_IP_CSUM			= (1 << 25),
	/* Deprecated. Please use IB_RAW_PACKET_CAP_IP_CSUM. */
	IB_DEVICE_RAW_IP_CSUM			= (1 << 26),
	/*
	 * Devices should set IB_DEVICE_CROSS_CHANNEL if they
	 * support execution of WQEs that involve synchronization
	 * of I/O operations with single completion queue managed
	 * by hardware.
	 */
	IB_DEVICE_CROSS_CHANNEL			= (1 << 27),
	IB_DEVICE_MANAGED_FLOW_STEERING		= (1 << 29),
	IB_DEVICE_SIGNATURE_HANDOVER		= (1 << 30),
	IB_DEVICE_ON_DEMAND_PAGING		= (1ULL << 31),
	IB_DEVICE_SG_GAPS_REG			= (1ULL << 32),
	IB_DEVICE_VIRTUAL_FUNCTION		= (1ULL << 33),
	/* Deprecated. Please use IB_RAW_PACKET_CAP_SCATTER_FCS. */
	IB_DEVICE_RAW_SCATTER_FCS		= (1ULL << 34),
	IB_DEVICE_RDMA_NETDEV_OPA_VNIC		= (1ULL << 35),
	/* The device supports padding incoming writes to cacheline. */
	IB_DEVICE_PCI_WRITE_END_PADDING		= (1ULL << 36),
	IB_DEVICE_ALLOW_USER_UNREG		= (1ULL << 37),
};
277
/* Signature protection capability bits (one bit per T10-DIF type). */
enum ib_signature_prot_cap {
	IB_PROT_T10DIF_TYPE_1 = 1,
	IB_PROT_T10DIF_TYPE_2 = 1 << 1,
	IB_PROT_T10DIF_TYPE_3 = 1 << 2,
};
283
/* Signature guard capability bits. */
enum ib_signature_guard_cap {
	IB_GUARD_T10DIF_CRC	= 1,
	IB_GUARD_T10DIF_CSUM	= 1 << 1,
};
288
/* Atomic operation capability levels; implicit numbering from 0. */
enum ib_atomic_cap {
	IB_ATOMIC_NONE,
	IB_ATOMIC_HCA,
	IB_ATOMIC_GLOB
};
294
/* General ODP capability bits. */
enum ib_odp_general_cap_bits {
	IB_ODP_SUPPORT		= 1 << 0,
	IB_ODP_SUPPORT_IMPLICIT	= 1 << 1,
};
299
/* Per-transport ODP capability bits. */
enum ib_odp_transport_cap_bits {
	IB_ODP_SUPPORT_SEND	= 1 << 0,
	IB_ODP_SUPPORT_RECV	= 1 << 1,
	IB_ODP_SUPPORT_WRITE	= 1 << 2,
	IB_ODP_SUPPORT_READ	= 1 << 3,
	IB_ODP_SUPPORT_ATOMIC	= 1 << 4,
	IB_ODP_SUPPORT_SRQ_RECV	= 1 << 5,
};
308
/*
 * ODP capabilities: one 64-bit general mask plus a 32-bit mask for each of
 * the RC, UC, UD and XRC transports.
 */
struct ib_odp_caps {
	uint64_t general_caps;
	struct {
		uint32_t  rc_odp_caps;
		uint32_t  uc_odp_caps;
		uint32_t  ud_odp_caps;
		uint32_t  xrc_odp_caps;
	} per_transport_caps;
};
318
Yishai Hadasccf20562016-08-28 11:28:43 +0300319struct ib_rss_caps {
320 /* Corresponding bit will be set if qp type from
321 * 'enum ib_qp_type' is supported, e.g.
322 * supported_qpts |= 1 << IB_QPT_UD
323 */
324 u32 supported_qpts;
325 u32 max_rwq_indirection_tables;
326 u32 max_rwq_indirection_table_size;
327};
328
/* Tag-matching capability flags, stored in ib_tm_caps.flags. */
enum ib_tm_cap_flags {
	/*  Support tag matching on RC transport */
	IB_TM_CAP_RC		    = 1 << 0,
};
333
Leon Romanovsky78b1beb2017-09-24 21:46:29 +0300334struct ib_tm_caps {
Artemy Kovalyov6938fc1e2017-08-17 15:52:03 +0300335 /* Max size of RNDV header */
336 u32 max_rndv_hdr_size;
337 /* Max number of entries in tag matching list */
338 u32 max_num_tags;
339 /* From enum ib_tm_cap_flags */
340 u32 flags;
341 /* Max number of outstanding list operations */
342 u32 max_ops;
343 /* Max number of SGE in tag matching entry */
344 u32 max_sge;
345};
346
Matan Barakbcf4c1e2015-06-11 16:35:20 +0300347struct ib_cq_init_attr {
348 unsigned int cqe;
349 int comp_vector;
350 u32 flags;
351};
352
/* Completion queue attribute mask bits. */
enum ib_cq_attr_mask {
	IB_CQ_MODERATE = 1 << 0,
};
356
Yonatan Cohen18bd9072017-11-13 10:51:16 +0200357struct ib_cq_caps {
358 u16 max_cq_moderation_count;
359 u16 max_cq_moderation_period;
360};
361
Ariel Levkovichbe934cc2018-04-05 18:53:25 +0300362struct ib_dm_mr_attr {
363 u64 length;
364 u64 offset;
365 u32 access_flags;
366};
367
Ariel Levkovichbee76d72018-04-05 18:53:24 +0300368struct ib_dm_alloc_attr {
369 u64 length;
370 u32 alignment;
371 u32 flags;
372};
373
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374struct ib_device_attr {
375 u64 fw_ver;
Sean Hefty97f52eb2005-08-13 21:05:57 -0700376 __be64 sys_image_guid;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377 u64 max_mr_size;
378 u64 page_size_cap;
379 u32 vendor_id;
380 u32 vendor_part_id;
381 u32 hw_ver;
382 int max_qp;
383 int max_qp_wr;
Leon Romanovskyfb532d62016-02-23 10:25:25 +0200384 u64 device_cap_flags;
Steve Wise33023fb2018-06-18 08:05:26 -0700385 int max_send_sge;
386 int max_recv_sge;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700387 int max_sge_rd;
388 int max_cq;
389 int max_cqe;
390 int max_mr;
391 int max_pd;
392 int max_qp_rd_atom;
393 int max_ee_rd_atom;
394 int max_res_rd_atom;
395 int max_qp_init_rd_atom;
396 int max_ee_init_rd_atom;
397 enum ib_atomic_cap atomic_cap;
Vladimir Sokolovsky5e80ba82010-04-14 17:23:01 +0300398 enum ib_atomic_cap masked_atomic_cap;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 int max_ee;
400 int max_rdd;
401 int max_mw;
402 int max_raw_ipv6_qp;
403 int max_raw_ethy_qp;
404 int max_mcast_grp;
405 int max_mcast_qp_attach;
406 int max_total_mcast_qp_attach;
407 int max_ah;
408 int max_fmr;
409 int max_map_per_fmr;
410 int max_srq;
411 int max_srq_wr;
412 int max_srq_sge;
Steve Wise00f7ec32008-07-14 23:48:45 -0700413 unsigned int max_fast_reg_page_list_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 u16 max_pkeys;
415 u8 local_ca_ack_delay;
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200416 int sig_prot_cap;
417 int sig_guard_cap;
Sagi Grimberg860f10a2014-12-11 17:04:16 +0200418 struct ib_odp_caps odp_caps;
Matan Barak24306dc2015-06-11 16:35:24 +0300419 uint64_t timestamp_mask;
420 uint64_t hca_core_clock; /* in KHZ */
Yishai Hadasccf20562016-08-28 11:28:43 +0300421 struct ib_rss_caps rss_caps;
422 u32 max_wq_type_rq;
Noa Osherovichebaaee22017-01-18 15:39:54 +0200423 u32 raw_packet_caps; /* Use ib_raw_packet_caps enum */
Leon Romanovsky78b1beb2017-09-24 21:46:29 +0300424 struct ib_tm_caps tm_caps;
Yonatan Cohen18bd9072017-11-13 10:51:16 +0200425 struct ib_cq_caps cq_caps;
Ariel Levkovich1d8eeb92018-04-05 18:53:23 +0300426 u64 max_dm_size;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700427};
428
/* MTU encodings: value k stands for an MTU of 128 << k bytes (k = 1..5). */
enum ib_mtu {
	IB_MTU_256  = 1,
	IB_MTU_512  = 2,
	IB_MTU_1024 = 3,
	IB_MTU_2048 = 4,
	IB_MTU_4096 = 5
};

/*
 * ib_mtu_enum_to_int - convert an MTU encoding to its size in bytes.
 * @mtu: encoded MTU.
 *
 * Returns the byte count, or -1 if @mtu is not one of the enumerators.
 */
static inline int ib_mtu_enum_to_int(enum ib_mtu mtu)
{
	switch (mtu) {
	case IB_MTU_256:  return  256;
	case IB_MTU_512:  return  512;
	case IB_MTU_1024: return 1024;
	case IB_MTU_2048: return 2048;
	case IB_MTU_4096: return 4096;
	default: 	  return -1;
	}
}

/*
 * ib_mtu_int_to_enum - convert a byte count to an MTU encoding.
 * @mtu: MTU in bytes.
 *
 * Rounds down to the largest encodable MTU that does not exceed @mtu.
 * Values below 512, including zero and negative values, yield IB_MTU_256.
 */
static inline enum ib_mtu ib_mtu_int_to_enum(int mtu)
{
	if (mtu >= 4096)
		return IB_MTU_4096;
	else if (mtu >= 2048)
		return IB_MTU_2048;
	else if (mtu >= 1024)
		return IB_MTU_1024;
	else if (mtu >= 512)
		return IB_MTU_512;
	else
		return IB_MTU_256;
}
462
/* Port states, explicitly numbered 0..5. */
enum ib_port_state {
	IB_PORT_NOP		= 0,
	IB_PORT_DOWN		= 1,
	IB_PORT_INIT		= 2,
	IB_PORT_ARMED		= 3,
	IB_PORT_ACTIVE		= 4,
	IB_PORT_ACTIVE_DEFER	= 5
};
471
/*
 * Port width encodings, one bit each. The values are not in width order:
 * IB_WIDTH_2X is 16, while 4X, 8X and 12X are 2, 4 and 8.
 */
enum ib_port_width {
	IB_WIDTH_1X	= 1,
	IB_WIDTH_2X	= 16,
	IB_WIDTH_4X	= 2,
	IB_WIDTH_8X	= 4,
	IB_WIDTH_12X	= 8
};

/*
 * ib_width_enum_to_int - convert a width encoding to its lane count.
 * @width: encoded port width.
 *
 * Returns 1, 2, 4, 8 or 12, or -1 if @width is not one of the enumerators
 * (combinations of several bits are not accepted).
 */
static inline int ib_width_enum_to_int(enum ib_port_width width)
{
	switch (width) {
	case IB_WIDTH_1X:  return  1;
	case IB_WIDTH_2X:  return  2;
	case IB_WIDTH_4X:  return  4;
	case IB_WIDTH_8X:  return  8;
	case IB_WIDTH_12X: return 12;
	default: 	  return -1;
	}
}
491
/* Port speed encodings, one bit each. */
enum ib_port_speed {
	IB_SPEED_SDR	= 1,
	IB_SPEED_DDR	= 2,
	IB_SPEED_QDR	= 4,
	IB_SPEED_FDR10	= 8,
	IB_SPEED_FDR	= 16,
	IB_SPEED_EDR	= 32,
	IB_SPEED_HDR	= 64
};
501
Christoph Lameterb40f4752016-05-16 12:49:33 -0500502/**
503 * struct rdma_hw_stats
Mark Bloche9451302018-03-27 15:51:05 +0300504 * @lock - Mutex to protect parallel write access to lifespan and values
505 * of counters, which are 64bits and not guaranteeed to be written
506 * atomicaly on 32bits systems.
Christoph Lameterb40f4752016-05-16 12:49:33 -0500507 * @timestamp - Used by the core code to track when the last update was
508 * @lifespan - Used by the core code to determine how old the counters
509 * should be before being updated again. Stored in jiffies, defaults
510 * to 10 milliseconds, drivers can override the default be specifying
511 * their own value during their allocation routine.
512 * @name - Array of pointers to static names used for the counters in
513 * directory.
514 * @num_counters - How many hardware counters there are. If name is
515 * shorter than this number, a kernel oops will result. Driver authors
516 * are encouraged to leave BUILD_BUG_ON(ARRAY_SIZE(@name) < num_counters)
517 * in their code to prevent this.
518 * @value - Array of u64 counters that are accessed by the sysfs code and
519 * filled in by the drivers get_stats routine
520 */
521struct rdma_hw_stats {
Mark Bloche9451302018-03-27 15:51:05 +0300522 struct mutex lock; /* Protect lifespan and values[] */
Christoph Lameterb40f4752016-05-16 12:49:33 -0500523 unsigned long timestamp;
524 unsigned long lifespan;
525 const char * const *names;
526 int num_counters;
527 u64 value[];
Steve Wise7f624d02008-07-14 23:48:48 -0700528};
529
Christoph Lameterb40f4752016-05-16 12:49:33 -0500530#define RDMA_HW_STATS_DEFAULT_LIFESPAN 10
531/**
532 * rdma_alloc_hw_stats_struct - Helper function to allocate dynamic struct
533 * for drivers.
534 * @names - Array of static const char *
535 * @num_counters - How many elements in array
536 * @lifespan - How many milliseconds between updates
537 */
538static inline struct rdma_hw_stats *rdma_alloc_hw_stats_struct(
539 const char * const *names, int num_counters,
540 unsigned long lifespan)
541{
542 struct rdma_hw_stats *stats;
Steve Wise7f624d02008-07-14 23:48:48 -0700543
Christoph Lameterb40f4752016-05-16 12:49:33 -0500544 stats = kzalloc(sizeof(*stats) + num_counters * sizeof(u64),
545 GFP_KERNEL);
546 if (!stats)
547 return NULL;
548 stats->names = names;
549 stats->num_counters = num_counters;
550 stats->lifespan = msecs_to_jiffies(lifespan);
Steve Wise7f624d02008-07-14 23:48:48 -0700551
Christoph Lameterb40f4752016-05-16 12:49:33 -0500552 return stats;
553}
554
Steve Wise7f624d02008-07-14 23:48:48 -0700555
/* Define bits for the various functionality this port needs to be supported by
 * the core.
 */
/* Management                           0x00000FFF */
#define RDMA_CORE_CAP_IB_MAD            0x00000001
#define RDMA_CORE_CAP_IB_SMI            0x00000002
#define RDMA_CORE_CAP_IB_CM             0x00000004
#define RDMA_CORE_CAP_IW_CM             0x00000008
#define RDMA_CORE_CAP_IB_SA             0x00000010
#define RDMA_CORE_CAP_OPA_MAD           0x00000020

/* Address format                       0x000FF000 */
#define RDMA_CORE_CAP_AF_IB             0x00001000
#define RDMA_CORE_CAP_ETH_AH            0x00002000
#define RDMA_CORE_CAP_OPA_AH            0x00004000
#define RDMA_CORE_CAP_IB_GRH_REQUIRED   0x00008000

/* Protocol                             0xFFF00000 */
#define RDMA_CORE_CAP_PROT_IB           0x00100000
#define RDMA_CORE_CAP_PROT_ROCE         0x00200000
#define RDMA_CORE_CAP_PROT_IWARP        0x00400000
#define RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP 0x00800000
#define RDMA_CORE_CAP_PROT_RAW_PACKET   0x01000000
#define RDMA_CORE_CAP_PROT_USNIC        0x02000000

/* Composite masks: each RDMA_CORE_PORT_* value ORs the bits defined above. */
#define RDMA_CORE_PORT_IB_GRH_REQUIRED (RDMA_CORE_CAP_IB_GRH_REQUIRED \
					| RDMA_CORE_CAP_PROT_ROCE     \
					| RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP)

#define RDMA_CORE_PORT_IBA_IB          (RDMA_CORE_CAP_PROT_IB  \
					| RDMA_CORE_CAP_IB_MAD \
					| RDMA_CORE_CAP_IB_SMI \
					| RDMA_CORE_CAP_IB_CM  \
					| RDMA_CORE_CAP_IB_SA  \
					| RDMA_CORE_CAP_AF_IB)
#define RDMA_CORE_PORT_IBA_ROCE        (RDMA_CORE_CAP_PROT_ROCE \
					| RDMA_CORE_CAP_IB_MAD  \
					| RDMA_CORE_CAP_IB_CM   \
					| RDMA_CORE_CAP_AF_IB   \
					| RDMA_CORE_CAP_ETH_AH)
#define RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP			\
					(RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP \
					| RDMA_CORE_CAP_IB_MAD  \
					| RDMA_CORE_CAP_IB_CM   \
					| RDMA_CORE_CAP_AF_IB   \
					| RDMA_CORE_CAP_ETH_AH)
#define RDMA_CORE_PORT_IWARP           (RDMA_CORE_CAP_PROT_IWARP \
					| RDMA_CORE_CAP_IW_CM)
#define RDMA_CORE_PORT_INTEL_OPA       (RDMA_CORE_PORT_IBA_IB  \
					| RDMA_CORE_CAP_OPA_MAD)

#define RDMA_CORE_PORT_RAW_PACKET	(RDMA_CORE_CAP_PROT_RAW_PACKET)

#define RDMA_CORE_PORT_USNIC		(RDMA_CORE_CAP_PROT_USNIC)
610
Linus Torvalds1da177e2005-04-16 15:20:36 -0700611struct ib_port_attr {
Eli Cohenfad61ad2016-03-11 22:58:36 +0200612 u64 subnet_prefix;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 enum ib_port_state state;
614 enum ib_mtu max_mtu;
615 enum ib_mtu active_mtu;
616 int gid_tbl_len;
Jason Gunthorpe2f944c02018-07-04 15:57:48 +0300617 unsigned int ip_gids:1;
618 /* This is the value from PortInfo CapabilityMask, defined by IBA */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619 u32 port_cap_flags;
620 u32 max_msg_sz;
621 u32 bad_pkey_cntr;
622 u32 qkey_viol_cntr;
623 u16 pkey_tbl_len;
Dasaratharaman Chandramoulidb585402017-06-08 13:37:48 -0400624 u32 sm_lid;
Dasaratharaman Chandramouli582faf32017-06-08 13:37:47 -0400625 u32 lid;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626 u8 lmc;
627 u8 max_vl_num;
628 u8 sm_sl;
629 u8 subnet_timeout;
630 u8 init_type_reply;
631 u8 active_width;
632 u8 active_speed;
633 u8 phys_state;
Michael Guralnik1e8f43b2018-12-09 11:49:48 +0200634 u16 port_cap_flags2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700635};
636
/* Mask bits selecting which ib_device_modify fields to apply. */
enum ib_device_modify_flags {
	IB_DEVICE_MODIFY_SYS_IMAGE_GUID	= 1 << 0,
	IB_DEVICE_MODIFY_NODE_DESC	= 1 << 1
};
641
Yuval Shaiabd99fde2016-08-25 10:57:07 -0700642#define IB_DEVICE_NODE_DESC_MAX 64
643
Linus Torvalds1da177e2005-04-16 15:20:36 -0700644struct ib_device_modify {
645 u64 sys_image_guid;
Yuval Shaiabd99fde2016-08-25 10:57:07 -0700646 char node_desc[IB_DEVICE_NODE_DESC_MAX];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700647};
648
/* Port modification flag bits; note that bit 1 (value 2) is not defined. */
enum ib_port_modify_flags {
	IB_PORT_SHUTDOWN		= 1,
	IB_PORT_INIT_TYPE		= (1<<2),
	IB_PORT_RESET_QKEY_CNTR		= (1<<3),
	IB_PORT_OPA_MASK_CHG		= (1<<4)
};
655
656struct ib_port_modify {
657 u32 set_port_cap_mask;
658 u32 clr_port_cap_mask;
659 u8 init_type;
660};
661
/* Asynchronous event types; implicit numbering from 0. */
enum ib_event_type {
	IB_EVENT_CQ_ERR,
	IB_EVENT_QP_FATAL,
	IB_EVENT_QP_REQ_ERR,
	IB_EVENT_QP_ACCESS_ERR,
	IB_EVENT_COMM_EST,
	IB_EVENT_SQ_DRAINED,
	IB_EVENT_PATH_MIG,
	IB_EVENT_PATH_MIG_ERR,
	IB_EVENT_DEVICE_FATAL,
	IB_EVENT_PORT_ACTIVE,
	IB_EVENT_PORT_ERR,
	IB_EVENT_LID_CHANGE,
	IB_EVENT_PKEY_CHANGE,
	IB_EVENT_SM_CHANGE,
	IB_EVENT_SRQ_ERR,
	IB_EVENT_SRQ_LIMIT_REACHED,
	IB_EVENT_QP_LAST_WQE_REACHED,
	IB_EVENT_CLIENT_REREGISTER,
	IB_EVENT_GID_CHANGE,
	IB_EVENT_WQ_FATAL,
};
684
Bart Van Asschedb7489e2015-08-03 10:01:52 -0700685const char *__attribute_const__ ib_event_msg(enum ib_event_type event);
Sagi Grimberg2b1b5b62015-05-18 13:40:28 +0300686
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687struct ib_event {
688 struct ib_device *device;
689 union {
690 struct ib_cq *cq;
691 struct ib_qp *qp;
Roland Dreierd41fcc62005-08-18 12:23:08 -0700692 struct ib_srq *srq;
Yishai Hadasf213c052016-05-23 15:20:49 +0300693 struct ib_wq *wq;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694 u8 port_num;
695 } element;
696 enum ib_event_type event;
697};
698
699struct ib_event_handler {
700 struct ib_device *device;
701 void (*handler)(struct ib_event_handler *, struct ib_event *);
702 struct list_head list;
703};
704
/*
 * INIT_IB_EVENT_HANDLER - initialise a struct ib_event_handler.
 * @_ptr: handler to initialise.
 * @_device: device to store in the handler.
 * @_handler: callback to store in the handler.
 *
 * Also initialises the handler's list node. Every argument is
 * parenthesized in the expansion so that expression arguments are safe.
 */
#define INIT_IB_EVENT_HANDLER(_ptr, _device, _handler)		\
	do {							\
		(_ptr)->device  = (_device);			\
		(_ptr)->handler = (_handler);			\
		INIT_LIST_HEAD(&(_ptr)->list);			\
	} while (0)
711
712struct ib_global_route {
Jason Gunthorpe8d9ec9a2018-06-13 10:22:03 +0300713 const struct ib_gid_attr *sgid_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700714 union ib_gid dgid;
715 u32 flow_label;
716 u8 sgid_index;
717 u8 hop_limit;
718 u8 traffic_class;
719};
720
Hal Rosenstock513789e2005-07-27 11:45:34 -0700721struct ib_grh {
Sean Hefty97f52eb2005-08-13 21:05:57 -0700722 __be32 version_tclass_flow;
723 __be16 paylen;
Hal Rosenstock513789e2005-07-27 11:45:34 -0700724 u8 next_hdr;
725 u8 hop_limit;
726 union ib_gid sgid;
727 union ib_gid dgid;
728};
729
Somnath Koturc865f242015-12-23 14:56:51 +0200730union rdma_network_hdr {
731 struct ib_grh ibgrh;
732 struct {
733 /* The IB spec states that if it's IPv4, the header
734 * is located in the last 20 bytes of the header.
735 */
736 u8 reserved[20];
737 struct iphdr roce4grh;
738 };
739};
740
/* QP numbers are 24 bits wide. */
#define IB_QPN_MASK		0xFFFFFF

enum {
	IB_MULTICAST_QPN = 0xffffff
};

/* LID constants, stored big-endian. */
#define IB_LID_PERMISSIVE	cpu_to_be16(0xFFFF)
#define IB_MULTICAST_LID_BASE	cpu_to_be16(0xC000)
Sean Hefty97f52eb2005-08-13 21:05:57 -0700749
/* Address handle flags. */
enum ib_ah_flags {
	IB_AH_GRH	= 1
};
753
/*
 * Link rate encodings. The numeric values are not ordered by rate (for
 * example IB_RATE_5_GBPS is 5 but IB_RATE_10_GBPS is 3), so do not compare
 * them numerically; convert with ib_rate_to_mult() or ib_rate_to_mbps().
 */
enum ib_rate {
	IB_RATE_PORT_CURRENT = 0,
	IB_RATE_2_5_GBPS = 2,
	IB_RATE_5_GBPS   = 5,
	IB_RATE_10_GBPS  = 3,
	IB_RATE_20_GBPS  = 6,
	IB_RATE_30_GBPS  = 4,
	IB_RATE_40_GBPS  = 7,
	IB_RATE_60_GBPS  = 8,
	IB_RATE_80_GBPS  = 9,
	IB_RATE_120_GBPS = 10,
	IB_RATE_14_GBPS  = 11,
	IB_RATE_56_GBPS  = 12,
	IB_RATE_112_GBPS = 13,
	IB_RATE_168_GBPS = 14,
	IB_RATE_25_GBPS  = 15,
	IB_RATE_100_GBPS = 16,
	IB_RATE_200_GBPS = 17,
	IB_RATE_300_GBPS = 18,
	IB_RATE_28_GBPS  = 19,
	IB_RATE_50_GBPS  = 20,
	IB_RATE_400_GBPS = 21,
	IB_RATE_600_GBPS = 22,
};
778
779/**
780 * ib_rate_to_mult - Convert the IB rate enum to a multiple of the
781 * base rate of 2.5 Gbit/sec. For example, IB_RATE_5_GBPS will be
782 * converted to 2, since 5 Gbit/sec is 2 * 2.5 Gbit/sec.
783 * @rate: rate to convert.
784 */
Roland Dreier8385fd82014-06-04 10:00:16 -0700785__attribute_const__ int ib_rate_to_mult(enum ib_rate rate);
Jack Morgensteinbf6a9e32006-04-10 09:43:47 -0700786
787/**
Marcel Apfelbaum71eeba12011-10-05 14:21:47 +0300788 * ib_rate_to_mbps - Convert the IB rate enum to Mbps.
789 * For example, IB_RATE_2_5_GBPS will be converted to 2500.
790 * @rate: rate to convert.
791 */
Roland Dreier8385fd82014-06-04 10:00:16 -0700792__attribute_const__ int ib_rate_to_mbps(enum ib_rate rate);
Marcel Apfelbaum71eeba12011-10-05 14:21:47 +0300793
Sagi Grimberg17cd3a22014-02-23 14:19:04 +0200794
/**
 * enum ib_mr_type - memory region type
 * @IB_MR_TYPE_MEM_REG:       memory region that is used for
 *                            normal registration
 * @IB_MR_TYPE_SIGNATURE:     memory region that is used for
 *                            signature operations (data-integrity
 *                            capable regions)
 * @IB_MR_TYPE_SG_GAPS:       memory region that is capable to
 *                            register any arbitrary sg lists (without
 *                            the normal mr constraints - see
 *                            ib_map_mr_sg)
 */
enum ib_mr_type {
	IB_MR_TYPE_MEM_REG,
	IB_MR_TYPE_SIGNATURE,
	IB_MR_TYPE_SG_GAPS,
};
812
/**
 * enum ib_signature_type - Signature types
 * @IB_SIG_TYPE_NONE: Unprotected.
 * @IB_SIG_TYPE_T10_DIF: Type T10-DIF
 */
enum ib_signature_type {
	IB_SIG_TYPE_NONE,
	IB_SIG_TYPE_T10_DIF,
};
822
/**
 * enum ib_t10_dif_bg_type - Signature T10-DIF block-guard types
 * @IB_T10DIF_CRC: Corresponds to T10-PI mandated CRC checksum rules.
 * @IB_T10DIF_CSUM: Corresponds to IP checksum rules.
 */
enum ib_t10_dif_bg_type {
	IB_T10DIF_CRC,
	IB_T10DIF_CSUM
};
832
833/**
834 * struct ib_t10_dif_domain - Parameters specific for T10-DIF
835 * domain.
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200836 * @bg_type: T10-DIF block guard type (CRC|CSUM)
837 * @pi_interval: protection information interval.
838 * @bg: seed of guard computation.
839 * @app_tag: application tag of guard block
840 * @ref_tag: initial guard block reference tag.
Sagi Grimberg78eda2b2014-08-13 19:54:35 +0300841 * @ref_remap: Indicate wethear the reftag increments each block
842 * @app_escape: Indicate to skip block check if apptag=0xffff
843 * @ref_escape: Indicate to skip block check if reftag=0xffffffff
844 * @apptag_check_mask: check bitmask of application tag.
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200845 */
846struct ib_t10_dif_domain {
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200847 enum ib_t10_dif_bg_type bg_type;
848 u16 pi_interval;
849 u16 bg;
850 u16 app_tag;
851 u32 ref_tag;
Sagi Grimberg78eda2b2014-08-13 19:54:35 +0300852 bool ref_remap;
853 bool app_escape;
854 bool ref_escape;
855 u16 apptag_check_mask;
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200856};
857
858/**
859 * struct ib_sig_domain - Parameters for signature domain
860 * @sig_type: specific signauture type
861 * @sig: union of all signature domain attributes that may
862 * be used to set domain layout.
863 */
864struct ib_sig_domain {
865 enum ib_signature_type sig_type;
866 union {
867 struct ib_t10_dif_domain dif;
868 } sig;
869};
870
871/**
872 * struct ib_sig_attrs - Parameters for signature handover operation
873 * @check_mask: bitmask for signature byte check (8 bytes)
874 * @mem: memory domain layout desciptor.
875 * @wire: wire domain layout desciptor.
876 */
877struct ib_sig_attrs {
878 u8 check_mask;
879 struct ib_sig_domain mem;
880 struct ib_sig_domain wire;
881};
882
/* Which signature field mismatched: guard, reference tag or application tag. */
enum ib_sig_err_type {
	IB_SIG_BAD_GUARD,
	IB_SIG_BAD_REFTAG,
	IB_SIG_BAD_APPTAG,
};
888
/**
 * Signature check masks (8 bytes in total) according to the T10-PI standard:
 *  -------- -------- ------------
 * | GUARD  | APPTAG |   REFTAG   |
 * |  2B    |  2B    |    4B      |
 *  -------- -------- ------------
 *
 * One mask bit per protected byte: two bits for the guard, two for the
 * application tag and four for the reference tag.
 */
enum {
	IB_SIG_CHECK_GUARD	= 0xc0,
	IB_SIG_CHECK_APPTAG	= 0x30,
	IB_SIG_CHECK_REFTAG	= 0x0f,
};
901
902/**
Sagi Grimberg1b01d332014-02-23 14:19:05 +0200903 * struct ib_sig_err - signature error descriptor
904 */
905struct ib_sig_err {
906 enum ib_sig_err_type err_type;
907 u32 expected;
908 u32 actual;
909 u64 sig_err_offset;
910 u32 key;
911};
912
/* Bits selecting which memory-region status checks are meant. */
enum ib_mr_status_check {
	IB_MR_CHECK_SIG_STATUS = 1,
};
916
917/**
918 * struct ib_mr_status - Memory region status container
919 *
920 * @fail_status: Bitmask of MR checks status. For each
921 * failed check a corresponding status bit is set.
922 * @sig_err: Additional info for IB_MR_CEHCK_SIG_STATUS
923 * failure.
924 */
925struct ib_mr_status {
926 u32 fail_status;
927 struct ib_sig_err sig_err;
928};
929
Marcel Apfelbaum71eeba12011-10-05 14:21:47 +0300930/**
Jack Morgensteinbf6a9e32006-04-10 09:43:47 -0700931 * mult_to_ib_rate - Convert a multiple of 2.5 Gbit/sec to an IB rate
932 * enum.
933 * @mult: multiple to convert.
934 */
Roland Dreier8385fd82014-06-04 10:00:16 -0700935__attribute_const__ enum ib_rate mult_to_ib_rate(int mult);
Jack Morgensteinbf6a9e32006-04-10 09:43:47 -0700936
/*
 * Discriminator for the per-transport union in struct rdma_ah_attr.
 * RDMA_AH_ATTR_TYPE_UNDEFINED is the zero value.
 */
enum rdma_ah_attr_type {
	RDMA_AH_ATTR_TYPE_UNDEFINED,
	RDMA_AH_ATTR_TYPE_IB,
	RDMA_AH_ATTR_TYPE_ROCE,
	RDMA_AH_ATTR_TYPE_OPA,
};
943
944struct ib_ah_attr {
945 u16 dlid;
946 u8 src_path_bits;
947};
948
949struct roce_ah_attr {
950 u8 dmac[ETH_ALEN];
951};
952
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -0400953struct opa_ah_attr {
954 u32 dlid;
955 u8 src_path_bits;
Don Hiattd98bb7f2017-08-04 13:54:16 -0700956 bool make_grd;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -0400957};
958
Dasaratharaman Chandramouli90898852017-04-29 14:41:18 -0400959struct rdma_ah_attr {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700960 struct ib_global_route grh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700961 u8 sl;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700962 u8 static_rate;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700963 u8 port_num;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -0400964 u8 ah_flags;
965 enum rdma_ah_attr_type type;
966 union {
967 struct ib_ah_attr ib;
968 struct roce_ah_attr roce;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -0400969 struct opa_ah_attr opa;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -0400970 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700971};
972
/*
 * enum ib_wc_status - work completion status codes.
 * IB_WC_SUCCESS is zero; every other value names an error.
 */
enum ib_wc_status {
	IB_WC_SUCCESS,
	IB_WC_LOC_LEN_ERR,
	IB_WC_LOC_QP_OP_ERR,
	IB_WC_LOC_EEC_OP_ERR,
	IB_WC_LOC_PROT_ERR,
	IB_WC_WR_FLUSH_ERR,
	IB_WC_MW_BIND_ERR,
	IB_WC_BAD_RESP_ERR,
	IB_WC_LOC_ACCESS_ERR,
	IB_WC_REM_INV_REQ_ERR,
	IB_WC_REM_ACCESS_ERR,
	IB_WC_REM_OP_ERR,
	IB_WC_RETRY_EXC_ERR,
	IB_WC_RNR_RETRY_EXC_ERR,
	IB_WC_LOC_RDD_VIOL_ERR,
	IB_WC_REM_INV_RD_REQ_ERR,
	IB_WC_REM_ABORT_ERR,
	IB_WC_INV_EECN_ERR,
	IB_WC_INV_EEC_STATE_ERR,
	IB_WC_FATAL_ERR,
	IB_WC_RESP_TIMEOUT_ERR,
	IB_WC_GENERAL_ERR
};
997
Bart Van Asschedb7489e2015-08-03 10:01:52 -0700998const char *__attribute_const__ ib_wc_status_msg(enum ib_wc_status status);
Sagi Grimberg2b1b5b62015-05-18 13:40:28 +0300999
/* enum ib_wc_opcode - operation that a work completion refers to. */
enum ib_wc_opcode {
	IB_WC_SEND,
	IB_WC_RDMA_WRITE,
	IB_WC_RDMA_READ,
	IB_WC_COMP_SWAP,
	IB_WC_FETCH_ADD,
	IB_WC_LSO,
	IB_WC_LOCAL_INV,
	IB_WC_REG_MR,
	IB_WC_MASKED_COMP_SWAP,
	IB_WC_MASKED_FETCH_ADD,
/*
 * Set value of IB_WC_RECV so consumers can test if a completion is a
 * receive by testing (opcode & IB_WC_RECV).
 */
	IB_WC_RECV			= 1 << 7,
	IB_WC_RECV_RDMA_WITH_IMM
};
1018
/* Single-bit flags for the wc_flags member of struct ib_wc. */
enum ib_wc_flags {
	IB_WC_GRH		= 1,
	IB_WC_WITH_IMM		= (1<<1),
	IB_WC_WITH_INVALIDATE	= (1<<2),
	IB_WC_IP_CSUM_OK	= (1<<3),
	IB_WC_WITH_SMAC		= (1<<4),
	IB_WC_WITH_VLAN		= (1<<5),
	IB_WC_WITH_NETWORK_HDR_TYPE	= (1<<6),
};
1028
1029struct ib_wc {
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001030 union {
1031 u64 wr_id;
1032 struct ib_cqe *wr_cqe;
1033 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07001034 enum ib_wc_status status;
1035 enum ib_wc_opcode opcode;
1036 u32 vendor_err;
1037 u32 byte_len;
Michael S. Tsirkin062dbb62006-12-31 21:09:42 +02001038 struct ib_qp *qp;
Steve Wise00f7ec32008-07-14 23:48:45 -07001039 union {
1040 __be32 imm_data;
1041 u32 invalidate_rkey;
1042 } ex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043 u32 src_qp;
Bodong Wangcd2a6e72018-01-12 07:58:41 +02001044 u32 slid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001045 int wc_flags;
1046 u16 pkey_index;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001047 u8 sl;
1048 u8 dlid_path_bits;
1049 u8 port_num; /* valid only for DR SMPs on switches */
Matan Barakdd5f03b2013-12-12 18:03:11 +02001050 u8 smac[ETH_ALEN];
1051 u16 vlan_id;
Somnath Koturc865f242015-12-23 14:56:51 +02001052 u8 network_hdr_type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053};
1054
/*
 * Flags for requesting CQ notification.  IB_CQ_SOLICITED_MASK is the OR
 * of the two notification-type bits.
 */
enum ib_cq_notify_flags {
	IB_CQ_SOLICITED			= 1 << 0,
	IB_CQ_NEXT_COMP			= 1 << 1,
	IB_CQ_SOLICITED_MASK		= IB_CQ_SOLICITED | IB_CQ_NEXT_COMP,
	IB_CQ_REPORT_MISSED_EVENTS	= 1 << 2,
};
1061
/* enum ib_srq_type - kinds of shared receive queue. */
enum ib_srq_type {
	IB_SRQT_BASIC,
	IB_SRQT_XRC,
	IB_SRQT_TM,
};

/*
 * ib_srq_has_cq - report whether an SRQ of the given type has a CQ.
 * @srq_type: SRQ type to test
 *
 * Returns true for IB_SRQT_XRC and IB_SRQT_TM, false for anything else
 * (including IB_SRQT_BASIC).
 */
static inline bool ib_srq_has_cq(enum ib_srq_type srq_type)
{
	return srq_type == IB_SRQT_XRC ||
	       srq_type == IB_SRQT_TM;
}
1073
/* Bits naming SRQ attributes (max_wr, srq_limit). */
enum ib_srq_attr_mask {
	IB_SRQ_MAX_WR	= 1 << 0,
	IB_SRQ_LIMIT	= 1 << 1,
};
1078
1079struct ib_srq_attr {
1080 u32 max_wr;
1081 u32 max_sge;
1082 u32 srq_limit;
1083};
1084
1085struct ib_srq_init_attr {
1086 void (*event_handler)(struct ib_event *, void *);
1087 void *srq_context;
1088 struct ib_srq_attr attr;
Sean Hefty96104ed2011-05-23 16:31:36 -07001089 enum ib_srq_type srq_type;
Sean Hefty418d5132011-05-23 19:42:29 -07001090
Artemy Kovalyov1a56ff62017-08-17 15:52:04 +03001091 struct {
1092 struct ib_cq *cq;
1093 union {
1094 struct {
1095 struct ib_xrcd *xrcd;
1096 } xrc;
Artemy Kovalyov9c2c8492017-08-17 15:52:05 +03001097
1098 struct {
1099 u32 max_num_tags;
1100 } tag_matching;
Artemy Kovalyov1a56ff62017-08-17 15:52:04 +03001101 };
Sean Hefty418d5132011-05-23 19:42:29 -07001102 } ext;
Roland Dreierd41fcc62005-08-18 12:23:08 -07001103};
1104
Linus Torvalds1da177e2005-04-16 15:20:36 -07001105struct ib_qp_cap {
1106 u32 max_send_wr;
1107 u32 max_recv_wr;
1108 u32 max_send_sge;
1109 u32 max_recv_sge;
1110 u32 max_inline_data;
Christoph Hellwiga060b562016-05-03 18:01:09 +02001111
1112 /*
1113 * Maximum number of rdma_rw_ctx structures in flight at a time.
1114 * ib_create_qp() will calculate the right amount of neededed WRs
1115 * and MRs based on this.
1116 */
1117 u32 max_rdma_ctxs;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001118};
1119
/* Values for the sq_sig_type member of struct ib_qp_init_attr. */
enum ib_sig_type {
	IB_SIGNAL_ALL_WR,
	IB_SIGNAL_REQ_WR
};
1124
/*
 * enum ib_qp_type - queue pair types.
 *
 * Value 7 is unassigned: IB_QPT_RAW_ETHERTYPE is 6 and
 * IB_QPT_RAW_PACKET is explicitly 8.
 */
enum ib_qp_type {
	/*
	 * IB_QPT_SMI and IB_QPT_GSI have to be the first two entries
	 * here (and in that order) since the MAD layer uses them as
	 * indices into a 2-entry table.
	 */
	IB_QPT_SMI,
	IB_QPT_GSI,

	IB_QPT_RC,
	IB_QPT_UC,
	IB_QPT_UD,
	IB_QPT_RAW_IPV6,
	IB_QPT_RAW_ETHERTYPE,
	IB_QPT_RAW_PACKET = 8,
	IB_QPT_XRC_INI = 9,
	IB_QPT_XRC_TGT,
	IB_QPT_MAX,
	IB_QPT_DRIVER = 0xFF,
	/* Reserve a range for qp types internal to the low level driver.
	 * These qp types will not be visible at the IB core layer, so the
	 * IB_QPT_MAX usages should not be affected in the core layer
	 */
	IB_QPT_RESERVED1 = 0x1000,
	IB_QPT_RESERVED2,
	IB_QPT_RESERVED3,
	IB_QPT_RESERVED4,
	IB_QPT_RESERVED5,
	IB_QPT_RESERVED6,
	IB_QPT_RESERVED7,
	IB_QPT_RESERVED8,
	IB_QPT_RESERVED9,
	IB_QPT_RESERVED10,
};
1159
/*
 * enum ib_qp_create_flags - bits for the create_flags member of
 * struct ib_qp_init_attr.  Bit 7 is currently unassigned.
 */
enum ib_qp_create_flags {
	IB_QP_CREATE_IPOIB_UD_LSO		= 1 << 0,
	IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK	= 1 << 1,
	IB_QP_CREATE_CROSS_CHANNEL              = 1 << 2,
	IB_QP_CREATE_MANAGED_SEND               = 1 << 3,
	IB_QP_CREATE_MANAGED_RECV               = 1 << 4,
	IB_QP_CREATE_NETIF_QP			= 1 << 5,
	IB_QP_CREATE_SIGNATURE_EN		= 1 << 6,
	/* FREE					= 1 << 7, */
	IB_QP_CREATE_SCATTER_FCS		= 1 << 8,
	IB_QP_CREATE_CVLAN_STRIPPING		= 1 << 9,
	IB_QP_CREATE_SOURCE_QPN			= 1 << 10,
	IB_QP_CREATE_PCI_WRITE_END_PADDING	= 1 << 11,
	/* reserve bits 26-31 for low level drivers' internal use */
	IB_QP_CREATE_RESERVED_START		= 1 << 26,
	IB_QP_CREATE_RESERVED_END		= 1 << 31,
};
1177
Yishai Hadas73c40c62013-08-01 18:49:53 +03001178/*
1179 * Note: users may not call ib_close_qp or ib_destroy_qp from the event_handler
1180 * callback to destroy the passed in QP.
1181 */
1182
Linus Torvalds1da177e2005-04-16 15:20:36 -07001183struct ib_qp_init_attr {
Chuck Levereb93c82e2018-09-04 11:45:20 -04001184 /* Consumer's event_handler callback must not block */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001185 void (*event_handler)(struct ib_event *, void *);
Chuck Levereb93c82e2018-09-04 11:45:20 -04001186
Linus Torvalds1da177e2005-04-16 15:20:36 -07001187 void *qp_context;
1188 struct ib_cq *send_cq;
1189 struct ib_cq *recv_cq;
1190 struct ib_srq *srq;
Sean Heftyb42b63c2011-05-23 19:59:25 -07001191 struct ib_xrcd *xrcd; /* XRC TGT QPs only */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001192 struct ib_qp_cap cap;
1193 enum ib_sig_type sq_sig_type;
1194 enum ib_qp_type qp_type;
Nathan Chancellorb56511c2018-09-24 12:57:16 -07001195 u32 create_flags;
Christoph Hellwiga060b562016-05-03 18:01:09 +02001196
1197 /*
1198 * Only needed for special QP types, or when using the RW API.
1199 */
1200 u8 port_num;
Yishai Hadasa9017e22016-05-23 15:20:54 +03001201 struct ib_rwq_ind_table *rwq_ind_tbl;
Yishai Hadas02984cc2017-06-08 16:15:06 +03001202 u32 source_qpn;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001203};
1204
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07001205struct ib_qp_open_attr {
1206 void (*event_handler)(struct ib_event *, void *);
1207 void *qp_context;
1208 u32 qp_num;
1209 enum ib_qp_type qp_type;
1210};
1211
/*
 * enum ib_rnr_timeout - RNR timer encodings (values 0..31).
 *
 * The digits in each name are the timer duration; note that encoding 0
 * is the longest one (IB_RNR_TIMER_655_36), not the shortest.
 */
enum ib_rnr_timeout {
	IB_RNR_TIMER_655_36 =  0,
	IB_RNR_TIMER_000_01 =  1,
	IB_RNR_TIMER_000_02 =  2,
	IB_RNR_TIMER_000_03 =  3,
	IB_RNR_TIMER_000_04 =  4,
	IB_RNR_TIMER_000_06 =  5,
	IB_RNR_TIMER_000_08 =  6,
	IB_RNR_TIMER_000_12 =  7,
	IB_RNR_TIMER_000_16 =  8,
	IB_RNR_TIMER_000_24 =  9,
	IB_RNR_TIMER_000_32 = 10,
	IB_RNR_TIMER_000_48 = 11,
	IB_RNR_TIMER_000_64 = 12,
	IB_RNR_TIMER_000_96 = 13,
	IB_RNR_TIMER_001_28 = 14,
	IB_RNR_TIMER_001_92 = 15,
	IB_RNR_TIMER_002_56 = 16,
	IB_RNR_TIMER_003_84 = 17,
	IB_RNR_TIMER_005_12 = 18,
	IB_RNR_TIMER_007_68 = 19,
	IB_RNR_TIMER_010_24 = 20,
	IB_RNR_TIMER_015_36 = 21,
	IB_RNR_TIMER_020_48 = 22,
	IB_RNR_TIMER_030_72 = 23,
	IB_RNR_TIMER_040_96 = 24,
	IB_RNR_TIMER_061_44 = 25,
	IB_RNR_TIMER_081_92 = 26,
	IB_RNR_TIMER_122_88 = 27,
	IB_RNR_TIMER_163_84 = 28,
	IB_RNR_TIMER_245_76 = 29,
	IB_RNR_TIMER_327_68 = 30,
	IB_RNR_TIMER_491_52 = 31
};
1246
/* enum ib_qp_attr_mask - one bit per QP attribute (bits 0..25). */
enum ib_qp_attr_mask {
	IB_QP_STATE			= 1,
	IB_QP_CUR_STATE			= (1<<1),
	IB_QP_EN_SQD_ASYNC_NOTIFY	= (1<<2),
	IB_QP_ACCESS_FLAGS		= (1<<3),
	IB_QP_PKEY_INDEX		= (1<<4),
	IB_QP_PORT			= (1<<5),
	IB_QP_QKEY			= (1<<6),
	IB_QP_AV			= (1<<7),
	IB_QP_PATH_MTU			= (1<<8),
	IB_QP_TIMEOUT			= (1<<9),
	IB_QP_RETRY_CNT			= (1<<10),
	IB_QP_RNR_RETRY			= (1<<11),
	IB_QP_RQ_PSN			= (1<<12),
	IB_QP_MAX_QP_RD_ATOMIC		= (1<<13),
	IB_QP_ALT_PATH			= (1<<14),
	IB_QP_MIN_RNR_TIMER		= (1<<15),
	IB_QP_SQ_PSN			= (1<<16),
	IB_QP_MAX_DEST_RD_ATOMIC	= (1<<17),
	IB_QP_PATH_MIG_STATE		= (1<<18),
	IB_QP_CAP			= (1<<19),
	IB_QP_DEST_QPN			= (1<<20),
	IB_QP_RESERVED1			= (1<<21),
	IB_QP_RESERVED2			= (1<<22),
	IB_QP_RESERVED3			= (1<<23),
	IB_QP_RESERVED4			= (1<<24),
	IB_QP_RATE_LIMIT		= (1<<25),
};
1275
/* enum ib_qp_state - QP states; IB_QPS_RESET is zero. */
enum ib_qp_state {
	IB_QPS_RESET,
	IB_QPS_INIT,
	IB_QPS_RTR,
	IB_QPS_RTS,
	IB_QPS_SQD,
	IB_QPS_SQE,
	IB_QPS_ERR
};
1285
/* Values for the path_mig_state member of struct ib_qp_attr. */
enum ib_mig_state {
	IB_MIG_MIGRATED,
	IB_MIG_REARM,
	IB_MIG_ARMED
};
1291
/* Memory window types; numbering starts at 1, so 0 is not a valid type. */
enum ib_mw_type {
	IB_MW_TYPE_1 = 1,
	IB_MW_TYPE_2 = 2
};
1296
Linus Torvalds1da177e2005-04-16 15:20:36 -07001297struct ib_qp_attr {
1298 enum ib_qp_state qp_state;
1299 enum ib_qp_state cur_qp_state;
1300 enum ib_mtu path_mtu;
1301 enum ib_mig_state path_mig_state;
1302 u32 qkey;
1303 u32 rq_psn;
1304 u32 sq_psn;
1305 u32 dest_qp_num;
1306 int qp_access_flags;
1307 struct ib_qp_cap cap;
Dasaratharaman Chandramouli90898852017-04-29 14:41:18 -04001308 struct rdma_ah_attr ah_attr;
1309 struct rdma_ah_attr alt_ah_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310 u16 pkey_index;
1311 u16 alt_pkey_index;
1312 u8 en_sqd_async_notify;
1313 u8 sq_draining;
1314 u8 max_rd_atomic;
1315 u8 max_dest_rd_atomic;
1316 u8 min_rnr_timer;
1317 u8 port_num;
1318 u8 timeout;
1319 u8 retry_cnt;
1320 u8 rnr_retry;
1321 u8 alt_port_num;
1322 u8 alt_timeout;
Bodong Wang528e5a12016-12-01 13:43:14 +02001323 u32 rate_limit;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324};
1325
1326enum ib_wr_opcode {
Jason Gunthorpe9a597392018-08-14 15:33:02 -07001327 /* These are shared with userspace */
1328 IB_WR_RDMA_WRITE = IB_UVERBS_WR_RDMA_WRITE,
1329 IB_WR_RDMA_WRITE_WITH_IMM = IB_UVERBS_WR_RDMA_WRITE_WITH_IMM,
1330 IB_WR_SEND = IB_UVERBS_WR_SEND,
1331 IB_WR_SEND_WITH_IMM = IB_UVERBS_WR_SEND_WITH_IMM,
1332 IB_WR_RDMA_READ = IB_UVERBS_WR_RDMA_READ,
1333 IB_WR_ATOMIC_CMP_AND_SWP = IB_UVERBS_WR_ATOMIC_CMP_AND_SWP,
1334 IB_WR_ATOMIC_FETCH_AND_ADD = IB_UVERBS_WR_ATOMIC_FETCH_AND_ADD,
1335 IB_WR_LSO = IB_UVERBS_WR_TSO,
1336 IB_WR_SEND_WITH_INV = IB_UVERBS_WR_SEND_WITH_INV,
1337 IB_WR_RDMA_READ_WITH_INV = IB_UVERBS_WR_RDMA_READ_WITH_INV,
1338 IB_WR_LOCAL_INV = IB_UVERBS_WR_LOCAL_INV,
1339 IB_WR_MASKED_ATOMIC_CMP_AND_SWP =
1340 IB_UVERBS_WR_MASKED_ATOMIC_CMP_AND_SWP,
1341 IB_WR_MASKED_ATOMIC_FETCH_AND_ADD =
1342 IB_UVERBS_WR_MASKED_ATOMIC_FETCH_AND_ADD,
1343
1344 /* These are kernel only and can not be issued by userspace */
1345 IB_WR_REG_MR = 0x20,
Sagi Grimberg1b01d332014-02-23 14:19:05 +02001346 IB_WR_REG_SIG_MR,
Jason Gunthorpe9a597392018-08-14 15:33:02 -07001347
Jack Morgenstein0134f162013-07-07 17:25:52 +03001348 /* reserve values for low level drivers' internal use.
1349 * These values will not be used at all in the ib core layer.
1350 */
1351 IB_WR_RESERVED1 = 0xf0,
1352 IB_WR_RESERVED2,
1353 IB_WR_RESERVED3,
1354 IB_WR_RESERVED4,
1355 IB_WR_RESERVED5,
1356 IB_WR_RESERVED6,
1357 IB_WR_RESERVED7,
1358 IB_WR_RESERVED8,
1359 IB_WR_RESERVED9,
1360 IB_WR_RESERVED10,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001361};
1362
/* Bits for the send_flags member of struct ib_send_wr. */
enum ib_send_flags {
	IB_SEND_FENCE		= 1,
	IB_SEND_SIGNALED	= (1<<1),
	IB_SEND_SOLICITED	= (1<<2),
	IB_SEND_INLINE		= (1<<3),
	IB_SEND_IP_CSUM		= (1<<4),

	/* reserve bits 26-31 for low level drivers' internal use */
	IB_SEND_RESERVED_START	= (1 << 26),
	IB_SEND_RESERVED_END	= (1 << 31),
};
1374
1375struct ib_sge {
1376 u64 addr;
1377 u32 length;
1378 u32 lkey;
1379};
1380
/*
 * struct ib_cqe - completion callback holder.
 * @done: function taking the CQ and the work completion.
 */
struct ib_cqe {
	void (*done)(struct ib_cq *cq, struct ib_wc *wc);
};
1384
Linus Torvalds1da177e2005-04-16 15:20:36 -07001385struct ib_send_wr {
1386 struct ib_send_wr *next;
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001387 union {
1388 u64 wr_id;
1389 struct ib_cqe *wr_cqe;
1390 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07001391 struct ib_sge *sg_list;
1392 int num_sge;
1393 enum ib_wr_opcode opcode;
1394 int send_flags;
Roland Dreier0f39cf32008-04-16 21:09:32 -07001395 union {
1396 __be32 imm_data;
1397 u32 invalidate_rkey;
1398 } ex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001399};
1400
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001401struct ib_rdma_wr {
1402 struct ib_send_wr wr;
1403 u64 remote_addr;
1404 u32 rkey;
1405};
1406
Bart Van Asschef696bf62018-07-18 09:25:14 -07001407static inline const struct ib_rdma_wr *rdma_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001408{
1409 return container_of(wr, struct ib_rdma_wr, wr);
1410}
1411
1412struct ib_atomic_wr {
1413 struct ib_send_wr wr;
1414 u64 remote_addr;
1415 u64 compare_add;
1416 u64 swap;
1417 u64 compare_add_mask;
1418 u64 swap_mask;
1419 u32 rkey;
1420};
1421
Bart Van Asschef696bf62018-07-18 09:25:14 -07001422static inline const struct ib_atomic_wr *atomic_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001423{
1424 return container_of(wr, struct ib_atomic_wr, wr);
1425}
1426
1427struct ib_ud_wr {
1428 struct ib_send_wr wr;
1429 struct ib_ah *ah;
1430 void *header;
1431 int hlen;
1432 int mss;
1433 u32 remote_qpn;
1434 u32 remote_qkey;
1435 u16 pkey_index; /* valid for GSI only */
1436 u8 port_num; /* valid for DR SMPs on switch only */
1437};
1438
Bart Van Asschef696bf62018-07-18 09:25:14 -07001439static inline const struct ib_ud_wr *ud_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001440{
1441 return container_of(wr, struct ib_ud_wr, wr);
1442}
1443
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001444struct ib_reg_wr {
1445 struct ib_send_wr wr;
1446 struct ib_mr *mr;
1447 u32 key;
1448 int access;
1449};
1450
Bart Van Asschef696bf62018-07-18 09:25:14 -07001451static inline const struct ib_reg_wr *reg_wr(const struct ib_send_wr *wr)
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001452{
1453 return container_of(wr, struct ib_reg_wr, wr);
1454}
1455
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001456struct ib_sig_handover_wr {
1457 struct ib_send_wr wr;
1458 struct ib_sig_attrs *sig_attrs;
1459 struct ib_mr *sig_mr;
1460 int access_flags;
1461 struct ib_sge *prot;
1462};
1463
Bart Van Asschef696bf62018-07-18 09:25:14 -07001464static inline const struct ib_sig_handover_wr *
1465sig_handover_wr(const struct ib_send_wr *wr)
Christoph Hellwige622f2f2015-10-08 09:16:33 +01001466{
1467 return container_of(wr, struct ib_sig_handover_wr, wr);
1468}
1469
Linus Torvalds1da177e2005-04-16 15:20:36 -07001470struct ib_recv_wr {
1471 struct ib_recv_wr *next;
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001472 union {
1473 u64 wr_id;
1474 struct ib_cqe *wr_cqe;
1475 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07001476 struct ib_sge *sg_list;
1477 int num_sge;
1478};
1479
1480enum ib_access_flags {
Jason Gunthorpe4fca0372018-07-11 16:20:44 -06001481 IB_ACCESS_LOCAL_WRITE = IB_UVERBS_ACCESS_LOCAL_WRITE,
1482 IB_ACCESS_REMOTE_WRITE = IB_UVERBS_ACCESS_REMOTE_WRITE,
1483 IB_ACCESS_REMOTE_READ = IB_UVERBS_ACCESS_REMOTE_READ,
1484 IB_ACCESS_REMOTE_ATOMIC = IB_UVERBS_ACCESS_REMOTE_ATOMIC,
1485 IB_ACCESS_MW_BIND = IB_UVERBS_ACCESS_MW_BIND,
1486 IB_ZERO_BASED = IB_UVERBS_ACCESS_ZERO_BASED,
1487 IB_ACCESS_ON_DEMAND = IB_UVERBS_ACCESS_ON_DEMAND,
1488 IB_ACCESS_HUGETLB = IB_UVERBS_ACCESS_HUGETLB,
1489
1490 IB_ACCESS_SUPPORTED = ((IB_ACCESS_HUGETLB << 1) - 1)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001491};
1492
/*
 * XXX: these are apparently used for ->rereg_user_mr, no idea why they
 * are hidden here instead of a uapi header!
 *
 * IB_MR_REREG_SUPPORTED is the OR of all three flag bits.
 */
enum ib_mr_rereg_flags {
	IB_MR_REREG_TRANS	= 1,
	IB_MR_REREG_PD		= (1<<1),
	IB_MR_REREG_ACCESS	= (1<<2),
	IB_MR_REREG_SUPPORTED	= ((IB_MR_REREG_ACCESS << 1) - 1)
};
1503
Linus Torvalds1da177e2005-04-16 15:20:36 -07001504struct ib_fmr_attr {
1505 int max_pages;
1506 int max_maps;
Or Gerlitzd36f34a2006-02-02 10:43:45 -08001507 u8 page_shift;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001508};
1509
/* Forward declaration; only pointers to struct ib_umem are needed here. */
struct ib_umem;
1511
/* enum rdma_remove_reason - why a uobject is being removed. */
enum rdma_remove_reason {
	/*
	 * Userspace requested uobject deletion or initial try
	 * to remove uobject via cleanup. Call could fail
	 */
	RDMA_REMOVE_DESTROY,
	/* Context deletion. This call should delete the actual object itself */
	RDMA_REMOVE_CLOSE,
	/* Driver is being hot-unplugged. This call should delete the actual object itself */
	RDMA_REMOVE_DRIVER_REMOVE,
	/* uobj is being cleaned-up before being committed */
	RDMA_REMOVE_ABORT,
};
1525
/*
 * struct ib_rdmacg_object - rdma cgroup ownership record.
 *
 * Has no members at all unless CONFIG_CGROUP_RDMA is defined.
 */
struct ib_rdmacg_object {
#ifdef CONFIG_CGROUP_RDMA
	struct rdma_cgroup	*cg;		/* owner rdma cgroup */
#endif
};
1531
Roland Dreiere2773c02005-07-07 17:57:10 -07001532struct ib_ucontext {
1533 struct ib_device *device;
Matan Barak771addf2017-04-04 13:31:41 +03001534 struct ib_uverbs_file *ufile;
Jason Gunthorpee9517472018-07-10 20:55:19 -06001535 /*
1536 * 'closing' can be read by the driver only during a destroy callback,
1537 * it is set when we are closing the file descriptor and indicates
1538 * that mm_sem may be locked.
1539 */
Leon Romanovsky6ceb6332018-09-03 20:18:03 +03001540 bool closing;
Shachar Raindel8ada2c12014-12-11 17:04:17 +02001541
Yishai Hadas1c774832018-06-20 17:11:39 +03001542 bool cleanup_retryable;
Matan Barak38321252017-04-04 13:31:42 +03001543
Jason Gunthorpeb5231b02018-09-16 20:48:04 +03001544 void (*invalidate_range)(struct ib_umem_odp *umem_odp,
Haggai Eran882214e2014-12-11 17:04:18 +02001545 unsigned long start, unsigned long end);
Jason Gunthorpef27a0d52018-09-16 20:48:08 +03001546 struct mutex per_mm_list_lock;
1547 struct list_head per_mm_list;
Parav Pandit43579b52017-01-10 00:02:14 +00001548
1549 struct ib_rdmacg_object cg_obj;
Leon Romanovsky60615212018-11-28 13:16:43 +02001550 /*
1551 * Implementation details of the RDMA core, don't use in drivers:
1552 */
1553 struct rdma_restrack_entry res;
Roland Dreiere2773c02005-07-07 17:57:10 -07001554};
1555
1556struct ib_uobject {
1557 u64 user_handle; /* handle given to us by userspace */
Jason Gunthorpe6a5e9c82018-07-04 11:32:07 +03001558 /* ufile & ucontext owning this object */
1559 struct ib_uverbs_file *ufile;
1560 /* FIXME, save memory: ufile->context == context */
Roland Dreiere2773c02005-07-07 17:57:10 -07001561 struct ib_ucontext *context; /* associated user context */
Roland Dreier9ead1902006-06-17 20:44:49 -07001562 void *object; /* containing object */
Roland Dreiere2773c02005-07-07 17:57:10 -07001563 struct list_head list; /* link to context's list */
Parav Pandit43579b52017-01-10 00:02:14 +00001564 struct ib_rdmacg_object cg_obj; /* rdmacg object */
Roland Dreierb3d636b2008-04-16 21:01:06 -07001565 int id; /* index into kernel idr */
Roland Dreier9ead1902006-06-17 20:44:49 -07001566 struct kref ref;
Matan Barak38321252017-04-04 13:31:42 +03001567 atomic_t usecnt; /* protects exclusive access */
Mike Marciniszynd144da82015-11-02 12:13:25 -05001568 struct rcu_head rcu; /* kfree_rcu() overhead */
Matan Barak38321252017-04-04 13:31:42 +03001569
Jason Gunthorpe6b0d08f2018-08-09 20:14:37 -06001570 const struct uverbs_api_object *uapi_object;
Roland Dreiere2773c02005-07-07 17:57:10 -07001571};
1572
Roland Dreiere2773c02005-07-07 17:57:10 -07001573struct ib_udata {
Yann Droneaud309243e2013-12-11 23:01:44 +01001574 const void __user *inbuf;
Roland Dreiere2773c02005-07-07 17:57:10 -07001575 void __user *outbuf;
1576 size_t inlen;
1577 size_t outlen;
1578};
1579
Linus Torvalds1da177e2005-04-16 15:20:36 -07001580struct ib_pd {
Jason Gunthorpe96249d72015-08-05 14:14:45 -06001581 u32 local_dma_lkey;
Christoph Hellwiged082d32016-09-05 12:56:17 +02001582 u32 flags;
Roland Dreiere2773c02005-07-07 17:57:10 -07001583 struct ib_device *device;
1584 struct ib_uobject *uobject;
1585 atomic_t usecnt; /* count all resources */
Christoph Hellwig50d46332016-09-05 12:56:16 +02001586
Christoph Hellwiged082d32016-09-05 12:56:17 +02001587 u32 unsafe_global_rkey;
1588
Christoph Hellwig50d46332016-09-05 12:56:16 +02001589 /*
1590 * Implementation details of the RDMA core, don't use in drivers:
1591 */
1592 struct ib_mr *__internal_mr;
Leon Romanovsky02d88832018-01-28 11:17:20 +02001593 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001594};
1595
Sean Hefty59991f92011-05-23 17:52:46 -07001596struct ib_xrcd {
1597 struct ib_device *device;
Sean Heftyd3d72d92011-05-26 23:06:44 -07001598 atomic_t usecnt; /* count all exposed resources */
Sean Hefty53d0bd12011-05-24 08:33:46 -07001599 struct inode *inode;
Sean Heftyd3d72d92011-05-26 23:06:44 -07001600
1601 struct mutex tgt_qp_mutex;
1602 struct list_head tgt_qp_list;
Sean Hefty59991f92011-05-23 17:52:46 -07001603};
1604
Linus Torvalds1da177e2005-04-16 15:20:36 -07001605struct ib_ah {
1606 struct ib_device *device;
1607 struct ib_pd *pd;
Roland Dreiere2773c02005-07-07 17:57:10 -07001608 struct ib_uobject *uobject;
Jason Gunthorpe1a1f4602018-06-13 10:22:08 +03001609 const struct ib_gid_attr *sgid_attr;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04001610 enum rdma_ah_attr_type type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001611};
1612
/* Callback type taking a CQ and the opaque context pointer stored with it. */
typedef void (*ib_comp_handler)(struct ib_cq *cq, void *cq_context);
1614
/* Context from which a CQ is polled. */
enum ib_poll_context {
	IB_POLL_DIRECT,		   /* caller context, no hw completions */
	IB_POLL_SOFTIRQ,	   /* poll from softirq context */
	IB_POLL_WORKQUEUE,	   /* poll from workqueue */
	IB_POLL_UNBOUND_WORKQUEUE, /* poll from unbound workqueue */
};
1621
Linus Torvalds1da177e2005-04-16 15:20:36 -07001622struct ib_cq {
Roland Dreiere2773c02005-07-07 17:57:10 -07001623 struct ib_device *device;
1624 struct ib_uobject *uobject;
1625 ib_comp_handler comp_handler;
1626 void (*event_handler)(struct ib_event *, void *);
Dotan Barak4deccd62008-07-14 23:48:44 -07001627 void *cq_context;
Roland Dreiere2773c02005-07-07 17:57:10 -07001628 int cqe;
1629 atomic_t usecnt; /* count number of work queues */
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08001630 enum ib_poll_context poll_ctx;
1631 struct ib_wc *wc;
1632 union {
1633 struct irq_poll iop;
1634 struct work_struct work;
1635 };
Jack Morgensteinf7948092018-08-27 08:35:55 +03001636 struct workqueue_struct *comp_wq;
Leon Romanovsky02d88832018-01-28 11:17:20 +02001637 /*
1638 * Implementation details of the RDMA core, don't use in drivers:
1639 */
1640 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001641};
1642
1643struct ib_srq {
Roland Dreierd41fcc62005-08-18 12:23:08 -07001644 struct ib_device *device;
1645 struct ib_pd *pd;
1646 struct ib_uobject *uobject;
1647 void (*event_handler)(struct ib_event *, void *);
1648 void *srq_context;
Sean Hefty96104ed2011-05-23 16:31:36 -07001649 enum ib_srq_type srq_type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001650 atomic_t usecnt;
Sean Hefty418d5132011-05-23 19:42:29 -07001651
Artemy Kovalyov1a56ff62017-08-17 15:52:04 +03001652 struct {
1653 struct ib_cq *cq;
1654 union {
1655 struct {
1656 struct ib_xrcd *xrcd;
1657 u32 srq_num;
1658 } xrc;
1659 };
Sean Hefty418d5132011-05-23 19:42:29 -07001660 } ext;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001661};
1662
/* Raw packet capability bits; each enumerator is a distinct bit flag. */
enum ib_raw_packet_caps {
	/*
	 * Stripping the cvlan from an incoming packet and reporting it in the
	 * matching work completion is supported.
	 */
	IB_RAW_PACKET_CAP_CVLAN_STRIPPING	= (1 << 0),
	/*
	 * Scattering the FCS field of an incoming packet to host memory is
	 * supported.
	 */
	IB_RAW_PACKET_CAP_SCATTER_FCS		= (1 << 1),
	/* Checksum offloads are supported (for both send and receive). */
	IB_RAW_PACKET_CAP_IP_CSUM		= (1 << 2),
	/*
	 * When a packet is received for an RQ with no receive WQEs, the
	 * packet processing is delayed.
	 */
	IB_RAW_PACKET_CAP_DELAY_DROP		= (1 << 3),
};
1678
/* Work queue types; only one type is defined here. */
enum ib_wq_type {
	IB_WQT_RQ
};
1682
/* Work queue states. */
enum ib_wq_state {
	IB_WQS_RESET,
	IB_WQS_RDY,
	IB_WQS_ERR
};
1688
1689struct ib_wq {
1690 struct ib_device *device;
1691 struct ib_uobject *uobject;
1692 void *wq_context;
1693 void (*event_handler)(struct ib_event *, void *);
1694 struct ib_pd *pd;
1695 struct ib_cq *cq;
1696 u32 wq_num;
1697 enum ib_wq_state state;
1698 enum ib_wq_type wq_type;
1699 atomic_t usecnt;
1700};
1701
/*
 * Work queue flag bits. The create_flags, flags and flags_mask fields of
 * struct ib_wq_init_attr / struct ib_wq_attr take values from this enum.
 */
enum ib_wq_flags {
	IB_WQ_FLAGS_CVLAN_STRIPPING		= 1 << 0,
	IB_WQ_FLAGS_SCATTER_FCS			= 1 << 1,
	IB_WQ_FLAGS_DELAY_DROP			= 1 << 2,
	IB_WQ_FLAGS_PCI_WRITE_END_PADDING	= 1 << 3,
};
1708
Yishai Hadas5fd251c2016-05-23 15:20:48 +03001709struct ib_wq_init_attr {
1710 void *wq_context;
1711 enum ib_wq_type wq_type;
1712 u32 max_wr;
1713 u32 max_sge;
1714 struct ib_cq *cq;
1715 void (*event_handler)(struct ib_event *, void *);
Noa Osherovich10bac722017-01-18 15:39:55 +02001716 u32 create_flags; /* Use enum ib_wq_flags */
Yishai Hadas5fd251c2016-05-23 15:20:48 +03001717};
1718
/*
 * Bit mask values naming work queue attributes.
 * NOTE(review): presumably selects which struct ib_wq_attr fields are
 * valid in a modify call - confirm against the caller.
 */
enum ib_wq_attr_mask {
	IB_WQ_STATE		= 1 << 0,
	IB_WQ_CUR_STATE		= 1 << 1,
	IB_WQ_FLAGS		= 1 << 2,
};
1724
1725struct ib_wq_attr {
1726 enum ib_wq_state wq_state;
1727 enum ib_wq_state curr_wq_state;
Noa Osherovich10bac722017-01-18 15:39:55 +02001728 u32 flags; /* Use enum ib_wq_flags */
1729 u32 flags_mask; /* Use enum ib_wq_flags */
Yishai Hadas5fd251c2016-05-23 15:20:48 +03001730};
1731
Yishai Hadas6d397862016-05-23 15:20:51 +03001732struct ib_rwq_ind_table {
1733 struct ib_device *device;
1734 struct ib_uobject *uobject;
1735 atomic_t usecnt;
1736 u32 ind_tbl_num;
1737 u32 log_ind_tbl_size;
1738 struct ib_wq **ind_tbl;
1739};
1740
1741struct ib_rwq_ind_table_init_attr {
1742 u32 log_ind_tbl_size;
1743 /* Each entry is a pointer to Receive Work Queue */
1744 struct ib_wq **ind_tbl;
1745};
1746
/* State of a struct ib_port_pkey entry. */
enum port_pkey_state {
	IB_PORT_PKEY_NOT_VALID = 0,
	IB_PORT_PKEY_VALID = 1,
	IB_PORT_PKEY_LISTED = 2,
};
1752
1753struct ib_qp_security;
1754
1755struct ib_port_pkey {
1756 enum port_pkey_state state;
1757 u16 pkey_index;
1758 u8 port_num;
1759 struct list_head qp_list;
1760 struct list_head to_error_list;
1761 struct ib_qp_security *sec;
1762};
1763
1764struct ib_ports_pkeys {
1765 struct ib_port_pkey main;
1766 struct ib_port_pkey alt;
1767};
1768
1769struct ib_qp_security {
1770 struct ib_qp *qp;
1771 struct ib_device *dev;
1772 /* Hold this mutex when changing port and pkey settings. */
1773 struct mutex mutex;
1774 struct ib_ports_pkeys *ports_pkeys;
1775 /* A list of all open shared QP handles. Required to enforce security
1776 * properly for all users of a shared QP.
1777 */
1778 struct list_head shared_qp_list;
1779 void *security;
1780 bool destroying;
1781 atomic_t error_list_count;
1782 struct completion error_complete;
1783 int error_comps_pending;
1784};
1785
Bart Van Assche632bc3f2016-07-21 13:03:30 -07001786/*
1787 * @max_write_sge: Maximum SGE elements per RDMA WRITE request.
1788 * @max_read_sge: Maximum SGE elements per RDMA READ request.
1789 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001790struct ib_qp {
1791 struct ib_device *device;
1792 struct ib_pd *pd;
1793 struct ib_cq *send_cq;
1794 struct ib_cq *recv_cq;
Christoph Hellwigfffb0382016-05-03 18:01:07 +02001795 spinlock_t mr_lock;
1796 int mrs_used;
Christoph Hellwiga060b562016-05-03 18:01:09 +02001797 struct list_head rdma_mrs;
Christoph Hellwig0e353e32016-05-03 18:01:12 +02001798 struct list_head sig_mrs;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001799 struct ib_srq *srq;
Sean Heftyb42b63c2011-05-23 19:59:25 -07001800 struct ib_xrcd *xrcd; /* XRC TGT QPs only */
Sean Heftyd3d72d92011-05-26 23:06:44 -07001801 struct list_head xrcd_list;
Christoph Hellwigfffb0382016-05-03 18:01:07 +02001802
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001803 /* count times opened, mcast attaches, flow attaches */
1804 atomic_t usecnt;
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07001805 struct list_head open_list;
1806 struct ib_qp *real_qp;
Roland Dreiere2773c02005-07-07 17:57:10 -07001807 struct ib_uobject *uobject;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001808 void (*event_handler)(struct ib_event *, void *);
1809 void *qp_context;
Jason Gunthorpe1a1f4602018-06-13 10:22:08 +03001810 /* sgid_attrs associated with the AV's */
1811 const struct ib_gid_attr *av_sgid_attr;
1812 const struct ib_gid_attr *alt_path_sgid_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001813 u32 qp_num;
Bart Van Assche632bc3f2016-07-21 13:03:30 -07001814 u32 max_write_sge;
1815 u32 max_read_sge;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001816 enum ib_qp_type qp_type;
Yishai Hadasa9017e22016-05-23 15:20:54 +03001817 struct ib_rwq_ind_table *rwq_ind_tbl;
Daniel Jurgensd291f1a2017-05-19 15:48:52 +03001818 struct ib_qp_security *qp_sec;
Noa Osherovich498ca3c2017-08-23 08:35:40 +03001819 u8 port;
Leon Romanovsky02d88832018-01-28 11:17:20 +02001820
1821 /*
1822 * Implementation details of the RDMA core, don't use in drivers:
1823 */
1824 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001825};
1826
Ariel Levkovichbee76d72018-04-05 18:53:24 +03001827struct ib_dm {
1828 struct ib_device *device;
1829 u32 length;
1830 u32 flags;
1831 struct ib_uobject *uobject;
1832 atomic_t usecnt;
1833};
1834
Linus Torvalds1da177e2005-04-16 15:20:36 -07001835struct ib_mr {
Roland Dreiere2773c02005-07-07 17:57:10 -07001836 struct ib_device *device;
1837 struct ib_pd *pd;
Roland Dreiere2773c02005-07-07 17:57:10 -07001838 u32 lkey;
1839 u32 rkey;
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001840 u64 iova;
Parav Panditedd31552017-09-24 21:46:31 +03001841 u64 length;
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03001842 unsigned int page_size;
Steve Wised4a85c32016-05-03 18:01:08 +02001843 bool need_inval;
Christoph Hellwigfffb0382016-05-03 18:01:07 +02001844 union {
1845 struct ib_uobject *uobject; /* user */
1846 struct list_head qp_entry; /* FR */
1847 };
Steve Wisefccec5b2018-03-01 13:58:13 -08001848
Ariel Levkovichbe934cc2018-04-05 18:53:25 +03001849 struct ib_dm *dm;
1850
Steve Wisefccec5b2018-03-01 13:58:13 -08001851 /*
1852 * Implementation details of the RDMA core, don't use in drivers:
1853 */
1854 struct rdma_restrack_entry res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001855};
1856
1857struct ib_mw {
1858 struct ib_device *device;
1859 struct ib_pd *pd;
Roland Dreiere2773c02005-07-07 17:57:10 -07001860 struct ib_uobject *uobject;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001861 u32 rkey;
Shani Michaeli7083e422013-02-06 16:19:12 +00001862 enum ib_mw_type type;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001863};
1864
1865struct ib_fmr {
1866 struct ib_device *device;
1867 struct ib_pd *pd;
1868 struct list_head list;
1869 u32 lkey;
1870 u32 rkey;
1871};
1872
/* Supported steering options */
enum ib_flow_attr_type {
	/* steering according to rule specifications */
	IB_FLOW_ATTR_NORMAL		= 0x0,
	/*
	 * default unicast and multicast rule -
	 * receive all Eth traffic which isn't steered to any QP
	 */
	IB_FLOW_ATTR_ALL_DEFAULT	= 0x1,
	/*
	 * default multicast rule -
	 * receive all Eth multicast traffic which isn't steered to any QP
	 */
	IB_FLOW_ATTR_MC_DEFAULT		= 0x2,
	/* sniffer rule - receive all port traffic */
	IB_FLOW_ATTR_SNIFFER		= 0x3
};
1888
/* Supported steering header types */
enum ib_flow_spec_type {
	/* L2 headers */
	IB_FLOW_SPEC_ETH		= 0x20,
	IB_FLOW_SPEC_IB			= 0x22,
	/* L3 header */
	IB_FLOW_SPEC_IPV4		= 0x30,
	IB_FLOW_SPEC_IPV6		= 0x31,
	IB_FLOW_SPEC_ESP		= 0x34,
	/* L4 headers */
	IB_FLOW_SPEC_TCP		= 0x40,
	IB_FLOW_SPEC_UDP		= 0x41,
	IB_FLOW_SPEC_VXLAN_TUNNEL	= 0x50,
	IB_FLOW_SPEC_GRE		= 0x51,
	IB_FLOW_SPEC_MPLS		= 0x60,
	/* NOTE(review): a single bit, presumably OR-ed into a header type */
	IB_FLOW_SPEC_INNER		= 0x100,
	/* Actions */
	IB_FLOW_SPEC_ACTION_TAG		= 0x1000,
	IB_FLOW_SPEC_ACTION_DROP	= 0x1001,
	IB_FLOW_SPEC_ACTION_HANDLE	= 0x1002,
	IB_FLOW_SPEC_ACTION_COUNT	= 0x1003,
};
/* Selects the high nibble of the low byte of a spec type (0x20, 0x30, ...). */
#define IB_FLOW_SPEC_LAYER_MASK	0xF0
#define IB_FLOW_SPEC_SUPPORT_LAYERS	10
Matan Barak22878db2013-09-01 18:39:52 +03001913
/*
 * Flow steering rule priority is set according to its domain.
 * Lower domain value means higher priority.
 */
enum ib_flow_domain {
	IB_FLOW_DOMAIN_USER,
	IB_FLOW_DOMAIN_ETHTOOL,
	IB_FLOW_DOMAIN_RFS,
	IB_FLOW_DOMAIN_NIC,
	IB_FLOW_DOMAIN_NUM /* Must be last */
};
1924
/* Flow attribute flag bits. Note that bit 0 is not defined here. */
enum ib_flow_flags {
	IB_FLOW_ATTR_FLAGS_DONT_TRAP = 1UL << 1, /* Continue match, no steal */
	IB_FLOW_ATTR_FLAGS_EGRESS = 1UL << 2, /* Egress flow */
	IB_FLOW_ATTR_FLAGS_RESERVED = 1UL << 3 /* Must be last */
};
1930
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001931struct ib_flow_eth_filter {
1932 u8 dst_mac[6];
1933 u8 src_mac[6];
1934 __be16 ether_type;
1935 __be16 vlan_tag;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001936 /* Must be last */
1937 u8 real_sz[0];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001938};
1939
1940struct ib_flow_spec_eth {
Moses Reubenfbf46862016-11-14 19:04:51 +02001941 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001942 u16 size;
1943 struct ib_flow_eth_filter val;
1944 struct ib_flow_eth_filter mask;
1945};
1946
Matan Barak240ae002013-11-07 15:25:13 +02001947struct ib_flow_ib_filter {
1948 __be16 dlid;
1949 __u8 sl;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001950 /* Must be last */
1951 u8 real_sz[0];
Matan Barak240ae002013-11-07 15:25:13 +02001952};
1953
1954struct ib_flow_spec_ib {
Moses Reubenfbf46862016-11-14 19:04:51 +02001955 u32 type;
Matan Barak240ae002013-11-07 15:25:13 +02001956 u16 size;
1957 struct ib_flow_ib_filter val;
1958 struct ib_flow_ib_filter mask;
1959};
1960
/* IPv4 header flags */
enum ib_ipv4_flags {
	IB_IPV4_DONT_FRAG = 0x2, /* Don't enable packet fragmentation */
	IB_IPV4_MORE_FRAG = 0x4  /* Set on all fragmented packets except
				    the last */
};
1967
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001968struct ib_flow_ipv4_filter {
1969 __be32 src_ip;
1970 __be32 dst_ip;
Maor Gottlieb989a3a82016-08-30 16:58:33 +03001971 u8 proto;
1972 u8 tos;
1973 u8 ttl;
1974 u8 flags;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001975 /* Must be last */
1976 u8 real_sz[0];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001977};
1978
1979struct ib_flow_spec_ipv4 {
Moses Reubenfbf46862016-11-14 19:04:51 +02001980 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03001981 u16 size;
1982 struct ib_flow_ipv4_filter val;
1983 struct ib_flow_ipv4_filter mask;
1984};
1985
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03001986struct ib_flow_ipv6_filter {
1987 u8 src_ip[16];
1988 u8 dst_ip[16];
Maor Gottlieba72c6a22016-08-30 16:58:34 +03001989 __be32 flow_label;
1990 u8 next_hdr;
1991 u8 traffic_class;
1992 u8 hop_limit;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03001993 /* Must be last */
1994 u8 real_sz[0];
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03001995};
1996
1997struct ib_flow_spec_ipv6 {
Moses Reubenfbf46862016-11-14 19:04:51 +02001998 u32 type;
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03001999 u16 size;
2000 struct ib_flow_ipv6_filter val;
2001 struct ib_flow_ipv6_filter mask;
2002};
2003
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002004struct ib_flow_tcp_udp_filter {
2005 __be16 dst_port;
2006 __be16 src_port;
Maor Gottlieb15dfbd62016-08-30 16:58:32 +03002007 /* Must be last */
2008 u8 real_sz[0];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002009};
2010
2011struct ib_flow_spec_tcp_udp {
Moses Reubenfbf46862016-11-14 19:04:51 +02002012 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002013 u16 size;
2014 struct ib_flow_tcp_udp_filter val;
2015 struct ib_flow_tcp_udp_filter mask;
2016};
2017
Moses Reuben0dbf3332016-11-14 19:04:47 +02002018struct ib_flow_tunnel_filter {
2019 __be32 tunnel_id;
2020 u8 real_sz[0];
2021};
2022
2023/* ib_flow_spec_tunnel describes the Vxlan tunnel
2024 * the tunnel_id from val has the vni value
2025 */
2026struct ib_flow_spec_tunnel {
Moses Reubenfbf46862016-11-14 19:04:51 +02002027 u32 type;
Moses Reuben0dbf3332016-11-14 19:04:47 +02002028 u16 size;
2029 struct ib_flow_tunnel_filter val;
2030 struct ib_flow_tunnel_filter mask;
2031};
2032
Matan Barak56ab0b32018-03-28 09:27:49 +03002033struct ib_flow_esp_filter {
2034 __be32 spi;
2035 __be32 seq;
2036 /* Must be last */
2037 u8 real_sz[0];
2038};
2039
2040struct ib_flow_spec_esp {
2041 u32 type;
2042 u16 size;
2043 struct ib_flow_esp_filter val;
2044 struct ib_flow_esp_filter mask;
2045};
2046
Ariel Levkovichd90e5e52018-05-13 14:33:30 +03002047struct ib_flow_gre_filter {
2048 __be16 c_ks_res0_ver;
2049 __be16 protocol;
2050 __be32 key;
2051 /* Must be last */
2052 u8 real_sz[0];
2053};
2054
2055struct ib_flow_spec_gre {
2056 u32 type;
2057 u16 size;
2058 struct ib_flow_gre_filter val;
2059 struct ib_flow_gre_filter mask;
2060};
2061
Ariel Levkovichb04f0f02018-05-13 14:33:32 +03002062struct ib_flow_mpls_filter {
2063 __be32 tag;
2064 /* Must be last */
2065 u8 real_sz[0];
2066};
2067
2068struct ib_flow_spec_mpls {
2069 u32 type;
2070 u16 size;
2071 struct ib_flow_mpls_filter val;
2072 struct ib_flow_mpls_filter mask;
2073};
2074
Moses Reuben460d0192017-01-18 14:59:48 +02002075struct ib_flow_spec_action_tag {
2076 enum ib_flow_spec_type type;
2077 u16 size;
2078 u32 tag_id;
2079};
2080
Slava Shwartsman483a3962017-04-03 13:13:51 +03002081struct ib_flow_spec_action_drop {
2082 enum ib_flow_spec_type type;
2083 u16 size;
2084};
2085
Matan Barak9b828442018-03-28 09:27:46 +03002086struct ib_flow_spec_action_handle {
2087 enum ib_flow_spec_type type;
2088 u16 size;
2089 struct ib_flow_action *act;
2090};
2091
/* Kinds of counter value: packets or bytes. */
enum ib_counters_description {
	IB_COUNTER_PACKETS,
	IB_COUNTER_BYTES,
};
2096
2097struct ib_flow_spec_action_count {
2098 enum ib_flow_spec_type type;
2099 u16 size;
2100 struct ib_counters *counters;
2101};
2102
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002103union ib_flow_spec {
2104 struct {
Moses Reubenfbf46862016-11-14 19:04:51 +02002105 u32 type;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002106 u16 size;
2107 };
2108 struct ib_flow_spec_eth eth;
Matan Barak240ae002013-11-07 15:25:13 +02002109 struct ib_flow_spec_ib ib;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002110 struct ib_flow_spec_ipv4 ipv4;
2111 struct ib_flow_spec_tcp_udp tcp_udp;
Maor Gottlieb4c2aae72016-06-17 15:14:50 +03002112 struct ib_flow_spec_ipv6 ipv6;
Moses Reuben0dbf3332016-11-14 19:04:47 +02002113 struct ib_flow_spec_tunnel tunnel;
Matan Barak56ab0b32018-03-28 09:27:49 +03002114 struct ib_flow_spec_esp esp;
Ariel Levkovichd90e5e52018-05-13 14:33:30 +03002115 struct ib_flow_spec_gre gre;
Ariel Levkovichb04f0f02018-05-13 14:33:32 +03002116 struct ib_flow_spec_mpls mpls;
Moses Reuben460d0192017-01-18 14:59:48 +02002117 struct ib_flow_spec_action_tag flow_tag;
Slava Shwartsman483a3962017-04-03 13:13:51 +03002118 struct ib_flow_spec_action_drop drop;
Matan Barak9b828442018-03-28 09:27:46 +03002119 struct ib_flow_spec_action_handle action;
Raed Salem7eea23a2018-05-31 16:43:36 +03002120 struct ib_flow_spec_action_count flow_count;
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002121};
2122
2123struct ib_flow_attr {
2124 enum ib_flow_attr_type type;
2125 u16 size;
2126 u16 priority;
2127 u32 flags;
2128 u8 num_of_specs;
2129 u8 port;
Matthew Wilcox7654cb12018-06-07 07:57:16 -07002130 union ib_flow_spec flows[];
Hadar Hen Zion319a4412013-08-07 14:01:59 +03002131};
2132
/* Flow object: pointers to its QP, device and user object. */
struct ib_flow {
	struct ib_qp		*qp;
	struct ib_device	*device;
	struct ib_uobject	*uobject;
};
2138
/* Flow action types. */
enum ib_flow_action_type {
	IB_FLOW_ACTION_UNSPECIFIED,
	IB_FLOW_ACTION_ESP = 1,
};
2143
2144struct ib_flow_action_attrs_esp_keymats {
2145 enum ib_uverbs_flow_action_esp_keymat protocol;
2146 union {
2147 struct ib_uverbs_flow_action_esp_keymat_aes_gcm aes_gcm;
2148 } keymat;
2149};
2150
2151struct ib_flow_action_attrs_esp_replays {
2152 enum ib_uverbs_flow_action_esp_replay protocol;
2153 union {
2154 struct ib_uverbs_flow_action_esp_replay_bmp bmp;
2155 } replay;
2156};
2157
/*
 * Flags for struct ib_flow_action_attrs_esp. The enumerators use bits 32
 * and up, so they do not fit in an int.
 */
enum ib_flow_action_attrs_esp_flags {
	/*
	 * All user-space flags at the top: Use enum
	 * ib_uverbs_flow_action_esp_flags. This is done in order to share the
	 * same flags between user-space and kernel and spare an unnecessary
	 * translation.
	 */

	/* Kernel flags */
	IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED	= 1ULL << 32,
	IB_FLOW_ACTION_ESP_FLAGS_MOD_ESP_ATTRS	= 1ULL << 33,
};
2168
2169struct ib_flow_spec_list {
2170 struct ib_flow_spec_list *next;
2171 union ib_flow_spec spec;
2172};
2173
2174struct ib_flow_action_attrs_esp {
2175 struct ib_flow_action_attrs_esp_keymats *keymat;
2176 struct ib_flow_action_attrs_esp_replays *replay;
2177 struct ib_flow_spec_list *encap;
2178 /* Used only if IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED is enabled.
2179 * Value of 0 is a valid value.
2180 */
2181 u32 esn;
2182 u32 spi;
2183 u32 seq;
2184 u32 tfc_pad;
2185 /* Use enum ib_flow_action_attrs_esp_flags */
2186 u64 flags;
2187 u64 hard_limit_pkts;
2188};
2189
2190struct ib_flow_action {
2191 struct ib_device *device;
2192 struct ib_uobject *uobject;
2193 enum ib_flow_action_type type;
2194 atomic_t usecnt;
2195};
2196
/* Forward declarations; only pointers to these types are used here. */
struct ib_mad_hdr;
struct ib_grh;
2199
/* Flag bits for MAD processing; IGNORE_ALL is the OR of the other two. */
enum ib_process_mad_flags {
	IB_MAD_IGNORE_MKEY	= 1,
	IB_MAD_IGNORE_BKEY	= 2,
	IB_MAD_IGNORE_ALL	= IB_MAD_IGNORE_MKEY | IB_MAD_IGNORE_BKEY
};
2205
/* Result bits of MAD processing; FAILURE is the absence of SUCCESS. */
enum ib_mad_result {
	IB_MAD_RESULT_FAILURE  = 0,      /* (!SUCCESS is the important flag) */
	IB_MAD_RESULT_SUCCESS  = 1 << 0, /* MAD was successfully processed   */
	IB_MAD_RESULT_REPLY    = 1 << 1, /* Reply packet needs to be sent    */
	IB_MAD_RESULT_CONSUMED = 1 << 2  /* Packet consumed: stop processing */
};
2212
Jack Wang21d64542017-01-17 10:11:12 +01002213struct ib_port_cache {
Daniel Jurgens883c71f2017-05-19 15:48:51 +03002214 u64 subnet_prefix;
Jack Wang21d64542017-01-17 10:11:12 +01002215 struct ib_pkey_cache *pkey;
2216 struct ib_gid_table *gid;
2217 u8 lmc;
2218 enum ib_port_state port_state;
2219};
2220
Linus Torvalds1da177e2005-04-16 15:20:36 -07002221struct ib_cache {
2222 rwlock_t lock;
2223 struct ib_event_handler event_handler;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002224};
2225
Ira Weiny77386132015-05-13 20:02:58 -04002226struct ib_port_immutable {
2227 int pkey_tbl_len;
2228 int gid_tbl_len;
Ira Weinyf9b22e32015-05-13 20:02:59 -04002229 u32 core_cap_flags;
Ira Weiny337877a2015-06-06 14:38:29 -04002230 u32 max_mad_size;
Ira Weiny77386132015-05-13 20:02:58 -04002231};
2232
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002233struct ib_port_data {
Jason Gunthorpe324e2272019-02-12 21:12:51 -07002234 struct ib_device *ib_dev;
2235
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002236 struct ib_port_immutable immutable;
2237
2238 spinlock_t pkey_list_lock;
2239 struct list_head pkey_list;
Jason Gunthorpe8faea9f2019-02-12 21:12:49 -07002240
2241 struct ib_port_cache cache;
Jason Gunthorpec2261dd2019-02-12 21:12:50 -07002242
2243 spinlock_t netdev_lock;
Jason Gunthorpe324e2272019-02-12 21:12:51 -07002244 struct net_device __rcu *netdev;
2245 struct hlist_node ndev_hash_link;
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002246};
2247
/* rdma netdev type - specifies protocol type */
enum rdma_netdev_t {
	RDMA_NETDEV_OPA_VNIC,
	RDMA_NETDEV_IPOIB,
};
2253
2254/**
2255 * struct rdma_netdev - rdma netdev
2256 * For cases where netstack interfacing is required.
2257 */
2258struct rdma_netdev {
2259 void *clnt_priv;
2260 struct ib_device *hca;
2261 u8 port_num;
2262
Jason Gunthorpe9f49a5b2018-07-29 11:34:56 +03002263 /*
2264 * cleanup function must be specified.
2265 * FIXME: This is only used for OPA_VNIC and that usage should be
2266 * removed too.
2267 */
Niranjana Vishwanathapura8e959602017-06-30 13:14:46 -07002268 void (*free_rdma_netdev)(struct net_device *netdev);
2269
Vishwanathapura, Niranjana2fc77572017-04-12 20:29:20 -07002270 /* control functions */
2271 void (*set_id)(struct net_device *netdev, int id);
Niranjana Vishwanathapuraf0ad83ac2017-04-10 11:22:25 +03002272 /* send packet */
2273 int (*send)(struct net_device *dev, struct sk_buff *skb,
2274 struct ib_ah *address, u32 dqpn);
2275 /* multicast */
2276 int (*attach_mcast)(struct net_device *dev, struct ib_device *hca,
2277 union ib_gid *gid, u16 mlid,
2278 int set_qkey, u32 qkey);
2279 int (*detach_mcast)(struct net_device *dev, struct ib_device *hca,
2280 union ib_gid *gid, u16 mlid);
Vishwanathapura, Niranjana2fc77572017-04-12 20:29:20 -07002281};
2282
Denis Drozdovf6a8a192018-08-14 14:08:51 +03002283struct rdma_netdev_alloc_params {
2284 size_t sizeof_priv;
2285 unsigned int txqs;
2286 unsigned int rxqs;
2287 void *param;
2288
2289 int (*initialize_rdma_netdev)(struct ib_device *device, u8 port_num,
2290 struct net_device *netdev, void *param);
2291};
2292
Raed Salemfa9b1802018-05-31 16:43:31 +03002293struct ib_counters {
2294 struct ib_device *device;
2295 struct ib_uobject *uobject;
2296 /* num of objects attached */
2297 atomic_t usecnt;
2298};
2299
Raed Salem51d7a532018-05-31 16:43:33 +03002300struct ib_counters_read_attr {
2301 u64 *counters_buff;
2302 u32 ncounters;
2303 u32 flags; /* use enum ib_read_counters_flags */
2304};
2305
/* Forward declarations of types defined elsewhere. */
struct uverbs_attr_bundle;
struct iw_cm_id;
struct iw_cm_conn_param;
Matan Barak2eb9bea2018-03-28 09:27:45 +03002309
/*
 * Designated initializer for a size_<ib_struct> field (see
 * DECLARE_RDMA_OBJ_SIZE), set to sizeof(struct drv_struct).
 *
 * The two BUILD_BUG_ON_ZERO() terms are build-time checks that @member sits
 * at offset 0 of struct drv_struct and has type struct ib_struct.
 * NOTE(review): assumes BUILD_BUG_ON_ZERO() (defined elsewhere) fails the
 * build on a non-zero argument and otherwise evaluates to 0.
 */
#define INIT_RDMA_OBJ_SIZE(ib_struct, drv_struct, member)                      \
	.size_##ib_struct =                                                    \
		(sizeof(struct drv_struct) +                                   \
		 BUILD_BUG_ON_ZERO(offsetof(struct drv_struct, member)) +      \
		 BUILD_BUG_ON_ZERO(                                            \
			 !__same_type(((struct drv_struct *)NULL)->member,     \
				      struct ib_struct)))
2317
/*
 * Allocate a zeroed object of ib_dev->ops.size_<ib_type> bytes with
 * kzalloc() and cast the result to struct ib_type *. The value is whatever
 * kzalloc() returns, so callers must check it.
 *
 * @ib_dev is parenthesized so that an expression argument (e.g. "base + i")
 * binds correctly before the "->".
 */
#define rdma_zalloc_drv_obj_gfp(ib_dev, ib_type, gfp)                         \
	((struct ib_type *)kzalloc((ib_dev)->ops.size_##ib_type, gfp))

/* Same as rdma_zalloc_drv_obj_gfp() with GFP_KERNEL. */
#define rdma_zalloc_drv_obj(ib_dev, ib_type)                                   \
	rdma_zalloc_drv_obj_gfp(ib_dev, ib_type, GFP_KERNEL)
Leon Romanovsky30471d42019-02-03 14:55:50 +02002323
/*
 * Declares the size_t member size_<ib_struct>; this is the field that
 * INIT_RDMA_OBJ_SIZE() initializes and rdma_zalloc_drv_obj_gfp() reads.
 */
#define DECLARE_RDMA_OBJ_SIZE(ib_struct) size_t size_##ib_struct
2325
Kamal Heib521ed0d2018-12-10 21:09:30 +02002326/**
2327 * struct ib_device_ops - InfiniBand device operations
2328 * This structure defines all the InfiniBand device operations, providers will
2329 * need to define the supported operations, otherwise they will be set to null.
2330 */
2331struct ib_device_ops {
Jason Gunthorpeb9560a42019-06-05 14:39:24 -03002332 enum rdma_driver_id driver_id;
2333
Kamal Heib521ed0d2018-12-10 21:09:30 +02002334 int (*post_send)(struct ib_qp *qp, const struct ib_send_wr *send_wr,
2335 const struct ib_send_wr **bad_send_wr);
2336 int (*post_recv)(struct ib_qp *qp, const struct ib_recv_wr *recv_wr,
2337 const struct ib_recv_wr **bad_recv_wr);
2338 void (*drain_rq)(struct ib_qp *qp);
2339 void (*drain_sq)(struct ib_qp *qp);
2340 int (*poll_cq)(struct ib_cq *cq, int num_entries, struct ib_wc *wc);
2341 int (*peek_cq)(struct ib_cq *cq, int wc_cnt);
2342 int (*req_notify_cq)(struct ib_cq *cq, enum ib_cq_notify_flags flags);
2343 int (*req_ncomp_notif)(struct ib_cq *cq, int wc_cnt);
2344 int (*post_srq_recv)(struct ib_srq *srq,
2345 const struct ib_recv_wr *recv_wr,
2346 const struct ib_recv_wr **bad_recv_wr);
2347 int (*process_mad)(struct ib_device *device, int process_mad_flags,
2348 u8 port_num, const struct ib_wc *in_wc,
2349 const struct ib_grh *in_grh,
2350 const struct ib_mad_hdr *in_mad, size_t in_mad_size,
2351 struct ib_mad_hdr *out_mad, size_t *out_mad_size,
2352 u16 *out_mad_pkey_index);
2353 int (*query_device)(struct ib_device *device,
2354 struct ib_device_attr *device_attr,
2355 struct ib_udata *udata);
2356 int (*modify_device)(struct ib_device *device, int device_modify_mask,
2357 struct ib_device_modify *device_modify);
2358 void (*get_dev_fw_str)(struct ib_device *device, char *str);
2359 const struct cpumask *(*get_vector_affinity)(struct ib_device *ibdev,
2360 int comp_vector);
2361 int (*query_port)(struct ib_device *device, u8 port_num,
2362 struct ib_port_attr *port_attr);
2363 int (*modify_port)(struct ib_device *device, u8 port_num,
2364 int port_modify_mask,
2365 struct ib_port_modify *port_modify);
2366 /**
2367 * The following mandatory functions are used only at device
2368 * registration. Keep functions such as these at the end of this
2369 * structure to avoid cache line misses when accessing struct ib_device
2370 * in fast paths.
2371 */
2372 int (*get_port_immutable)(struct ib_device *device, u8 port_num,
2373 struct ib_port_immutable *immutable);
2374 enum rdma_link_layer (*get_link_layer)(struct ib_device *device,
2375 u8 port_num);
2376 /**
2377 * When calling get_netdev, the HW vendor's driver should return the
2378 * net device of device @device at port @port_num or NULL if such
2379 * a net device doesn't exist. The vendor driver should call dev_hold
2380 * on this net device. The HW vendor's device driver must guarantee
2381 * that this function returns NULL before the net device has finished
2382 * NETDEV_UNREGISTER state.
2383 */
2384 struct net_device *(*get_netdev)(struct ib_device *device, u8 port_num);
2385 /**
2386 * rdma netdev operation
2387 *
2388 * Driver implementing alloc_rdma_netdev or rdma_netdev_get_params
2389 * must return -EOPNOTSUPP if it doesn't support the specified type.
2390 */
2391 struct net_device *(*alloc_rdma_netdev)(
2392 struct ib_device *device, u8 port_num, enum rdma_netdev_t type,
2393 const char *name, unsigned char name_assign_type,
2394 void (*setup)(struct net_device *));
2395
2396 int (*rdma_netdev_get_params)(struct ib_device *device, u8 port_num,
2397 enum rdma_netdev_t type,
2398 struct rdma_netdev_alloc_params *params);
2399 /**
	 * query_gid should return the GID value for @device when the
	 * @port_num link layer is either IB or iWarp. It is a no-op if the
	 * @port_num port has a RoCE link layer.
2403 */
2404 int (*query_gid)(struct ib_device *device, u8 port_num, int index,
2405 union ib_gid *gid);
2406 /**
2407 * When calling add_gid, the HW vendor's driver should add the gid
2408 * of device of port at gid index available at @attr. Meta-info of
2409 * that gid (for example, the network device related to this gid) is
2410 * available at @attr. @context allows the HW vendor driver to store
2411 * extra information together with a GID entry. The HW vendor driver may
2412 * allocate memory to contain this information and store it in @context
2413 * when a new GID entry is written to. Params are consistent until the
2414 * next call of add_gid or delete_gid. The function should return 0 on
2415 * success or error otherwise. The function could be called
2416 * concurrently for different ports. This function is only called when
2417 * roce_gid_table is used.
2418 */
2419 int (*add_gid)(const struct ib_gid_attr *attr, void **context);
2420 /**
2421 * When calling del_gid, the HW vendor's driver should delete the
2422 * gid of device @device at gid index gid_index of port port_num
2423 * available in @attr.
2424 * Upon the deletion of a GID entry, the HW vendor must free any
2425 * allocated memory. The caller will clear @context afterwards.
2426 * This function is only called when roce_gid_table is used.
2427 */
2428 int (*del_gid)(const struct ib_gid_attr *attr, void **context);
2429 int (*query_pkey)(struct ib_device *device, u8 port_num, u16 index,
2430 u16 *pkey);
Leon Romanovskya2a074e2019-02-12 20:39:16 +02002431 int (*alloc_ucontext)(struct ib_ucontext *context,
2432 struct ib_udata *udata);
2433 void (*dealloc_ucontext)(struct ib_ucontext *context);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002434 int (*mmap)(struct ib_ucontext *context, struct vm_area_struct *vma);
2435 void (*disassociate_ucontext)(struct ib_ucontext *ibcontext);
Shamir Rabinovitchff23dfa2019-03-31 19:10:07 +03002436 int (*alloc_pd)(struct ib_pd *pd, struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002437 void (*dealloc_pd)(struct ib_pd *pd, struct ib_udata *udata);
Leon Romanovskyd3456912019-04-03 16:42:42 +03002438 int (*create_ah)(struct ib_ah *ah, struct rdma_ah_attr *ah_attr,
2439 u32 flags, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002440 int (*modify_ah)(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
2441 int (*query_ah)(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
Leon Romanovskyd3456912019-04-03 16:42:42 +03002442 void (*destroy_ah)(struct ib_ah *ah, u32 flags);
Leon Romanovsky68e326d2019-04-03 16:42:43 +03002443 int (*create_srq)(struct ib_srq *srq,
2444 struct ib_srq_init_attr *srq_init_attr,
2445 struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002446 int (*modify_srq)(struct ib_srq *srq, struct ib_srq_attr *srq_attr,
2447 enum ib_srq_attr_mask srq_attr_mask,
2448 struct ib_udata *udata);
2449 int (*query_srq)(struct ib_srq *srq, struct ib_srq_attr *srq_attr);
Leon Romanovsky68e326d2019-04-03 16:42:43 +03002450 void (*destroy_srq)(struct ib_srq *srq, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002451 struct ib_qp *(*create_qp)(struct ib_pd *pd,
2452 struct ib_qp_init_attr *qp_init_attr,
2453 struct ib_udata *udata);
2454 int (*modify_qp)(struct ib_qp *qp, struct ib_qp_attr *qp_attr,
2455 int qp_attr_mask, struct ib_udata *udata);
2456 int (*query_qp)(struct ib_qp *qp, struct ib_qp_attr *qp_attr,
2457 int qp_attr_mask, struct ib_qp_init_attr *qp_init_attr);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002458 int (*destroy_qp)(struct ib_qp *qp, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002459 struct ib_cq *(*create_cq)(struct ib_device *device,
2460 const struct ib_cq_init_attr *attr,
Kamal Heib521ed0d2018-12-10 21:09:30 +02002461 struct ib_udata *udata);
2462 int (*modify_cq)(struct ib_cq *cq, u16 cq_count, u16 cq_period);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002463 int (*destroy_cq)(struct ib_cq *cq, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002464 int (*resize_cq)(struct ib_cq *cq, int cqe, struct ib_udata *udata);
2465 struct ib_mr *(*get_dma_mr)(struct ib_pd *pd, int mr_access_flags);
2466 struct ib_mr *(*reg_user_mr)(struct ib_pd *pd, u64 start, u64 length,
2467 u64 virt_addr, int mr_access_flags,
2468 struct ib_udata *udata);
2469 int (*rereg_user_mr)(struct ib_mr *mr, int flags, u64 start, u64 length,
2470 u64 virt_addr, int mr_access_flags,
2471 struct ib_pd *pd, struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002472 int (*dereg_mr)(struct ib_mr *mr, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002473 struct ib_mr *(*alloc_mr)(struct ib_pd *pd, enum ib_mr_type mr_type,
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002474 u32 max_num_sg, struct ib_udata *udata);
Moni Shouaad8a4492018-12-11 13:37:52 +02002475 int (*advise_mr)(struct ib_pd *pd,
2476 enum ib_uverbs_advise_mr_advice advice, u32 flags,
2477 struct ib_sge *sg_list, u32 num_sge,
2478 struct uverbs_attr_bundle *attrs);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002479 int (*map_mr_sg)(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
2480 unsigned int *sg_offset);
2481 int (*check_mr_status)(struct ib_mr *mr, u32 check_mask,
2482 struct ib_mr_status *mr_status);
2483 struct ib_mw *(*alloc_mw)(struct ib_pd *pd, enum ib_mw_type type,
2484 struct ib_udata *udata);
2485 int (*dealloc_mw)(struct ib_mw *mw);
2486 struct ib_fmr *(*alloc_fmr)(struct ib_pd *pd, int mr_access_flags,
2487 struct ib_fmr_attr *fmr_attr);
2488 int (*map_phys_fmr)(struct ib_fmr *fmr, u64 *page_list, int list_len,
2489 u64 iova);
2490 int (*unmap_fmr)(struct list_head *fmr_list);
2491 int (*dealloc_fmr)(struct ib_fmr *fmr);
2492 int (*attach_mcast)(struct ib_qp *qp, union ib_gid *gid, u16 lid);
2493 int (*detach_mcast)(struct ib_qp *qp, union ib_gid *gid, u16 lid);
2494 struct ib_xrcd *(*alloc_xrcd)(struct ib_device *device,
Kamal Heib521ed0d2018-12-10 21:09:30 +02002495 struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002496 int (*dealloc_xrcd)(struct ib_xrcd *xrcd, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002497 struct ib_flow *(*create_flow)(struct ib_qp *qp,
2498 struct ib_flow_attr *flow_attr,
2499 int domain, struct ib_udata *udata);
2500 int (*destroy_flow)(struct ib_flow *flow_id);
2501 struct ib_flow_action *(*create_flow_action_esp)(
2502 struct ib_device *device,
2503 const struct ib_flow_action_attrs_esp *attr,
2504 struct uverbs_attr_bundle *attrs);
2505 int (*destroy_flow_action)(struct ib_flow_action *action);
2506 int (*modify_flow_action_esp)(
2507 struct ib_flow_action *action,
2508 const struct ib_flow_action_attrs_esp *attr,
2509 struct uverbs_attr_bundle *attrs);
2510 int (*set_vf_link_state)(struct ib_device *device, int vf, u8 port,
2511 int state);
2512 int (*get_vf_config)(struct ib_device *device, int vf, u8 port,
2513 struct ifla_vf_info *ivf);
2514 int (*get_vf_stats)(struct ib_device *device, int vf, u8 port,
2515 struct ifla_vf_stats *stats);
2516 int (*set_vf_guid)(struct ib_device *device, int vf, u8 port, u64 guid,
2517 int type);
2518 struct ib_wq *(*create_wq)(struct ib_pd *pd,
2519 struct ib_wq_init_attr *init_attr,
2520 struct ib_udata *udata);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002521 int (*destroy_wq)(struct ib_wq *wq, struct ib_udata *udata);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002522 int (*modify_wq)(struct ib_wq *wq, struct ib_wq_attr *attr,
2523 u32 wq_attr_mask, struct ib_udata *udata);
2524 struct ib_rwq_ind_table *(*create_rwq_ind_table)(
2525 struct ib_device *device,
2526 struct ib_rwq_ind_table_init_attr *init_attr,
2527 struct ib_udata *udata);
2528 int (*destroy_rwq_ind_table)(struct ib_rwq_ind_table *wq_ind_table);
2529 struct ib_dm *(*alloc_dm)(struct ib_device *device,
2530 struct ib_ucontext *context,
2531 struct ib_dm_alloc_attr *attr,
2532 struct uverbs_attr_bundle *attrs);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03002533 int (*dealloc_dm)(struct ib_dm *dm, struct uverbs_attr_bundle *attrs);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002534 struct ib_mr *(*reg_dm_mr)(struct ib_pd *pd, struct ib_dm *dm,
2535 struct ib_dm_mr_attr *attr,
2536 struct uverbs_attr_bundle *attrs);
2537 struct ib_counters *(*create_counters)(
2538 struct ib_device *device, struct uverbs_attr_bundle *attrs);
2539 int (*destroy_counters)(struct ib_counters *counters);
2540 int (*read_counters)(struct ib_counters *counters,
2541 struct ib_counters_read_attr *counters_read_attr,
2542 struct uverbs_attr_bundle *attrs);
2543 /**
2544 * alloc_hw_stats - Allocate a struct rdma_hw_stats and fill in the
2545 * driver initialized data. The struct is kfree()'ed by the sysfs
2546 * core when the device is removed. A lifespan of -1 in the return
2547 * struct tells the core to set a default lifespan.
2548 */
2549 struct rdma_hw_stats *(*alloc_hw_stats)(struct ib_device *device,
2550 u8 port_num);
2551 /**
2552 * get_hw_stats - Fill in the counter value(s) in the stats struct.
2553 * @index - The index in the value array we wish to have updated, or
2554 * num_counters if we want all stats updated
2555 * Return codes -
2556 * < 0 - Error, no counters updated
2557 * index - Updated the single counter pointed to by index
2558 * num_counters - Updated all counters (will reset the timestamp
2559 * and prevent further calls for lifespan milliseconds)
	 * Drivers are allowed to update all counters in lieu of just the
	 * one given in index at their option
2562 */
2563 int (*get_hw_stats)(struct ib_device *device,
2564 struct rdma_hw_stats *stats, u8 port, int index);
Parav Panditea4baf72018-12-18 14:28:30 +02002565 /*
	 * This function is called once for each port when an ib device is
	 * registered.
2568 */
2569 int (*init_port)(struct ib_device *device, u8 port_num,
2570 struct kobject *port_sysfs);
Leon Romanovsky02da3752019-01-30 12:49:02 +02002571 /**
2572 * Allows rdma drivers to add their own restrack attributes.
2573 */
2574 int (*fill_res_entry)(struct sk_buff *msg,
2575 struct rdma_restrack_entry *entry);
Leon Romanovsky21a428a2019-02-03 14:55:51 +02002576
Jason Gunthorped0899892019-02-12 21:12:53 -07002577 /* Device lifecycle callbacks */
2578 /*
Jason Gunthorpeca223542019-02-12 21:12:56 -07002579 * Called after the device becomes registered, before clients are
2580 * attached
2581 */
2582 int (*enable_driver)(struct ib_device *dev);
2583 /*
Jason Gunthorped0899892019-02-12 21:12:53 -07002584 * This is called as part of ib_dealloc_device().
2585 */
2586 void (*dealloc_driver)(struct ib_device *dev);
2587
Kamal Heibdd05cb82019-04-29 14:59:06 +03002588 /* iWarp CM callbacks */
2589 void (*iw_add_ref)(struct ib_qp *qp);
2590 void (*iw_rem_ref)(struct ib_qp *qp);
2591 struct ib_qp *(*iw_get_qp)(struct ib_device *device, int qpn);
2592 int (*iw_connect)(struct iw_cm_id *cm_id,
2593 struct iw_cm_conn_param *conn_param);
2594 int (*iw_accept)(struct iw_cm_id *cm_id,
2595 struct iw_cm_conn_param *conn_param);
2596 int (*iw_reject)(struct iw_cm_id *cm_id, const void *pdata,
2597 u8 pdata_len);
2598 int (*iw_create_listen)(struct iw_cm_id *cm_id, int backlog);
2599 int (*iw_destroy_listen)(struct iw_cm_id *cm_id);
2600
Leon Romanovskyd3456912019-04-03 16:42:42 +03002601 DECLARE_RDMA_OBJ_SIZE(ib_ah);
Leon Romanovsky21a428a2019-02-03 14:55:51 +02002602 DECLARE_RDMA_OBJ_SIZE(ib_pd);
Leon Romanovsky68e326d2019-04-03 16:42:43 +03002603 DECLARE_RDMA_OBJ_SIZE(ib_srq);
Leon Romanovskya2a074e2019-02-12 20:39:16 +02002604 DECLARE_RDMA_OBJ_SIZE(ib_ucontext);
Kamal Heib521ed0d2018-12-10 21:09:30 +02002605};
2606
Parav Panditcebe5562019-02-26 13:56:11 +02002607struct ib_core_device {
2608 /* device must be the first element in structure until,
2609 * union of ib_core_device and device exists in ib_device.
2610 */
2611 struct device dev;
Parav Pandit4e0f7b92019-02-26 13:56:13 +02002612 possible_net_t rdma_net;
Parav Panditcebe5562019-02-26 13:56:11 +02002613 struct kobject *ports_kobj;
2614 struct list_head port_list;
2615 struct ib_device *owner; /* reach back to owner ib_device */
2616};
Leon Romanovsky41eda652019-02-18 22:25:47 +02002617
Parav Panditcebe5562019-02-26 13:56:11 +02002618struct rdma_restrack_root;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002619struct ib_device {
Bart Van Assche0957c292017-03-07 22:56:53 +00002620 /* Do not access @dma_device directly from ULP nor from HW drivers. */
2621 struct device *dma_device;
Kamal Heib3023a1e2018-12-10 21:09:48 +02002622 struct ib_device_ops ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002623 char name[IB_DEVICE_NAME_MAX];
Jason Gunthorpe324e2272019-02-12 21:12:51 -07002624 struct rcu_head rcu_head;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002625
2626 struct list_head event_handler_list;
2627 spinlock_t event_handler_lock;
2628
Jason Gunthorpe921eab12019-02-06 22:41:54 -07002629 struct rw_semaphore client_data_rwsem;
Jason Gunthorpe0df91bb2019-02-06 22:41:53 -07002630 struct xarray client_data;
Jason Gunthorped0899892019-02-12 21:12:53 -07002631 struct mutex unregistration_lock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002632
2633 struct ib_cache cache;
Ira Weiny77386132015-05-13 20:02:58 -04002634 /**
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002635 * port_data is indexed by port number
Ira Weiny77386132015-05-13 20:02:58 -04002636 */
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002637 struct ib_port_data *port_data;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002638
Michael S. Tsirkinf4fd0b22007-05-03 13:48:47 +03002639 int num_comp_vectors;
2640
Roland Dreiere2773c02005-07-07 17:57:10 -07002641 struct module *owner;
Parav Panditcebe5562019-02-26 13:56:11 +02002642 union {
2643 struct device dev;
2644 struct ib_core_device coredev;
2645 };
2646
Parav Panditd4122f52018-10-11 22:31:53 +03002647 /* First group for device attributes,
2648 * Second group for driver provided attributes (optional).
2649 * It is NULL terminated array.
2650 */
2651 const struct attribute_group *groups[3];
Parav Panditadee9f32018-09-05 09:47:58 +03002652
Roland Dreier274c0892005-09-29 14:17:48 -07002653 int uverbs_abi_ver;
Alexander Chiang17a55f72010-02-02 19:09:16 +00002654 u64 uverbs_cmd_mask;
Yann Droneaudf21519b2013-11-06 23:21:49 +01002655 u64 uverbs_ex_cmd_mask;
Roland Dreier274c0892005-09-29 14:17:48 -07002656
Yuval Shaiabd99fde2016-08-25 10:57:07 -07002657 char node_desc[IB_DEVICE_NODE_DESC_MAX];
Sean Heftycf311cd2006-01-10 07:39:34 -08002658 __be64 node_guid;
Steve Wise96f15c02008-07-14 23:48:53 -07002659 u32 local_dma_lkey;
Hal Rosenstock41390322015-06-29 09:57:00 -04002660 u16 is_switch:1;
Gal Pressman6780c4f2019-01-22 10:08:22 +02002661 /* Indicates kernel verbs support, should not be used in drivers */
2662 u16 kverbs_provider:1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002663 u8 node_type;
2664 u8 phys_port_cnt;
Ira Weiny3e153a92015-12-18 10:59:44 +02002665 struct ib_device_attr attrs;
Christoph Lameterb40f4752016-05-16 12:49:33 -05002666 struct attribute_group *hw_stats_ag;
2667 struct rdma_hw_stats *hw_stats;
Ira Weiny77386132015-05-13 20:02:58 -04002668
Parav Pandit43579b52017-01-10 00:02:14 +00002669#ifdef CONFIG_CGROUP_RDMA
2670 struct rdmacg_device cg_device;
2671#endif
2672
Leon Romanovskyecc82c52017-06-18 14:39:59 +03002673 u32 index;
Leon Romanovsky41eda652019-02-18 22:25:47 +02002674 struct rdma_restrack_root *res;
Leon Romanovskyecc82c52017-06-18 14:39:59 +03002675
Jason Gunthorpe0cbf4322018-11-12 22:59:50 +02002676 const struct uapi_definition *driver_def;
Jason Gunthorped79af722019-01-10 14:02:24 -07002677
Parav Pandit01b67112018-11-16 03:50:57 +02002678 /*
Jason Gunthorped79af722019-01-10 14:02:24 -07002679 * Positive refcount indicates that the device is currently
2680 * registered and cannot be unregistered.
Parav Pandit01b67112018-11-16 03:50:57 +02002681 */
2682 refcount_t refcount;
2683 struct completion unreg_completion;
Jason Gunthorped0899892019-02-12 21:12:53 -07002684 struct work_struct unregistration_work;
Steve Wise3856ec42019-02-15 11:03:53 -08002685
2686 const struct rdma_link_ops *link_ops;
Parav Pandit4e0f7b92019-02-26 13:56:13 +02002687
2688 /* Protects compat_devs xarray modifications */
2689 struct mutex compat_devs_mutex;
2690 /* Maintains compat devices for each net namespace */
2691 struct xarray compat_devs;
Kamal Heibdd05cb82019-04-29 14:59:06 +03002692
2693 /* Used by iWarp CM */
2694 char iw_ifname[IFNAMSIZ];
2695 u32 iw_driver_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002696};
2697
2698struct ib_client {
Jason Gunthorpee59178d2019-02-06 22:41:52 -07002699 const char *name;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002700 void (*add) (struct ib_device *);
Haggai Eran7c1eb452015-07-30 17:50:14 +03002701 void (*remove)(struct ib_device *, void *client_data);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002702
Yotam Kenneth9268f722015-07-30 17:50:15 +03002703 /* Returns the net_dev belonging to this ib_client and matching the
2704 * given parameters.
2705 * @dev: An RDMA device that the net_dev use for communication.
2706 * @port: A physical port number on the RDMA device.
2707 * @pkey: P_Key that the net_dev uses if applicable.
2708 * @gid: A GID that the net_dev uses to communicate.
2709 * @addr: An IP address the net_dev is configured with.
2710 * @client_data: The device's client data set by ib_set_client_data().
2711 *
2712 * An ib_client that implements a net_dev on top of RDMA devices
2713 * (such as IP over IB) should implement this callback, allowing the
2714 * rdma_cm module to find the right net_dev for a given request.
2715 *
2716 * The caller is responsible for calling dev_put on the returned
2717 * netdev. */
2718 struct net_device *(*get_net_dev_by_params)(
2719 struct ib_device *dev,
2720 u8 port,
2721 u16 pkey,
2722 const union ib_gid *gid,
2723 const struct sockaddr *addr,
2724 void *client_data);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002725 struct list_head list;
Jason Gunthorpee59178d2019-02-06 22:41:52 -07002726 u32 client_id;
Gal Pressman6780c4f2019-01-22 10:08:22 +02002727
2728 /* kverbs are not required by the client */
2729 u8 no_kverbs_req:1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002730};
2731
Shiraz Saleema8082732019-05-06 08:53:33 -05002732/*
2733 * IB block DMA iterator
2734 *
2735 * Iterates the DMA-mapped SGL in contiguous memory blocks aligned
2736 * to a HW supported page size.
2737 */
2738struct ib_block_iter {
2739 /* internal states */
2740 struct scatterlist *__sg; /* sg holding the current aligned block */
2741 dma_addr_t __dma_addr; /* unaligned DMA address of this block */
2742 unsigned int __sg_nents; /* number of SG entries */
2743 unsigned int __sg_advance; /* number of bytes to advance in sg in next step */
2744 unsigned int __pg_bit; /* alignment of current block */
2745};
2746
struct ib_device *_ib_alloc_device(size_t size);

/**
 * ib_alloc_device - allocate a driver structure that embeds an ib_device
 * @drv_struct: driver structure tag, written without the "struct" keyword
 * @member: name of the struct ib_device member inside @drv_struct
 *
 * Passes sizeof(struct drv_struct) to _ib_alloc_device() and converts the
 * returned ib_device pointer to the enclosing driver structure with
 * container_of(). The BUILD_BUG_ON_ZERO(offsetof(...)) term contributes 0 to
 * the size and breaks the build unless @member sits at offset 0, so the
 * conversion never adjusts the pointer value.
 */
#define ib_alloc_device(drv_struct, member)                                    \
	container_of(_ib_alloc_device(sizeof(struct drv_struct) +              \
				      BUILD_BUG_ON_ZERO(offsetof(              \
					      struct drv_struct, member))),    \
		     struct drv_struct, member)
2753
/*
 * Device and client lifecycle API. Only the prototypes live in this header;
 * the implementations are elsewhere.
 */
void ib_dealloc_device(struct ib_device *device);

void ib_get_device_fw_str(struct ib_device *device, char *str);

int ib_register_device(struct ib_device *device, const char *name);
void ib_unregister_device(struct ib_device *device);
void ib_unregister_driver(enum rdma_driver_id driver_id);
void ib_unregister_device_and_put(struct ib_device *device);
void ib_unregister_device_queued(struct ib_device *ib_dev);

int ib_register_client(struct ib_client *client);
void ib_unregister_client(struct ib_client *client);
2766
/*
 * Back-end of rdma_for_each_block(): the macro calls
 * __rdma_block_iter_start() once and then __rdma_block_iter_next() as the
 * loop condition.
 */
void __rdma_block_iter_start(struct ib_block_iter *biter,
			     struct scatterlist *sglist,
			     unsigned int nents,
			     unsigned long pgsz);
bool __rdma_block_iter_next(struct ib_block_iter *biter);
2772
2773/**
2774 * rdma_block_iter_dma_address - get the aligned dma address of the current
2775 * block held by the block iterator.
2776 * @biter: block iterator holding the memory block
2777 */
2778static inline dma_addr_t
2779rdma_block_iter_dma_address(struct ib_block_iter *biter)
2780{
2781 return biter->__dma_addr & ~(BIT_ULL(biter->__pg_bit) - 1);
2782}
2783
/**
 * rdma_for_each_block - iterate over contiguous memory blocks of the sg list
 * @sglist: sglist to iterate over
 * @biter: block iterator holding the memory block
 * @nents: maximum number of sg entries to iterate over
 * @pgsz: best HW supported page size to use
 *
 * Expands to a for-loop header: __rdma_block_iter_start() is the init
 * expression and __rdma_block_iter_next() is the loop condition.
 *
 * Callers may use rdma_block_iter_dma_address() to get each
 * block's aligned DMA address.
 */
#define rdma_for_each_block(sglist, biter, nents, pgsz)		\
	for (__rdma_block_iter_start(biter, sglist, nents,	\
				     pgsz);			\
	     __rdma_block_iter_next(biter);)
2798
Jason Gunthorpe0df91bb2019-02-06 22:41:53 -07002799/**
2800 * ib_get_client_data - Get IB client context
2801 * @device:Device to get context for
2802 * @client:Client to get context for
2803 *
2804 * ib_get_client_data() returns the client context data set with
2805 * ib_set_client_data(). This can only be called while the client is
2806 * registered to the device, once the ib_client remove() callback returns this
2807 * cannot be called.
2808 */
2809static inline void *ib_get_client_data(struct ib_device *device,
2810 struct ib_client *client)
2811{
2812 return xa_load(&device->client_data, client->client_id);
2813}
/* Counterpart of ib_get_client_data(); implemented outside this header. */
void ib_set_client_data(struct ib_device *device, struct ib_client *client,
			void *data);
/* Implemented outside this header. */
void ib_set_device_ops(struct ib_device *device,
		       const struct ib_device_ops *ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002818
Jason Gunthorpe5f9794d2018-09-16 20:43:08 +03002819#if IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS)
2820int rdma_user_mmap_io(struct ib_ucontext *ucontext, struct vm_area_struct *vma,
2821 unsigned long pfn, unsigned long size, pgprot_t prot);
Jason Gunthorpe5f9794d2018-09-16 20:43:08 +03002822#else
2823static inline int rdma_user_mmap_io(struct ib_ucontext *ucontext,
2824 struct vm_area_struct *vma,
2825 unsigned long pfn, unsigned long size,
2826 pgprot_t prot)
2827{
2828 return -EINVAL;
2829}
Jason Gunthorpe5f9794d2018-09-16 20:43:08 +03002830#endif
2831
Roland Dreiere2773c02005-07-07 17:57:10 -07002832static inline int ib_copy_from_udata(void *dest, struct ib_udata *udata, size_t len)
2833{
2834 return copy_from_user(dest, udata->inbuf, len) ? -EFAULT : 0;
2835}
2836
2837static inline int ib_copy_to_udata(struct ib_udata *udata, void *src, size_t len)
2838{
Yann Droneaud43c611652015-02-05 22:10:18 +01002839 return copy_to_user(udata->outbuf, src, len) ? -EFAULT : 0;
Roland Dreiere2773c02005-07-07 17:57:10 -07002840}
2841
Matan Barakc66db312018-03-19 15:02:36 +02002842static inline bool ib_is_buffer_cleared(const void __user *p,
2843 size_t len)
Matan Barak301a7212015-12-15 20:30:10 +02002844{
Markus Elfring92d27ae2016-08-22 18:23:24 +02002845 bool ret;
Matan Barak301a7212015-12-15 20:30:10 +02002846 u8 *buf;
2847
2848 if (len > USHRT_MAX)
2849 return false;
2850
Markus Elfring92d27ae2016-08-22 18:23:24 +02002851 buf = memdup_user(p, len);
2852 if (IS_ERR(buf))
Matan Barak301a7212015-12-15 20:30:10 +02002853 return false;
2854
Matan Barak301a7212015-12-15 20:30:10 +02002855 ret = !memchr_inv(buf, 0, len);
Matan Barak301a7212015-12-15 20:30:10 +02002856 kfree(buf);
2857 return ret;
2858}
2859
Matan Barakc66db312018-03-19 15:02:36 +02002860static inline bool ib_is_udata_cleared(struct ib_udata *udata,
2861 size_t offset,
2862 size_t len)
2863{
2864 return ib_is_buffer_cleared(udata->inbuf + offset, len);
2865}
2866
Roland Dreier8a518662006-02-13 12:48:12 -08002867/**
Yishai Hadas1c774832018-06-20 17:11:39 +03002868 * ib_is_destroy_retryable - Check whether the uobject destruction
2869 * is retryable.
2870 * @ret: The initial destruction return code
2871 * @why: remove reason
2872 * @uobj: The uobject that is destroyed
2873 *
2874 * This function is a helper function that IB layer and low-level drivers
2875 * can use to consider whether the destruction of the given uobject is
2876 * retry-able.
2877 * It checks the original return code, if it wasn't success the destruction
2878 * is retryable according to the ucontext state (i.e. cleanup_retryable) and
2879 * the remove reason. (i.e. why).
2880 * Must be called with the object locked for destroy.
2881 */
2882static inline bool ib_is_destroy_retryable(int ret, enum rdma_remove_reason why,
2883 struct ib_uobject *uobj)
2884{
2885 return ret && (why == RDMA_REMOVE_DESTROY ||
2886 uobj->context->cleanup_retryable);
2887}
2888
2889/**
2890 * ib_destroy_usecnt - Called during destruction to check the usecnt
2891 * @usecnt: The usecnt atomic
2892 * @why: remove reason
2893 * @uobj: The uobject that is destroyed
2894 *
2895 * Non-zero usecnts will block destruction unless destruction was triggered by
2896 * a ucontext cleanup.
2897 */
2898static inline int ib_destroy_usecnt(atomic_t *usecnt,
2899 enum rdma_remove_reason why,
2900 struct ib_uobject *uobj)
2901{
2902 if (atomic_read(usecnt) && ib_is_destroy_retryable(-EBUSY, why, uobj))
2903 return -EBUSY;
2904 return 0;
2905}
2906
/**
 * ib_modify_qp_is_ok - Check that the supplied attribute mask
 * contains all required attributes and no attributes not allowed for
 * the given QP state transition.
 * @cur_state: Current QP state
 * @next_state: Next QP state
 * @type: QP type
 * @mask: Mask of supplied QP attributes
 *
 * This function is a helper function that a low-level driver's
 * modify_qp method can use to validate the consumer's input.  It
 * checks that cur_state and next_state are valid QP states, that a
 * transition from cur_state to next_state is allowed by the IB spec,
 * and that the attribute mask supplied is allowed for the transition.
 */
bool ib_modify_qp_is_ok(enum ib_qp_state cur_state, enum ib_qp_state next_state,
			enum ib_qp_type type, enum ib_qp_attr_mask mask);
Roland Dreier8a518662006-02-13 12:48:12 -08002924
Leon Romanovskydcc98812017-08-17 15:50:36 +03002925void ib_register_event_handler(struct ib_event_handler *event_handler);
2926void ib_unregister_event_handler(struct ib_event_handler *event_handler);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002927void ib_dispatch_event(struct ib_event *event);
2928
Linus Torvalds1da177e2005-04-16 15:20:36 -07002929int ib_query_port(struct ib_device *device,
2930 u8 port_num, struct ib_port_attr *port_attr);
2931
Eli Cohena3f5ada2010-09-27 17:51:10 -07002932enum rdma_link_layer rdma_port_get_link_layer(struct ib_device *device,
2933 u8 port_num);
2934
Ira Weiny0cf18d72015-05-13 20:02:55 -04002935/**
Hal Rosenstock41390322015-06-29 09:57:00 -04002936 * rdma_cap_ib_switch - Check if the device is IB switch
2937 * @device: Device to check
2938 *
2939 * Device driver is responsible for setting is_switch bit on
2940 * in ib_device structure at init time.
2941 *
2942 * Return: true if the device is IB switch.
2943 */
2944static inline bool rdma_cap_ib_switch(const struct ib_device *device)
2945{
2946 return device->is_switch;
2947}
2948
2949/**
Ira Weiny0cf18d72015-05-13 20:02:55 -04002950 * rdma_start_port - Return the first valid port number for the device
2951 * specified
2952 *
2953 * @device: Device to be checked
2954 *
2955 * Return start port number
2956 */
2957static inline u8 rdma_start_port(const struct ib_device *device)
2958{
Hal Rosenstock41390322015-06-29 09:57:00 -04002959 return rdma_cap_ib_switch(device) ? 0 : 1;
Ira Weiny0cf18d72015-05-13 20:02:55 -04002960}
2961
/**
 * rdma_for_each_port - Iterate over all valid port numbers of the IB device
 * @device: The struct ib_device * to iterate over
 * @iter: The unsigned int to store the port number
 *
 * Expands to a for-loop header running @iter from rdma_start_port(@device)
 * to rdma_end_port(@device) inclusive. The BUILD_BUG_ON_ZERO() term adds 0
 * to the pointer and breaks the build unless @iter has exactly the type
 * unsigned int. Both arguments are parenthesized so that arbitrary
 * expressions can be passed safely.
 */
#define rdma_for_each_port(device, iter)                                       \
	for ((iter) = rdma_start_port((device) +                               \
			BUILD_BUG_ON_ZERO(!__same_type(unsigned int, iter))); \
	     (iter) <= rdma_end_port(device); (iter)++)
2971
2972/**
Ira Weiny0cf18d72015-05-13 20:02:55 -04002973 * rdma_end_port - Return the last valid port number for the device
2974 * specified
2975 *
2976 * @device: Device to be checked
2977 *
2978 * Return last port number
2979 */
2980static inline u8 rdma_end_port(const struct ib_device *device)
2981{
Hal Rosenstock41390322015-06-29 09:57:00 -04002982 return rdma_cap_ib_switch(device) ? 0 : device->phys_port_cnt;
Ira Weiny0cf18d72015-05-13 20:02:55 -04002983}
2984
/**
 * rdma_is_port_valid - Check that a port number is in range for the device
 * @device: Device to check
 * @port: Port number to check
 *
 * Return: true if @port lies within
 * [rdma_start_port(@device), rdma_end_port(@device)], false otherwise.
 */
static inline bool rdma_is_port_valid(const struct ib_device *device,
				      unsigned int port)
{
	return (port >= rdma_start_port(device) &&
		port <= rdma_end_port(device));
}
2991
Artemy Kovalyovb02289b2018-07-04 15:57:50 +03002992static inline bool rdma_is_grh_required(const struct ib_device *device,
2993 u8 port_num)
2994{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07002995 return device->port_data[port_num].immutable.core_cap_flags &
2996 RDMA_CORE_PORT_IB_GRH_REQUIRED;
Artemy Kovalyovb02289b2018-07-04 15:57:50 +03002997}
2998
Ira Weiny5ede9282015-05-31 17:15:29 -04002999static inline bool rdma_protocol_ib(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02003000{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003001 return device->port_data[port_num].immutable.core_cap_flags &
3002 RDMA_CORE_CAP_PROT_IB;
Michael Wangde66be92015-05-05 14:50:19 +02003003}
3004
Ira Weiny5ede9282015-05-31 17:15:29 -04003005static inline bool rdma_protocol_roce(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02003006{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003007 return device->port_data[port_num].immutable.core_cap_flags &
3008 (RDMA_CORE_CAP_PROT_ROCE | RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP);
Matan Barak7766a992015-12-23 14:56:50 +02003009}
3010
3011static inline bool rdma_protocol_roce_udp_encap(const struct ib_device *device, u8 port_num)
3012{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003013 return device->port_data[port_num].immutable.core_cap_flags &
3014 RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP;
Matan Barak7766a992015-12-23 14:56:50 +02003015}
3016
3017static inline bool rdma_protocol_roce_eth_encap(const struct ib_device *device, u8 port_num)
3018{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003019 return device->port_data[port_num].immutable.core_cap_flags &
3020 RDMA_CORE_CAP_PROT_ROCE;
Michael Wangde66be92015-05-05 14:50:19 +02003021}
3022
Ira Weiny5ede9282015-05-31 17:15:29 -04003023static inline bool rdma_protocol_iwarp(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02003024{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003025 return device->port_data[port_num].immutable.core_cap_flags &
3026 RDMA_CORE_CAP_PROT_IWARP;
Michael Wangde66be92015-05-05 14:50:19 +02003027}
3028
Ira Weiny5ede9282015-05-31 17:15:29 -04003029static inline bool rdma_ib_or_roce(const struct ib_device *device, u8 port_num)
Michael Wangde66be92015-05-05 14:50:19 +02003030{
Matan Barak7766a992015-12-23 14:56:50 +02003031 return rdma_protocol_ib(device, port_num) ||
3032 rdma_protocol_roce(device, port_num);
Michael Wangde66be92015-05-05 14:50:19 +02003033}
3034
Or Gerlitzaa773bd2017-01-24 13:02:35 +02003035static inline bool rdma_protocol_raw_packet(const struct ib_device *device, u8 port_num)
3036{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003037 return device->port_data[port_num].immutable.core_cap_flags &
3038 RDMA_CORE_CAP_PROT_RAW_PACKET;
Or Gerlitzaa773bd2017-01-24 13:02:35 +02003039}
3040
Or Gerlitzce1e0552017-01-24 13:02:38 +02003041static inline bool rdma_protocol_usnic(const struct ib_device *device, u8 port_num)
3042{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003043 return device->port_data[port_num].immutable.core_cap_flags &
3044 RDMA_CORE_CAP_PROT_USNIC;
Or Gerlitzce1e0552017-01-24 13:02:38 +02003045}
3046
Michael Wangc757dea2015-05-05 14:50:32 +02003047/**
Michael Wang296ec002015-05-18 10:41:45 +02003048 * rdma_cap_ib_mad - Check if the port of a device supports Infiniband
Michael Wangc757dea2015-05-05 14:50:32 +02003049 * Management Datagrams.
Michael Wang296ec002015-05-18 10:41:45 +02003050 * @device: Device to check
3051 * @port_num: Port number to check
Michael Wangc757dea2015-05-05 14:50:32 +02003052 *
Michael Wang296ec002015-05-18 10:41:45 +02003053 * Management Datagrams (MAD) are a required part of the InfiniBand
3054 * specification and are supported on all InfiniBand devices. A slightly
3055 * extended version are also supported on OPA interfaces.
Michael Wangc757dea2015-05-05 14:50:32 +02003056 *
Michael Wang296ec002015-05-18 10:41:45 +02003057 * Return: true if the port supports sending/receiving of MAD packets.
Michael Wangc757dea2015-05-05 14:50:32 +02003058 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003059static inline bool rdma_cap_ib_mad(const struct ib_device *device, u8 port_num)
Michael Wangc757dea2015-05-05 14:50:32 +02003060{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003061 return device->port_data[port_num].immutable.core_cap_flags &
3062 RDMA_CORE_CAP_IB_MAD;
Michael Wangc757dea2015-05-05 14:50:32 +02003063}
3064
Michael Wang29541e32015-05-05 14:50:33 +02003065/**
Ira Weiny65995fe2015-06-06 14:38:32 -04003066 * rdma_cap_opa_mad - Check if the port of device provides support for OPA
3067 * Management Datagrams.
3068 * @device: Device to check
3069 * @port_num: Port number to check
3070 *
3071 * Intel OmniPath devices extend and/or replace the InfiniBand Management
3072 * datagrams with their own versions. These OPA MADs share many but not all of
3073 * the characteristics of InfiniBand MADs.
3074 *
3075 * OPA MADs differ in the following ways:
3076 *
3077 * 1) MADs are variable size up to 2K
3078 * IBTA defined MADs remain fixed at 256 bytes
3079 * 2) OPA SMPs must carry valid PKeys
3080 * 3) OPA SMP packets are a different format
3081 *
3082 * Return: true if the port supports OPA MAD packet formats.
3083 */
3084static inline bool rdma_cap_opa_mad(struct ib_device *device, u8 port_num)
3085{
Leon Romanovskyd3243da2019-03-10 17:27:46 +02003086 return device->port_data[port_num].immutable.core_cap_flags &
3087 RDMA_CORE_CAP_OPA_MAD;
Ira Weiny65995fe2015-06-06 14:38:32 -04003088}
3089
3090/**
Michael Wang296ec002015-05-18 10:41:45 +02003091 * rdma_cap_ib_smi - Check if the port of a device provides an Infiniband
3092 * Subnet Management Agent (SMA) on the Subnet Management Interface (SMI).
3093 * @device: Device to check
3094 * @port_num: Port number to check
Michael Wang29541e32015-05-05 14:50:33 +02003095 *
Michael Wang296ec002015-05-18 10:41:45 +02003096 * Each InfiniBand node is required to provide a Subnet Management Agent
3097 * that the subnet manager can access. Prior to the fabric being fully
3098 * configured by the subnet manager, the SMA is accessed via a well known
3099 * interface called the Subnet Management Interface (SMI). This interface
3100 * uses directed route packets to communicate with the SM to get around the
3101 * chicken and egg problem of the SM needing to know what's on the fabric
3102 * in order to configure the fabric, and needing to configure the fabric in
3103 * order to send packets to the devices on the fabric. These directed
3104 * route packets do not need the fabric fully configured in order to reach
3105 * their destination. The SMI is the only method allowed to send
3106 * directed route packets on an InfiniBand fabric.
Michael Wang29541e32015-05-05 14:50:33 +02003107 *
Michael Wang296ec002015-05-18 10:41:45 +02003108 * Return: true if the port provides an SMI.
Michael Wang29541e32015-05-05 14:50:33 +02003109 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003110static inline bool rdma_cap_ib_smi(const struct ib_device *device, u8 port_num)
Michael Wang29541e32015-05-05 14:50:33 +02003111{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003112 return device->port_data[port_num].immutable.core_cap_flags &
3113 RDMA_CORE_CAP_IB_SMI;
Michael Wang29541e32015-05-05 14:50:33 +02003114}
3115
Michael Wang72219cea2015-05-05 14:50:34 +02003116/**
3117 * rdma_cap_ib_cm - Check if the port of device has the capability Infiniband
3118 * Communication Manager.
Michael Wang296ec002015-05-18 10:41:45 +02003119 * @device: Device to check
3120 * @port_num: Port number to check
Michael Wang72219cea2015-05-05 14:50:34 +02003121 *
Michael Wang296ec002015-05-18 10:41:45 +02003122 * The InfiniBand Communication Manager is one of many pre-defined General
3123 * Service Agents (GSA) that are accessed via the General Service
3124 * Interface (GSI). It's role is to facilitate establishment of connections
3125 * between nodes as well as other management related tasks for established
3126 * connections.
Michael Wang72219cea2015-05-05 14:50:34 +02003127 *
Michael Wang296ec002015-05-18 10:41:45 +02003128 * Return: true if the port supports an IB CM (this does not guarantee that
3129 * a CM is actually running however).
Michael Wang72219cea2015-05-05 14:50:34 +02003130 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003131static inline bool rdma_cap_ib_cm(const struct ib_device *device, u8 port_num)
Michael Wang72219cea2015-05-05 14:50:34 +02003132{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003133 return device->port_data[port_num].immutable.core_cap_flags &
3134 RDMA_CORE_CAP_IB_CM;
Michael Wang72219cea2015-05-05 14:50:34 +02003135}
3136
Michael Wang04215332015-05-05 14:50:35 +02003137/**
3138 * rdma_cap_iw_cm - Check if the port of device has the capability IWARP
3139 * Communication Manager.
Michael Wang296ec002015-05-18 10:41:45 +02003140 * @device: Device to check
3141 * @port_num: Port number to check
Michael Wang04215332015-05-05 14:50:35 +02003142 *
Michael Wang296ec002015-05-18 10:41:45 +02003143 * Similar to above, but specific to iWARP connections which have a different
3144 * managment protocol than InfiniBand.
Michael Wang04215332015-05-05 14:50:35 +02003145 *
Michael Wang296ec002015-05-18 10:41:45 +02003146 * Return: true if the port supports an iWARP CM (this does not guarantee that
3147 * a CM is actually running however).
Michael Wang04215332015-05-05 14:50:35 +02003148 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003149static inline bool rdma_cap_iw_cm(const struct ib_device *device, u8 port_num)
Michael Wang04215332015-05-05 14:50:35 +02003150{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003151 return device->port_data[port_num].immutable.core_cap_flags &
3152 RDMA_CORE_CAP_IW_CM;
Michael Wang04215332015-05-05 14:50:35 +02003153}
3154
Michael Wangfe53ba22015-05-05 14:50:36 +02003155/**
3156 * rdma_cap_ib_sa - Check if the port of device has the capability Infiniband
3157 * Subnet Administration.
Michael Wang296ec002015-05-18 10:41:45 +02003158 * @device: Device to check
3159 * @port_num: Port number to check
Michael Wangfe53ba22015-05-05 14:50:36 +02003160 *
Michael Wang296ec002015-05-18 10:41:45 +02003161 * An InfiniBand Subnet Administration (SA) service is a pre-defined General
3162 * Service Agent (GSA) provided by the Subnet Manager (SM). On InfiniBand
3163 * fabrics, devices should resolve routes to other hosts by contacting the
3164 * SA to query the proper route.
Michael Wangfe53ba22015-05-05 14:50:36 +02003165 *
Michael Wang296ec002015-05-18 10:41:45 +02003166 * Return: true if the port should act as a client to the fabric Subnet
3167 * Administration interface. This does not imply that the SA service is
3168 * running locally.
Michael Wangfe53ba22015-05-05 14:50:36 +02003169 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003170static inline bool rdma_cap_ib_sa(const struct ib_device *device, u8 port_num)
Michael Wangfe53ba22015-05-05 14:50:36 +02003171{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003172 return device->port_data[port_num].immutable.core_cap_flags &
3173 RDMA_CORE_CAP_IB_SA;
Michael Wangfe53ba22015-05-05 14:50:36 +02003174}
3175
/**
 * rdma_cap_ib_mcast - Check if the port of device has the capability InfiniBand
 * Multicast.
 * @device: Device to check
 * @port_num: Port number to check
 *
 * InfiniBand multicast registration is more complex than normal IPv4 or
 * IPv6 multicast registration.  Each Host Channel Adapter must register
 * with the Subnet Manager when it wishes to join a multicast group.  It
 * should do so only once regardless of how many queue pairs it subscribes
 * to this group.  And it should leave the group only after all queue pairs
 * attached to the group have been detached.
 *
 * Return: true if the port must undertake the additional administrative
 * overhead of registering/unregistering with the SM and tracking of the
 * total number of queue pairs attached to the multicast group.
 */
static inline bool rdma_cap_ib_mcast(const struct ib_device *device, u8 port_num)
{
	/* The answer is exactly the SA capability check for the same port. */
	return rdma_cap_ib_sa(device, port_num);
}
3197
Michael Wangbc0f1d72015-05-05 14:50:38 +02003198/**
Michael Wang30a74ef2015-05-05 14:50:39 +02003199 * rdma_cap_af_ib - Check if the port of device has the capability
3200 * Native Infiniband Address.
Michael Wang296ec002015-05-18 10:41:45 +02003201 * @device: Device to check
3202 * @port_num: Port number to check
Michael Wang30a74ef2015-05-05 14:50:39 +02003203 *
Michael Wang296ec002015-05-18 10:41:45 +02003204 * InfiniBand addressing uses a port's GUID + Subnet Prefix to make a default
3205 * GID. RoCE uses a different mechanism, but still generates a GID via
3206 * a prescribed mechanism and port specific data.
Michael Wang30a74ef2015-05-05 14:50:39 +02003207 *
Michael Wang296ec002015-05-18 10:41:45 +02003208 * Return: true if the port uses a GID address to identify devices on the
3209 * network.
Michael Wang30a74ef2015-05-05 14:50:39 +02003210 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003211static inline bool rdma_cap_af_ib(const struct ib_device *device, u8 port_num)
Michael Wang30a74ef2015-05-05 14:50:39 +02003212{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003213 return device->port_data[port_num].immutable.core_cap_flags &
3214 RDMA_CORE_CAP_AF_IB;
Michael Wang30a74ef2015-05-05 14:50:39 +02003215}
3216
3217/**
Michael Wang227128f2015-05-05 14:50:40 +02003218 * rdma_cap_eth_ah - Check if the port of device has the capability
Michael Wang296ec002015-05-18 10:41:45 +02003219 * Ethernet Address Handle.
3220 * @device: Device to check
3221 * @port_num: Port number to check
Michael Wang227128f2015-05-05 14:50:40 +02003222 *
Michael Wang296ec002015-05-18 10:41:45 +02003223 * RoCE is InfiniBand over Ethernet, and it uses a well defined technique
3224 * to fabricate GIDs over Ethernet/IP specific addresses native to the
3225 * port. Normally, packet headers are generated by the sending host
3226 * adapter, but when sending connectionless datagrams, we must manually
3227 * inject the proper headers for the fabric we are communicating over.
Michael Wang227128f2015-05-05 14:50:40 +02003228 *
Michael Wang296ec002015-05-18 10:41:45 +02003229 * Return: true if we are running as a RoCE port and must force the
3230 * addition of a Global Route Header built from our Ethernet Address
3231 * Handle into our header list for connectionless packets.
Michael Wang227128f2015-05-05 14:50:40 +02003232 */
Ira Weiny5ede9282015-05-31 17:15:29 -04003233static inline bool rdma_cap_eth_ah(const struct ib_device *device, u8 port_num)
Michael Wang227128f2015-05-05 14:50:40 +02003234{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003235 return device->port_data[port_num].immutable.core_cap_flags &
3236 RDMA_CORE_CAP_ETH_AH;
Michael Wang227128f2015-05-05 14:50:40 +02003237}
3238
3239/**
Dasaratharaman Chandramouli94d595c2017-03-20 19:38:09 -04003240 * rdma_cap_opa_ah - Check if the port of device supports
3241 * OPA Address handles
3242 * @device: Device to check
3243 * @port_num: Port number to check
3244 *
3245 * Return: true if we are running on an OPA device which supports
3246 * the extended OPA addressing.
3247 */
3248static inline bool rdma_cap_opa_ah(struct ib_device *device, u8 port_num)
3249{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003250 return (device->port_data[port_num].immutable.core_cap_flags &
Dasaratharaman Chandramouli94d595c2017-03-20 19:38:09 -04003251 RDMA_CORE_CAP_OPA_AH) == RDMA_CORE_CAP_OPA_AH;
3252}
3253
3254/**
Ira Weiny337877a2015-06-06 14:38:29 -04003255 * rdma_max_mad_size - Return the max MAD size required by this RDMA Port.
3256 *
3257 * @device: Device
3258 * @port_num: Port number
3259 *
3260 * This MAD size includes the MAD headers and MAD payload. No other headers
3261 * are included.
3262 *
3263 * Return the max MAD size required by the Port. Will return 0 if the port
3264 * does not support MADs
3265 */
3266static inline size_t rdma_max_mad_size(const struct ib_device *device, u8 port_num)
3267{
Jason Gunthorpe8ceb1352019-02-12 21:12:48 -07003268 return device->port_data[port_num].immutable.max_mad_size;
Ira Weiny337877a2015-06-06 14:38:29 -04003269}
3270
Matan Barak03db3a22015-07-30 18:33:26 +03003271/**
3272 * rdma_cap_roce_gid_table - Check if the port of device uses roce_gid_table
3273 * @device: Device to check
3274 * @port_num: Port number to check
3275 *
3276 * RoCE GID table mechanism manages the various GIDs for a device.
3277 *
3278 * NOTE: if allocating the port's GID table has failed, this call will still
3279 * return true, but any RoCE GID table API will fail.
3280 *
3281 * Return: true if the port uses RoCE GID table mechanism in order to manage
3282 * its GIDs.
3283 */
3284static inline bool rdma_cap_roce_gid_table(const struct ib_device *device,
3285 u8 port_num)
3286{
3287 return rdma_protocol_roce(device, port_num) &&
Kamal Heib3023a1e2018-12-10 21:09:48 +02003288 device->ops.add_gid && device->ops.del_gid;
Matan Barak03db3a22015-07-30 18:33:26 +03003289}
3290
Christoph Hellwig002516e2016-05-03 18:01:05 +02003291/*
3292 * Check if the device supports READ W/ INVALIDATE.
3293 */
3294static inline bool rdma_cap_read_inv(struct ib_device *dev, u32 port_num)
3295{
3296 /*
3297 * iWarp drivers must support READ W/ INVALIDATE. No other protocol
3298 * has support for it yet.
3299 */
3300 return rdma_protocol_iwarp(dev, port_num);
3301}
3302
/**
 * rdma_find_pg_bit - Find page bit given address and HW supported page sizes
 * @addr: address
 * @pgsz_bitmap: bitmap of HW supported page sizes
 *
 * Return: the bit index of the largest page size in @pgsz_bitmap that @addr
 * is aligned to.  If @addr is not aligned to any supported size, the bit
 * index of the smallest supported page size is returned instead.
 *
 * NOTE: @pgsz_bitmap is expected to be non-zero; the fallback path hands it
 * straight to __ffs().
 */
static inline unsigned int rdma_find_pg_bit(unsigned long addr,
					    unsigned long pgsz_bitmap)
{
	/* Lowest set bit of addr, i.e. its natural alignment (0 if addr is 0). */
	unsigned long lowest = addr & -addr;
	/*
	 * Drop every page size above that alignment: -lowest << 1 covers all
	 * bits strictly higher than the alignment bit.
	 */
	unsigned long usable = pgsz_bitmap & ~(-lowest << 1);

	return usable ? __fls(usable) : __ffs(pgsz_bitmap);
}
3326
Eli Cohen50174a72016-03-11 22:58:38 +02003327int ib_set_vf_link_state(struct ib_device *device, int vf, u8 port,
3328 int state);
3329int ib_get_vf_config(struct ib_device *device, int vf, u8 port,
3330 struct ifla_vf_info *info);
3331int ib_get_vf_stats(struct ib_device *device, int vf, u8 port,
3332 struct ifla_vf_stats *stats);
3333int ib_set_vf_guid(struct ib_device *device, int vf, u8 port, u64 guid,
3334 int type);
3335
Linus Torvalds1da177e2005-04-16 15:20:36 -07003336int ib_query_pkey(struct ib_device *device,
3337 u8 port_num, u16 index, u16 *pkey);
3338
3339int ib_modify_device(struct ib_device *device,
3340 int device_modify_mask,
3341 struct ib_device_modify *device_modify);
3342
3343int ib_modify_port(struct ib_device *device,
3344 u8 port_num, int port_modify_mask,
3345 struct ib_port_modify *port_modify);
3346
Yosef Etigin5eb620c2007-05-14 07:26:51 +03003347int ib_find_gid(struct ib_device *device, union ib_gid *gid,
Parav Panditb26c4a12018-03-13 16:06:12 +02003348 u8 *port_num, u16 *index);
Yosef Etigin5eb620c2007-05-14 07:26:51 +03003349
3350int ib_find_pkey(struct ib_device *device,
3351 u8 port_num, u16 pkey, u16 *index);
3352
/* Flag bits for protection domain allocation. */
enum ib_pd_flags {
	/*
	 * Create a memory registration for all memory in the system and place
	 * the rkey for it into pd->unsafe_global_rkey.  This can be used by
	 * ULPs to avoid the overhead of dynamic MRs.
	 *
	 * This flag is generally considered unsafe and must only be used in
	 * extremely trusted environments.  Every use of it will log a warning
	 * in the kernel log.
	 */
	IB_PD_UNSAFE_GLOBAL_RKEY	= 0x01,
};
Linus Torvalds1da177e2005-04-16 15:20:36 -07003365
/*
 * Backend of the ib_alloc_pd() macro.  @caller is a string identifying the
 * requester; the macro supplies KBUILD_MODNAME for it.
 * NOTE(review): @flags presumably takes enum ib_pd_flags bits - confirm
 * against the implementation.
 */
struct ib_pd *__ib_alloc_pd(struct ib_device *device, unsigned int flags,
		const char *caller);

/* Calls __ib_alloc_pd() with the calling module's KBUILD_MODNAME as caller. */
#define ib_alloc_pd(device, flags) \
	__ib_alloc_pd((device), (flags), KBUILD_MODNAME)
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003371
3372/**
3373 * ib_dealloc_pd_user - Deallocate kernel/user PD
3374 * @pd: The protection domain
3375 * @udata: Valid user data or NULL for kernel objects
3376 */
3377void ib_dealloc_pd_user(struct ib_pd *pd, struct ib_udata *udata);
3378
/**
 * ib_dealloc_pd - Deallocate kernel PD
 * @pd: The protection domain
 *
 * Calls ib_dealloc_pd_user() with a NULL udata.
 *
 * NOTE: for user PD use ib_dealloc_pd_user with valid udata!
 */
static inline void ib_dealloc_pd(struct ib_pd *pd)
{
	ib_dealloc_pd_user(pd, NULL);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003389
/* Flag bits accepted in the @flags argument of rdma_create_ah(). */
enum rdma_create_ah_flags {
	/* In a sleepable context */
	RDMA_CREATE_AH_SLEEPABLE = BIT(0),
};
3394
Linus Torvalds1da177e2005-04-16 15:20:36 -07003395/**
Dasaratharaman Chandramouli0a18cfe2017-04-29 14:41:19 -04003396 * rdma_create_ah - Creates an address handle for the given address vector.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003397 * @pd: The protection domain associated with the address handle.
3398 * @ah_attr: The attributes of the address vector.
Gal Pressmanb090c4e2018-12-12 11:09:05 +02003399 * @flags: Create address handle flags (see enum rdma_create_ah_flags).
Linus Torvalds1da177e2005-04-16 15:20:36 -07003400 *
3401 * The address handle is used to reference a local or global destination
3402 * in all UD QP post sends.
3403 */
Gal Pressmanb090c4e2018-12-12 11:09:05 +02003404struct ib_ah *rdma_create_ah(struct ib_pd *pd, struct rdma_ah_attr *ah_attr,
3405 u32 flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003406
3407/**
Parav Pandit5cda6582017-10-16 08:45:12 +03003408 * rdma_create_user_ah - Creates an address handle for the given address vector.
3409 * It resolves destination mac address for ah attribute of RoCE type.
3410 * @pd: The protection domain associated with the address handle.
3411 * @ah_attr: The attributes of the address vector.
 * @udata: pointer to the user's input/output buffer information needed by
 *         the provider driver.
3414 *
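 * Returns a pointer to the created address handle on success.  On failure
 * the return value is presumably an ERR_PTR()-encoded error code (confirm
 * against the implementation).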
3416 * The address handle is used to reference a local or global destination
3417 * in all UD QP post sends.
3418 */
3419struct ib_ah *rdma_create_user_ah(struct ib_pd *pd,
3420 struct rdma_ah_attr *ah_attr,
3421 struct ib_udata *udata);
3422/**
Moni Shoua850d8fd2016-11-10 11:30:56 +02003423 * ib_get_gids_from_rdma_hdr - Get sgid and dgid from GRH or IPv4 header
3424 * work completion.
3425 * @hdr: the L3 header to parse
3426 * @net_type: type of header to parse
3427 * @sgid: place to store source gid
3428 * @dgid: place to store destination gid
3429 */
3430int ib_get_gids_from_rdma_hdr(const union rdma_network_hdr *hdr,
3431 enum rdma_network_type net_type,
3432 union ib_gid *sgid, union ib_gid *dgid);
3433
3434/**
3435 * ib_get_rdma_header_version - Get the header version
3436 * @hdr: the L3 header to parse
3437 */
3438int ib_get_rdma_header_version(const union rdma_network_hdr *hdr);
3439
3440/**
Parav Panditf6bdb142017-11-14 14:52:17 +02003441 * ib_init_ah_attr_from_wc - Initializes address handle attributes from a
Sean Hefty4e00d692006-06-17 20:37:39 -07003442 * work completion.
3443 * @device: Device on which the received message arrived.
3444 * @port_num: Port on which the received message arrived.
3445 * @wc: Work completion associated with the received message.
3446 * @grh: References the received global route header. This parameter is
3447 * ignored unless the work completion indicates that the GRH is valid.
3448 * @ah_attr: Returned attributes that can be used when creating an address
3449 * handle for replying to the message.
Parav Panditb7403212018-06-19 10:59:14 +03003450 * When ib_init_ah_attr_from_wc() returns success,
3451 * (a) for IB link layer it optionally contains a reference to SGID attribute
3452 * when GRH is present for IB link layer.
3453 * (b) for RoCE link layer it contains a reference to SGID attribute.
3454 * User must invoke rdma_cleanup_ah_attr_gid_attr() to release reference to SGID
3455 * attributes which are initialized using ib_init_ah_attr_from_wc().
3456 *
Sean Hefty4e00d692006-06-17 20:37:39 -07003457 */
Parav Panditf6bdb142017-11-14 14:52:17 +02003458int ib_init_ah_attr_from_wc(struct ib_device *device, u8 port_num,
3459 const struct ib_wc *wc, const struct ib_grh *grh,
3460 struct rdma_ah_attr *ah_attr);
Sean Hefty4e00d692006-06-17 20:37:39 -07003461
3462/**
Hal Rosenstock513789e2005-07-27 11:45:34 -07003463 * ib_create_ah_from_wc - Creates an address handle associated with the
3464 * sender of the specified work completion.
3465 * @pd: The protection domain associated with the address handle.
3466 * @wc: Work completion information associated with a received message.
3467 * @grh: References the received global route header. This parameter is
3468 * ignored unless the work completion indicates that the GRH is valid.
3469 * @port_num: The outbound port number to associate with the address.
3470 *
3471 * The address handle is used to reference a local or global destination
3472 * in all UD QP post sends.
3473 */
Ira Weiny73cdaae2015-05-31 17:15:31 -04003474struct ib_ah *ib_create_ah_from_wc(struct ib_pd *pd, const struct ib_wc *wc,
3475 const struct ib_grh *grh, u8 port_num);
Hal Rosenstock513789e2005-07-27 11:45:34 -07003476
3477/**
Dasaratharaman Chandramouli67b985b2017-04-29 14:41:20 -04003478 * rdma_modify_ah - Modifies the address vector associated with an address
Linus Torvalds1da177e2005-04-16 15:20:36 -07003479 * handle.
3480 * @ah: The address handle to modify.
3481 * @ah_attr: The new address vector attributes to associate with the
3482 * address handle.
3483 */
Dasaratharaman Chandramouli67b985b2017-04-29 14:41:20 -04003484int rdma_modify_ah(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003485
3486/**
Dasaratharaman Chandramoulibfbfd662017-04-29 14:41:21 -04003487 * rdma_query_ah - Queries the address vector associated with an address
Linus Torvalds1da177e2005-04-16 15:20:36 -07003488 * handle.
3489 * @ah: The address handle to query.
3490 * @ah_attr: The address vector attributes associated with the address
3491 * handle.
3492 */
Dasaratharaman Chandramoulibfbfd662017-04-29 14:41:21 -04003493int rdma_query_ah(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003494
/*
 * Flag bits accepted in the @flags argument of rdma_destroy_ah_user() and
 * rdma_destroy_ah().
 */
enum rdma_destroy_ah_flags {
	/* In a sleepable context */
	RDMA_DESTROY_AH_SLEEPABLE = BIT(0),
};
3499
Linus Torvalds1da177e2005-04-16 15:20:36 -07003500/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003501 * rdma_destroy_ah_user - Destroys an address handle.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003502 * @ah: The address handle to destroy.
Gal Pressman2553ba22018-12-12 11:09:06 +02003503 * @flags: Destroy address handle flags (see enum rdma_destroy_ah_flags).
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003504 * @udata: Valid user data or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003505 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003506int rdma_destroy_ah_user(struct ib_ah *ah, u32 flags, struct ib_udata *udata);
3507
/**
 * rdma_destroy_ah - Destroys a kernel address handle.
 * @ah: The address handle to destroy.
 * @flags: Destroy address handle flags (see enum rdma_destroy_ah_flags).
 *
 * Calls rdma_destroy_ah_user() with a NULL udata and returns its result.
 *
 * NOTE: for user ah use rdma_destroy_ah_user with valid udata!
 */
static inline int rdma_destroy_ah(struct ib_ah *ah, u32 flags)
{
	return rdma_destroy_ah_user(ah, flags, NULL);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003519
3520/**
Roland Dreierd41fcc62005-08-18 12:23:08 -07003521 * ib_create_srq - Creates a SRQ associated with the specified protection
3522 * domain.
3523 * @pd: The protection domain associated with the SRQ.
Dotan Barakabb6e9b2006-02-23 12:13:51 -08003524 * @srq_init_attr: A list of initial attributes required to create the
3525 * SRQ. If SRQ creation succeeds, then the attributes are updated to
3526 * the actual capabilities of the created SRQ.
Roland Dreierd41fcc62005-08-18 12:23:08 -07003527 *
 * srq_attr->max_wr and srq_attr->max_sge are read to determine the
3529 * requested size of the SRQ, and set to the actual values allocated
3530 * on return. If ib_create_srq() succeeds, then max_wr and max_sge
3531 * will always be at least as large as the requested values.
3532 */
3533struct ib_srq *ib_create_srq(struct ib_pd *pd,
3534 struct ib_srq_init_attr *srq_init_attr);
3535
3536/**
3537 * ib_modify_srq - Modifies the attributes for the specified SRQ.
3538 * @srq: The SRQ to modify.
3539 * @srq_attr: On input, specifies the SRQ attributes to modify. On output,
3540 * the current values of selected SRQ attributes are returned.
3541 * @srq_attr_mask: A bit-mask used to specify which attributes of the SRQ
3542 * are being modified.
3543 *
3544 * The mask may contain IB_SRQ_MAX_WR to resize the SRQ and/or
3545 * IB_SRQ_LIMIT to set the SRQ's limit and request notification when
3546 * the number of receives queued drops below the limit.
3547 */
3548int ib_modify_srq(struct ib_srq *srq,
3549 struct ib_srq_attr *srq_attr,
3550 enum ib_srq_attr_mask srq_attr_mask);
3551
3552/**
3553 * ib_query_srq - Returns the attribute list and current values for the
3554 * specified SRQ.
3555 * @srq: The SRQ to query.
3556 * @srq_attr: The attributes of the specified SRQ.
3557 */
3558int ib_query_srq(struct ib_srq *srq,
3559 struct ib_srq_attr *srq_attr);
3560
3561/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003562 * ib_destroy_srq_user - Destroys the specified SRQ.
Roland Dreierd41fcc62005-08-18 12:23:08 -07003563 * @srq: The SRQ to destroy.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003564 * @udata: Valid user data or NULL for kernel objects
Roland Dreierd41fcc62005-08-18 12:23:08 -07003565 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003566int ib_destroy_srq_user(struct ib_srq *srq, struct ib_udata *udata);
3567
/**
 * ib_destroy_srq - Destroys the specified kernel SRQ.
 * @srq: The SRQ to destroy.
 *
 * Calls ib_destroy_srq_user() with a NULL udata and returns its result.
 *
 * NOTE: for user srq use ib_destroy_srq_user with valid udata!
 */
static inline int ib_destroy_srq(struct ib_srq *srq)
{
	return ib_destroy_srq_user(srq, NULL);
}
Roland Dreierd41fcc62005-08-18 12:23:08 -07003578
3579/**
3580 * ib_post_srq_recv - Posts a list of work requests to the specified SRQ.
3581 * @srq: The SRQ to post the work request on.
3582 * @recv_wr: A list of work requests to post on the receive queue.
3583 * @bad_recv_wr: On an immediate failure, this parameter will reference
3584 * the work request that failed to be posted on the QP.
3585 */
3586static inline int ib_post_srq_recv(struct ib_srq *srq,
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003587 const struct ib_recv_wr *recv_wr,
3588 const struct ib_recv_wr **bad_recv_wr)
Roland Dreierd41fcc62005-08-18 12:23:08 -07003589{
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003590 const struct ib_recv_wr *dummy;
Bart Van Asschebb039a82018-07-18 09:25:16 -07003591
Kamal Heib3023a1e2018-12-10 21:09:48 +02003592 return srq->device->ops.post_srq_recv(srq, recv_wr,
3593 bad_recv_wr ? : &dummy);
Roland Dreierd41fcc62005-08-18 12:23:08 -07003594}
3595
3596/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003597 * ib_create_qp_user - Creates a QP associated with the specified protection
Linus Torvalds1da177e2005-04-16 15:20:36 -07003598 * domain.
3599 * @pd: The protection domain associated with the QP.
Dotan Barakabb6e9b2006-02-23 12:13:51 -08003600 * @qp_init_attr: A list of initial attributes required to create the
3601 * QP. If QP creation succeeds, then the attributes are updated to
3602 * the actual capabilities of the created QP.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003603 * @udata: Valid user data or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003604 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003605struct ib_qp *ib_create_qp_user(struct ib_pd *pd,
3606 struct ib_qp_init_attr *qp_init_attr,
3607 struct ib_udata *udata);
3608
/**
 * ib_create_qp - Creates a kernel QP associated with the specified protection
 *   domain.
 * @pd: The protection domain associated with the QP.
 * @qp_init_attr: A list of initial attributes required to create the
 *   QP.  If QP creation succeeds, then the attributes are updated to
 *   the actual capabilities of the created QP.
 *
 * Calls ib_create_qp_user() with a NULL udata and returns its result.
 *
 * NOTE: for user qp use ib_create_qp_user with valid udata!
 */
static inline struct ib_qp *ib_create_qp(struct ib_pd *pd,
					 struct ib_qp_init_attr *qp_init_attr)
{
	return ib_create_qp_user(pd, qp_init_attr, NULL);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003625
3626/**
Parav Pandita512c2f2017-05-23 11:26:08 +03003627 * ib_modify_qp_with_udata - Modifies the attributes for the specified QP.
3628 * @qp: The QP to modify.
3629 * @attr: On input, specifies the QP attributes to modify. On output,
3630 * the current values of selected QP attributes are returned.
3631 * @attr_mask: A bit-mask used to specify which attributes of the QP
3632 * are being modified.
 * @udata: pointer to the user's input/output buffer information.
 *
3635 * It returns 0 on success and returns appropriate error code on error.
3636 */
3637int ib_modify_qp_with_udata(struct ib_qp *qp,
3638 struct ib_qp_attr *attr,
3639 int attr_mask,
3640 struct ib_udata *udata);
3641
3642/**
Linus Torvalds1da177e2005-04-16 15:20:36 -07003643 * ib_modify_qp - Modifies the attributes for the specified QP and then
3644 * transitions the QP to the given state.
3645 * @qp: The QP to modify.
3646 * @qp_attr: On input, specifies the QP attributes to modify. On output,
3647 * the current values of selected QP attributes are returned.
3648 * @qp_attr_mask: A bit-mask used to specify which attributes of the QP
3649 * are being modified.
3650 */
3651int ib_modify_qp(struct ib_qp *qp,
3652 struct ib_qp_attr *qp_attr,
3653 int qp_attr_mask);
3654
3655/**
3656 * ib_query_qp - Returns the attribute list and current values for the
3657 * specified QP.
3658 * @qp: The QP to query.
3659 * @qp_attr: The attributes of the specified QP.
3660 * @qp_attr_mask: A bit-mask used to select specific attributes to query.
3661 * @qp_init_attr: Additional attributes of the selected QP.
3662 *
3663 * The qp_attr_mask may be used to limit the query to gathering only the
3664 * selected attributes.
3665 */
3666int ib_query_qp(struct ib_qp *qp,
3667 struct ib_qp_attr *qp_attr,
3668 int qp_attr_mask,
3669 struct ib_qp_init_attr *qp_init_attr);
3670
3671/**
 * ib_destroy_qp_user - Destroys the specified QP.
3673 * @qp: The QP to destroy.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003674 * @udata: Valid udata or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003675 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003676int ib_destroy_qp_user(struct ib_qp *qp, struct ib_udata *udata);
3677
/**
 * ib_destroy_qp - Destroy a QP that belongs to a kernel consumer.
 * @qp: The QP to destroy.
 *
 * Forwards to ib_destroy_qp_user() with a NULL udata and returns its result.
 *
 * NOTE: for user qp use ib_destroy_qp_user with valid udata!
 */
static inline int ib_destroy_qp(struct ib_qp *qp)
{
	struct ib_udata *no_udata = NULL;

	return ib_destroy_qp_user(qp, no_udata);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003688
3689/**
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07003690 * ib_open_qp - Obtain a reference to an existing sharable QP.
 * @xrcd: XRC domain
3692 * @qp_open_attr: Attributes identifying the QP to open.
3693 *
3694 * Returns a reference to a sharable QP.
3695 */
3696struct ib_qp *ib_open_qp(struct ib_xrcd *xrcd,
3697 struct ib_qp_open_attr *qp_open_attr);
3698
3699/**
3700 * ib_close_qp - Release an external reference to a QP.
Sean Heftyd3d72d92011-05-26 23:06:44 -07003701 * @qp: The QP handle to release
3702 *
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07003703 * The opened QP handle is released by the caller. The underlying
3704 * shared QP is not destroyed until all internal references are released.
Sean Heftyd3d72d92011-05-26 23:06:44 -07003705 */
Sean Hefty0e0ec7e2011-08-08 15:31:51 -07003706int ib_close_qp(struct ib_qp *qp);
Sean Heftyd3d72d92011-05-26 23:06:44 -07003707
3708/**
Linus Torvalds1da177e2005-04-16 15:20:36 -07003709 * ib_post_send - Posts a list of work requests to the send queue of
3710 * the specified QP.
3711 * @qp: The QP to post the work request on.
3712 * @send_wr: A list of work requests to post on the send queue.
3713 * @bad_send_wr: On an immediate failure, this parameter will reference
3714 * the work request that failed to be posted on the QP.
Bart Van Assche55464d42009-12-09 14:20:04 -08003715 *
3716 * While IBA Vol. 1 section 11.4.1.1 specifies that if an immediate
3717 * error is returned, the QP state shall not be affected,
3718 * ib_post_send() will return an immediate error after queueing any
3719 * earlier work requests in the list.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003720 */
3721static inline int ib_post_send(struct ib_qp *qp,
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003722 const struct ib_send_wr *send_wr,
3723 const struct ib_send_wr **bad_send_wr)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003724{
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003725 const struct ib_send_wr *dummy;
Bart Van Asschebb039a82018-07-18 09:25:16 -07003726
Kamal Heib3023a1e2018-12-10 21:09:48 +02003727 return qp->device->ops.post_send(qp, send_wr, bad_send_wr ? : &dummy);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003728}
3729
3730/**
3731 * ib_post_recv - Posts a list of work requests to the receive queue of
3732 * the specified QP.
3733 * @qp: The QP to post the work request on.
3734 * @recv_wr: A list of work requests to post on the receive queue.
3735 * @bad_recv_wr: On an immediate failure, this parameter will reference
3736 * the work request that failed to be posted on the QP.
3737 */
3738static inline int ib_post_recv(struct ib_qp *qp,
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003739 const struct ib_recv_wr *recv_wr,
3740 const struct ib_recv_wr **bad_recv_wr)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003741{
Bart Van Assched34ac5c2018-07-18 09:25:32 -07003742 const struct ib_recv_wr *dummy;
Bart Van Asschebb039a82018-07-18 09:25:16 -07003743
Kamal Heib3023a1e2018-12-10 21:09:48 +02003744 return qp->device->ops.post_recv(qp, recv_wr, bad_recv_wr ? : &dummy);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003745}
3746
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003747struct ib_cq *__ib_alloc_cq_user(struct ib_device *dev, void *private,
3748 int nr_cqe, int comp_vector,
3749 enum ib_poll_context poll_ctx,
3750 const char *caller, struct ib_udata *udata);
Leon Romanovskyf66c8ba2018-01-28 11:17:19 +02003751
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003752/**
3753 * ib_alloc_cq_user: Allocate kernel/user CQ
3754 * @dev: The IB device
3755 * @private: Private data attached to the CQE
3756 * @nr_cqe: Number of CQEs in the CQ
3757 * @comp_vector: Completion vector used for the IRQs
3758 * @poll_ctx: Context used for polling the CQ
3759 * @udata: Valid user data or NULL for kernel objects
3760 */
3761static inline struct ib_cq *ib_alloc_cq_user(struct ib_device *dev,
3762 void *private, int nr_cqe,
3763 int comp_vector,
3764 enum ib_poll_context poll_ctx,
3765 struct ib_udata *udata)
3766{
3767 return __ib_alloc_cq_user(dev, private, nr_cqe, comp_vector, poll_ctx,
3768 KBUILD_MODNAME, udata);
3769}
3770
3771/**
3772 * ib_alloc_cq: Allocate kernel CQ
3773 * @dev: The IB device
3774 * @private: Private data attached to the CQE
3775 * @nr_cqe: Number of CQEs in the CQ
3776 * @comp_vector: Completion vector used for the IRQs
3777 * @poll_ctx: Context used for polling the CQ
3778 *
3779 * NOTE: for user cq use ib_alloc_cq_user with valid udata!
3780 */
3781static inline struct ib_cq *ib_alloc_cq(struct ib_device *dev, void *private,
3782 int nr_cqe, int comp_vector,
3783 enum ib_poll_context poll_ctx)
3784{
3785 return ib_alloc_cq_user(dev, private, nr_cqe, comp_vector, poll_ctx,
3786 NULL);
3787}
3788
3789/**
3790 * ib_free_cq_user - Free kernel/user CQ
3791 * @cq: The CQ to free
3792 * @udata: Valid user data or NULL for kernel objects
3793 */
3794void ib_free_cq_user(struct ib_cq *cq, struct ib_udata *udata);
3795
/**
 * ib_free_cq - Free kernel CQ
 * @cq: The CQ to free
 *
 * Forwards to ib_free_cq_user() with a NULL udata.
 *
 * NOTE: for user cq use ib_free_cq_user with valid udata!
 */
static inline void ib_free_cq(struct ib_cq *cq)
{
	struct ib_udata *no_udata = NULL;

	ib_free_cq_user(cq, no_udata);
}
3806
Christoph Hellwig14d3a3b2015-12-11 11:53:03 -08003807int ib_process_cq_direct(struct ib_cq *cq, int budget);
3808
Linus Torvalds1da177e2005-04-16 15:20:36 -07003809/**
3810 * ib_create_cq - Creates a CQ on the specified device.
3811 * @device: The device on which to create the CQ.
3812 * @comp_handler: A user-specified callback that is invoked when a
3813 * completion event occurs on the CQ.
3814 * @event_handler: A user-specified callback that is invoked when an
3815 * asynchronous event not associated with a completion occurs on the CQ.
3816 * @cq_context: Context associated with the CQ returned to the user via
3817 * the associated completion and event handlers.
Matan Barak8e372102015-06-11 16:35:21 +03003818 * @cq_attr: The attributes the CQ should be created upon.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003819 *
3820 * Users can examine the cq structure to determine the actual CQ size.
3821 */
Bharat Potnuri7350cdd2018-06-15 20:52:33 +05303822struct ib_cq *__ib_create_cq(struct ib_device *device,
3823 ib_comp_handler comp_handler,
3824 void (*event_handler)(struct ib_event *, void *),
3825 void *cq_context,
3826 const struct ib_cq_init_attr *cq_attr,
3827 const char *caller);
/* Convenience wrapper: calls __ib_create_cq() with KBUILD_MODNAME as caller. */
#define ib_create_cq(device, comp_handler, event_handler, cq_context, cq_attr) \
	__ib_create_cq((device), (comp_handler), (event_handler),              \
		       (cq_context), (cq_attr), KBUILD_MODNAME)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003830
3831/**
3832 * ib_resize_cq - Modifies the capacity of the CQ.
3833 * @cq: The CQ to resize.
3834 * @cqe: The minimum size of the CQ.
3835 *
3836 * Users can examine the cq structure to determine the actual CQ size.
3837 */
3838int ib_resize_cq(struct ib_cq *cq, int cqe);
3839
3840/**
Leon Romanovsky4190b4e2017-11-13 10:51:19 +02003841 * rdma_set_cq_moderation - Modifies moderation params of the CQ
Eli Cohen2dd57162008-04-16 21:09:33 -07003842 * @cq: The CQ to modify.
3843 * @cq_count: number of CQEs that will trigger an event
3844 * @cq_period: max period of time in usec before triggering an event
3845 *
3846 */
Leon Romanovsky4190b4e2017-11-13 10:51:19 +02003847int rdma_set_cq_moderation(struct ib_cq *cq, u16 cq_count, u16 cq_period);
Eli Cohen2dd57162008-04-16 21:09:33 -07003848
3849/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003850 * ib_destroy_cq_user - Destroys the specified CQ.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003851 * @cq: The CQ to destroy.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003852 * @udata: Valid user data or NULL for kernel objects
Linus Torvalds1da177e2005-04-16 15:20:36 -07003853 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03003854int ib_destroy_cq_user(struct ib_cq *cq, struct ib_udata *udata);
3855
/**
 * ib_destroy_cq - Destroys the specified kernel CQ.
 * @cq: The CQ to destroy.
 *
 * Forwards to ib_destroy_cq_user() with a NULL udata. The value returned
 * by ib_destroy_cq_user() is not propagated to the caller.
 *
 * NOTE: for user cq use ib_destroy_cq_user with valid udata!
 */
static inline void ib_destroy_cq(struct ib_cq *cq)
{
	(void)ib_destroy_cq_user(cq, NULL);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07003866
3867/**
3868 * ib_poll_cq - poll a CQ for completion(s)
3869 * @cq:the CQ being polled
3870 * @num_entries:maximum number of completions to return
3871 * @wc:array of at least @num_entries &struct ib_wc where completions
3872 * will be returned
3873 *
3874 * Poll a CQ for (possibly multiple) completions. If the return value
3875 * is < 0, an error occurred. If the return value is >= 0, it is the
3876 * number of completions returned. If the return value is
3877 * non-negative and < num_entries, then the CQ was emptied.
3878 */
3879static inline int ib_poll_cq(struct ib_cq *cq, int num_entries,
3880 struct ib_wc *wc)
3881{
Kamal Heib3023a1e2018-12-10 21:09:48 +02003882 return cq->device->ops.poll_cq(cq, num_entries, wc);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003883}
3884
3885/**
Linus Torvalds1da177e2005-04-16 15:20:36 -07003886 * ib_req_notify_cq - Request completion notification on a CQ.
3887 * @cq: The CQ to generate an event for.
Roland Dreiered23a722007-05-06 21:02:48 -07003888 * @flags:
3889 * Must contain exactly one of %IB_CQ_SOLICITED or %IB_CQ_NEXT_COMP
3890 * to request an event on the next solicited event or next work
3891 * completion at any type, respectively. %IB_CQ_REPORT_MISSED_EVENTS
3892 * may also be |ed in to request a hint about missed events, as
3893 * described below.
3894 *
3895 * Return Value:
3896 * < 0 means an error occurred while requesting notification
3897 * == 0 means notification was requested successfully, and if
3898 * IB_CQ_REPORT_MISSED_EVENTS was passed in, then no events
3899 * were missed and it is safe to wait for another event. In
3900 * this case is it guaranteed that any work completions added
3901 * to the CQ since the last CQ poll will trigger a completion
3902 * notification event.
3903 * > 0 is only returned if IB_CQ_REPORT_MISSED_EVENTS was passed
3904 * in. It means that the consumer must poll the CQ again to
3905 * make sure it is empty to avoid missing an event because of a
3906 * race between requesting notification and an entry being
3907 * added to the CQ. This return value means it is possible
3908 * (but not guaranteed) that a work completion has been added
3909 * to the CQ since the last poll without triggering a
3910 * completion notification event.
Linus Torvalds1da177e2005-04-16 15:20:36 -07003911 */
3912static inline int ib_req_notify_cq(struct ib_cq *cq,
Roland Dreiered23a722007-05-06 21:02:48 -07003913 enum ib_cq_notify_flags flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003914{
Kamal Heib3023a1e2018-12-10 21:09:48 +02003915 return cq->device->ops.req_notify_cq(cq, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003916}
3917
3918/**
3919 * ib_req_ncomp_notif - Request completion notification when there are
3920 * at least the specified number of unreaped completions on the CQ.
3921 * @cq: The CQ to generate an event for.
3922 * @wc_cnt: The number of unreaped completions that should be on the
3923 * CQ before an event is generated.
3924 */
3925static inline int ib_req_ncomp_notif(struct ib_cq *cq, int wc_cnt)
3926{
Kamal Heib3023a1e2018-12-10 21:09:48 +02003927 return cq->device->ops.req_ncomp_notif ?
3928 cq->device->ops.req_ncomp_notif(cq, wc_cnt) :
Linus Torvalds1da177e2005-04-16 15:20:36 -07003929 -ENOSYS;
3930}
3931
3932/**
Ralph Campbell9b513092006-12-12 14:27:41 -08003933 * ib_dma_mapping_error - check a DMA addr for error
3934 * @dev: The device for which the dma_addr was created
3935 * @dma_addr: The DMA address to check
3936 */
3937static inline int ib_dma_mapping_error(struct ib_device *dev, u64 dma_addr)
3938{
Bart Van Assche0957c292017-03-07 22:56:53 +00003939 return dma_mapping_error(dev->dma_device, dma_addr);
Ralph Campbell9b513092006-12-12 14:27:41 -08003940}
3941
3942/**
3943 * ib_dma_map_single - Map a kernel virtual address to DMA address
3944 * @dev: The device for which the dma_addr is to be created
3945 * @cpu_addr: The kernel virtual address
3946 * @size: The size of the region in bytes
3947 * @direction: The direction of the DMA
3948 */
3949static inline u64 ib_dma_map_single(struct ib_device *dev,
3950 void *cpu_addr, size_t size,
3951 enum dma_data_direction direction)
3952{
Bart Van Assche0957c292017-03-07 22:56:53 +00003953 return dma_map_single(dev->dma_device, cpu_addr, size, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08003954}
3955
3956/**
3957 * ib_dma_unmap_single - Destroy a mapping created by ib_dma_map_single()
3958 * @dev: The device for which the DMA address was created
3959 * @addr: The DMA address
3960 * @size: The size of the region in bytes
3961 * @direction: The direction of the DMA
3962 */
3963static inline void ib_dma_unmap_single(struct ib_device *dev,
3964 u64 addr, size_t size,
3965 enum dma_data_direction direction)
3966{
Bart Van Assche0957c292017-03-07 22:56:53 +00003967 dma_unmap_single(dev->dma_device, addr, size, direction);
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07003968}
3969
Ralph Campbell9b513092006-12-12 14:27:41 -08003970/**
3971 * ib_dma_map_page - Map a physical page to DMA address
3972 * @dev: The device for which the dma_addr is to be created
3973 * @page: The page to be mapped
3974 * @offset: The offset within the page
3975 * @size: The size of the region in bytes
3976 * @direction: The direction of the DMA
3977 */
3978static inline u64 ib_dma_map_page(struct ib_device *dev,
3979 struct page *page,
3980 unsigned long offset,
3981 size_t size,
3982 enum dma_data_direction direction)
3983{
Bart Van Assche0957c292017-03-07 22:56:53 +00003984 return dma_map_page(dev->dma_device, page, offset, size, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08003985}
3986
3987/**
3988 * ib_dma_unmap_page - Destroy a mapping created by ib_dma_map_page()
3989 * @dev: The device for which the DMA address was created
3990 * @addr: The DMA address
3991 * @size: The size of the region in bytes
3992 * @direction: The direction of the DMA
3993 */
3994static inline void ib_dma_unmap_page(struct ib_device *dev,
3995 u64 addr, size_t size,
3996 enum dma_data_direction direction)
3997{
Bart Van Assche0957c292017-03-07 22:56:53 +00003998 dma_unmap_page(dev->dma_device, addr, size, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08003999}
4000
4001/**
4002 * ib_dma_map_sg - Map a scatter/gather list to DMA addresses
4003 * @dev: The device for which the DMA addresses are to be created
4004 * @sg: The array of scatter/gather entries
4005 * @nents: The number of scatter/gather entries
4006 * @direction: The direction of the DMA
4007 */
4008static inline int ib_dma_map_sg(struct ib_device *dev,
4009 struct scatterlist *sg, int nents,
4010 enum dma_data_direction direction)
4011{
Bart Van Assche0957c292017-03-07 22:56:53 +00004012 return dma_map_sg(dev->dma_device, sg, nents, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08004013}
4014
4015/**
4016 * ib_dma_unmap_sg - Unmap a scatter/gather list of DMA addresses
4017 * @dev: The device for which the DMA addresses were created
4018 * @sg: The array of scatter/gather entries
4019 * @nents: The number of scatter/gather entries
4020 * @direction: The direction of the DMA
4021 */
4022static inline void ib_dma_unmap_sg(struct ib_device *dev,
4023 struct scatterlist *sg, int nents,
4024 enum dma_data_direction direction)
4025{
Bart Van Assche0957c292017-03-07 22:56:53 +00004026 dma_unmap_sg(dev->dma_device, sg, nents, direction);
Ralph Campbell9b513092006-12-12 14:27:41 -08004027}
4028
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004029static inline int ib_dma_map_sg_attrs(struct ib_device *dev,
4030 struct scatterlist *sg, int nents,
4031 enum dma_data_direction direction,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07004032 unsigned long dma_attrs)
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004033{
Bart Van Assche0957c292017-03-07 22:56:53 +00004034 return dma_map_sg_attrs(dev->dma_device, sg, nents, direction,
4035 dma_attrs);
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004036}
4037
4038static inline void ib_dma_unmap_sg_attrs(struct ib_device *dev,
4039 struct scatterlist *sg, int nents,
4040 enum dma_data_direction direction,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07004041 unsigned long dma_attrs)
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004042{
Bart Van Assche0957c292017-03-07 22:56:53 +00004043 dma_unmap_sg_attrs(dev->dma_device, sg, nents, direction, dma_attrs);
Arthur Kepnercb9fbc52008-04-29 01:00:34 -07004044}
Ralph Campbell9b513092006-12-12 14:27:41 -08004045
4046/**
Bart Van Assche0b5cb332019-01-22 10:25:20 -08004047 * ib_dma_max_seg_size - Return the size limit of a single DMA transfer
4048 * @dev: The device to query
4049 *
4050 * The returned value represents a size in bytes.
4051 */
4052static inline unsigned int ib_dma_max_seg_size(struct ib_device *dev)
4053{
4054 struct device_dma_parameters *p = dev->dma_device->dma_parms;
4055
4056 return p ? p->max_segment_size : UINT_MAX;
4057}
4058
4059/**
Ralph Campbell9b513092006-12-12 14:27:41 -08004060 * ib_dma_sync_single_for_cpu - Prepare DMA region to be accessed by CPU
4061 * @dev: The device for which the DMA address was created
4062 * @addr: The DMA address
4063 * @size: The size of the region in bytes
4064 * @dir: The direction of the DMA
4065 */
4066static inline void ib_dma_sync_single_for_cpu(struct ib_device *dev,
4067 u64 addr,
4068 size_t size,
4069 enum dma_data_direction dir)
4070{
Bart Van Assche0957c292017-03-07 22:56:53 +00004071 dma_sync_single_for_cpu(dev->dma_device, addr, size, dir);
Ralph Campbell9b513092006-12-12 14:27:41 -08004072}
4073
4074/**
4075 * ib_dma_sync_single_for_device - Prepare DMA region to be accessed by device
4076 * @dev: The device for which the DMA address was created
4077 * @addr: The DMA address
4078 * @size: The size of the region in bytes
4079 * @dir: The direction of the DMA
4080 */
4081static inline void ib_dma_sync_single_for_device(struct ib_device *dev,
4082 u64 addr,
4083 size_t size,
4084 enum dma_data_direction dir)
4085{
Bart Van Assche0957c292017-03-07 22:56:53 +00004086 dma_sync_single_for_device(dev->dma_device, addr, size, dir);
Ralph Campbell9b513092006-12-12 14:27:41 -08004087}
4088
4089/**
4090 * ib_dma_alloc_coherent - Allocate memory and map it for DMA
4091 * @dev: The device for which the DMA address is requested
4092 * @size: The size of the region to allocate in bytes
4093 * @dma_handle: A pointer for returning the DMA address of the region
4094 * @flag: memory allocator flags
4095 */
4096static inline void *ib_dma_alloc_coherent(struct ib_device *dev,
4097 size_t size,
Bart Van Assched43dbac2017-01-20 13:04:10 -08004098 dma_addr_t *dma_handle,
Ralph Campbell9b513092006-12-12 14:27:41 -08004099 gfp_t flag)
4100{
Bart Van Assche0957c292017-03-07 22:56:53 +00004101 return dma_alloc_coherent(dev->dma_device, size, dma_handle, flag);
Ralph Campbell9b513092006-12-12 14:27:41 -08004102}
4103
4104/**
4105 * ib_dma_free_coherent - Free memory allocated by ib_dma_alloc_coherent()
4106 * @dev: The device for which the DMA addresses were allocated
4107 * @size: The size of the region
4108 * @cpu_addr: the address returned by ib_dma_alloc_coherent()
4109 * @dma_handle: the DMA address returned by ib_dma_alloc_coherent()
4110 */
4111static inline void ib_dma_free_coherent(struct ib_device *dev,
4112 size_t size, void *cpu_addr,
Bart Van Assched43dbac2017-01-20 13:04:10 -08004113 dma_addr_t dma_handle)
Ralph Campbell9b513092006-12-12 14:27:41 -08004114{
Bart Van Assche0957c292017-03-07 22:56:53 +00004115 dma_free_coherent(dev->dma_device, size, cpu_addr, dma_handle);
Ralph Campbell9b513092006-12-12 14:27:41 -08004116}
4117
4118/**
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004119 * ib_dereg_mr_user - Deregisters a memory region and removes it from the
4120 * HCA translation table.
4121 * @mr: The memory region to deregister.
4122 * @udata: Valid user data or NULL for kernel object
4123 *
4124 * This function can fail, if the memory region has memory windows bound to it.
4125 */
4126int ib_dereg_mr_user(struct ib_mr *mr, struct ib_udata *udata);
4127
/**
 * ib_dereg_mr - Deregisters a kernel memory region and removes it from the
 *   HCA translation table.
 * @mr: The memory region to deregister.
 *
 * This function can fail, if the memory region has memory windows bound to it.
 * It forwards to ib_dereg_mr_user() with a NULL udata and returns its result.
 *
 * NOTE: for user mr use ib_dereg_mr_user with valid udata!
 */
static inline int ib_dereg_mr(struct ib_mr *mr)
{
	struct ib_udata *no_udata = NULL;

	return ib_dereg_mr_user(mr, no_udata);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -07004141
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004142struct ib_mr *ib_alloc_mr_user(struct ib_pd *pd, enum ib_mr_type mr_type,
4143 u32 max_num_sg, struct ib_udata *udata);
4144
4145static inline struct ib_mr *ib_alloc_mr(struct ib_pd *pd,
4146 enum ib_mr_type mr_type, u32 max_num_sg)
4147{
4148 return ib_alloc_mr_user(pd, mr_type, max_num_sg, NULL);
4149}
Steve Wise00f7ec32008-07-14 23:48:45 -07004150
4151/**
Steve Wise00f7ec32008-07-14 23:48:45 -07004152 * ib_update_fast_reg_key - updates the key portion of the fast_reg MR
4153 * R_Key and L_Key.
4154 * @mr - struct ib_mr pointer to be updated.
4155 * @newkey - new key to be used.
4156 */
4157static inline void ib_update_fast_reg_key(struct ib_mr *mr, u8 newkey)
4158{
4159 mr->lkey = (mr->lkey & 0xffffff00) | newkey;
4160 mr->rkey = (mr->rkey & 0xffffff00) | newkey;
4161}
4162
4163/**
Shani Michaeli7083e422013-02-06 16:19:12 +00004164 * ib_inc_rkey - increments the key portion of the given rkey. Can be used
4165 * for calculating a new rkey for type 2 memory windows.
4166 * @rkey - the rkey to increment.
4167 */
4168static inline u32 ib_inc_rkey(u32 rkey)
4169{
4170 const u32 mask = 0x000000ff;
4171 return ((rkey + 1) & mask) | (rkey & ~mask);
4172}
4173
4174/**
 * ib_alloc_fmr - Allocates an unmapped fast memory region.
4176 * @pd: The protection domain associated with the unmapped region.
4177 * @mr_access_flags: Specifies the memory access rights.
4178 * @fmr_attr: Attributes of the unmapped region.
4179 *
4180 * A fast memory region must be mapped before it can be used as part of
4181 * a work request.
4182 */
4183struct ib_fmr *ib_alloc_fmr(struct ib_pd *pd,
4184 int mr_access_flags,
4185 struct ib_fmr_attr *fmr_attr);
4186
4187/**
4188 * ib_map_phys_fmr - Maps a list of physical pages to a fast memory region.
4189 * @fmr: The fast memory region to associate with the pages.
4190 * @page_list: An array of physical pages to map to the fast memory region.
4191 * @list_len: The number of pages in page_list.
4192 * @iova: The I/O virtual address to use with the mapped region.
4193 */
4194static inline int ib_map_phys_fmr(struct ib_fmr *fmr,
4195 u64 *page_list, int list_len,
4196 u64 iova)
4197{
Kamal Heib3023a1e2018-12-10 21:09:48 +02004198 return fmr->device->ops.map_phys_fmr(fmr, page_list, list_len, iova);
Linus Torvalds1da177e2005-04-16 15:20:36 -07004199}
4200
4201/**
4202 * ib_unmap_fmr - Removes the mapping from a list of fast memory regions.
4203 * @fmr_list: A linked list of fast memory regions to unmap.
4204 */
4205int ib_unmap_fmr(struct list_head *fmr_list);
4206
4207/**
4208 * ib_dealloc_fmr - Deallocates a fast memory region.
4209 * @fmr: The fast memory region to deallocate.
4210 */
4211int ib_dealloc_fmr(struct ib_fmr *fmr);
4212
4213/**
4214 * ib_attach_mcast - Attaches the specified QP to a multicast group.
4215 * @qp: QP to attach to the multicast group. The QP must be type
4216 * IB_QPT_UD.
4217 * @gid: Multicast group GID.
4218 * @lid: Multicast group LID in host byte order.
4219 *
4220 * In order to send and receive multicast packets, subnet
4221 * administration must have created the multicast group and configured
4222 * the fabric appropriately. The port associated with the specified
4223 * QP must also be a member of the multicast group.
4224 */
4225int ib_attach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);
4226
4227/**
4228 * ib_detach_mcast - Detaches the specified QP from a multicast group.
4229 * @qp: QP to detach from the multicast group.
4230 * @gid: Multicast group GID.
4231 * @lid: Multicast group LID in host byte order.
4232 */
4233int ib_detach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);
4234
Sean Hefty59991f92011-05-23 17:52:46 -07004235/**
4236 * ib_alloc_xrcd - Allocates an XRC domain.
4237 * @device: The device on which to allocate the XRC domain.
Leon Romanovskyf66c8ba2018-01-28 11:17:19 +02004238 * @caller: Module name for kernel consumers
Sean Hefty59991f92011-05-23 17:52:46 -07004239 */
Leon Romanovskyf66c8ba2018-01-28 11:17:19 +02004240struct ib_xrcd *__ib_alloc_xrcd(struct ib_device *device, const char *caller);
/* Convenience wrapper: calls __ib_alloc_xrcd() with KBUILD_MODNAME as caller. */
#define ib_alloc_xrcd(device) __ib_alloc_xrcd((device), KBUILD_MODNAME)
Sean Hefty59991f92011-05-23 17:52:46 -07004243
4244/**
4245 * ib_dealloc_xrcd - Deallocates an XRC domain.
4246 * @xrcd: The XRC domain to deallocate.
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004247 * @udata: Valid user data or NULL for kernel object
Sean Hefty59991f92011-05-23 17:52:46 -07004248 */
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004249int ib_dealloc_xrcd(struct ib_xrcd *xrcd, struct ib_udata *udata);
Sean Hefty59991f92011-05-23 17:52:46 -07004250
Eli Cohen1c636f82013-10-31 15:26:32 +02004251static inline int ib_check_mr_access(int flags)
4252{
4253 /*
4254 * Local write permission is required if remote write or
4255 * remote atomic permission is also requested.
4256 */
4257 if (flags & (IB_ACCESS_REMOTE_ATOMIC | IB_ACCESS_REMOTE_WRITE) &&
4258 !(flags & IB_ACCESS_LOCAL_WRITE))
4259 return -EINVAL;
4260
4261 return 0;
4262}
4263
Jack Morgenstein08bb5582018-05-23 15:30:30 +03004264static inline bool ib_access_writable(int access_flags)
4265{
4266 /*
4267 * We have writable memory backing the MR if any of the following
4268 * access flags are set. "Local write" and "remote write" obviously
4269 * require write access. "Remote atomic" can do things like fetch and
4270 * add, which will modify memory, and "MW bind" can change permissions
4271 * by binding a window.
4272 */
4273 return access_flags &
4274 (IB_ACCESS_LOCAL_WRITE | IB_ACCESS_REMOTE_WRITE |
4275 IB_ACCESS_REMOTE_ATOMIC | IB_ACCESS_MW_BIND);
4276}
4277
Sagi Grimberg1b01d332014-02-23 14:19:05 +02004278/**
4279 * ib_check_mr_status: lightweight check of MR status.
4280 * This routine may provide status checks on a selected
4281 * ib_mr. first use is for signature status check.
4282 *
4283 * @mr: A memory region.
4284 * @check_mask: Bitmask of which checks to perform from
4285 * ib_mr_status_check enumeration.
4286 * @mr_status: The container of relevant status checks.
4287 * failed checks will be indicated in the status bitmask
4288 * and the relevant info shall be in the error item.
4289 */
4290int ib_check_mr_status(struct ib_mr *mr, u32 check_mask,
4291 struct ib_mr_status *mr_status);
4292
Jason Gunthorped79af722019-01-10 14:02:24 -07004293/**
4294 * ib_device_try_get: Hold a registration lock
4295 * device: The device to lock
4296 *
4297 * A device under an active registration lock cannot become unregistered. It
4298 * is only possible to obtain a registration lock on a device that is fully
4299 * registered, otherwise this function returns false.
4300 *
4301 * The registration lock is only necessary for actions which require the
4302 * device to still be registered. Uses that only require the device pointer to
4303 * be valid should use get_device(&ibdev->dev) to hold the memory.
4304 *
4305 */
4306static inline bool ib_device_try_get(struct ib_device *dev)
4307{
4308 return refcount_inc_not_zero(&dev->refcount);
4309}
4310
4311void ib_device_put(struct ib_device *device);
Jason Gunthorpe324e2272019-02-12 21:12:51 -07004312struct ib_device *ib_device_get_by_netdev(struct net_device *ndev,
4313 enum rdma_driver_id driver_id);
4314struct ib_device *ib_device_get_by_name(const char *name,
4315 enum rdma_driver_id driver_id);
Yotam Kenneth9268f722015-07-30 17:50:15 +03004316struct net_device *ib_get_net_dev_by_params(struct ib_device *dev, u8 port,
4317 u16 pkey, const union ib_gid *gid,
4318 const struct sockaddr *addr);
Jason Gunthorpec2261dd2019-02-12 21:12:50 -07004319int ib_device_set_netdev(struct ib_device *ib_dev, struct net_device *ndev,
4320 unsigned int port);
4321struct net_device *ib_device_netdev(struct ib_device *dev, u8 port);
4322
Yishai Hadas5fd251c2016-05-23 15:20:48 +03004323struct ib_wq *ib_create_wq(struct ib_pd *pd,
4324 struct ib_wq_init_attr *init_attr);
Shamir Rabinovitchc4367a22019-03-31 19:10:05 +03004325int ib_destroy_wq(struct ib_wq *wq, struct ib_udata *udata);
Yishai Hadas5fd251c2016-05-23 15:20:48 +03004326int ib_modify_wq(struct ib_wq *wq, struct ib_wq_attr *attr,
4327 u32 wq_attr_mask);
Yishai Hadas6d397862016-05-23 15:20:51 +03004328struct ib_rwq_ind_table *ib_create_rwq_ind_table(struct ib_device *device,
4329 struct ib_rwq_ind_table_init_attr*
4330 wq_ind_table_init_attr);
4331int ib_destroy_rwq_ind_table(struct ib_rwq_ind_table *wq_ind_table);
Yotam Kenneth9268f722015-07-30 17:50:15 +03004332
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004333int ib_map_mr_sg(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
Bart Van Assche9aa8b322016-05-12 10:49:15 -07004334 unsigned int *sg_offset, unsigned int page_size);
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004335
4336static inline int
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004337ib_map_mr_sg_zbva(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
Bart Van Assche9aa8b322016-05-12 10:49:15 -07004338 unsigned int *sg_offset, unsigned int page_size)
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004339{
4340 int n;
4341
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004342 n = ib_map_mr_sg(mr, sg, sg_nents, sg_offset, page_size);
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004343 mr->iova = 0;
4344
4345 return n;
4346}
4347
Christoph Hellwigff2ba992016-05-03 18:01:04 +02004348int ib_sg_to_pages(struct ib_mr *mr, struct scatterlist *sgl, int sg_nents,
Bart Van Assche9aa8b322016-05-12 10:49:15 -07004349 unsigned int *sg_offset, int (*set_page)(struct ib_mr *, u64));
Sagi Grimberg4c67e2b2015-10-13 19:11:24 +03004350
Steve Wise765d6772016-02-17 08:15:41 -08004351void ib_drain_rq(struct ib_qp *qp);
4352void ib_drain_sq(struct ib_qp *qp);
4353void ib_drain_qp(struct ib_qp *qp);
Moni Shoua850d8fd2016-11-10 11:30:56 +02004354
Yuval Shaiad4186192017-06-14 23:13:34 +03004355int ib_get_eth_speed(struct ib_device *dev, u8 port_num, u8 *speed, u8 *width);
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004356
4357static inline u8 *rdma_ah_retrieve_dmac(struct rdma_ah_attr *attr)
4358{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004359 if (attr->type == RDMA_AH_ATTR_TYPE_ROCE)
4360 return attr->roce.dmac;
4361 return NULL;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004362}
4363
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004364static inline void rdma_ah_set_dlid(struct rdma_ah_attr *attr, u32 dlid)
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004365{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004366 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004367 attr->ib.dlid = (u16)dlid;
4368 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4369 attr->opa.dlid = dlid;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004370}
4371
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004372static inline u32 rdma_ah_get_dlid(const struct rdma_ah_attr *attr)
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004373{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004374 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
4375 return attr->ib.dlid;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004376 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4377 return attr->opa.dlid;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004378 return 0;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004379}
4380
4381static inline void rdma_ah_set_sl(struct rdma_ah_attr *attr, u8 sl)
4382{
4383 attr->sl = sl;
4384}
4385
4386static inline u8 rdma_ah_get_sl(const struct rdma_ah_attr *attr)
4387{
4388 return attr->sl;
4389}
4390
4391static inline void rdma_ah_set_path_bits(struct rdma_ah_attr *attr,
4392 u8 src_path_bits)
4393{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004394 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
4395 attr->ib.src_path_bits = src_path_bits;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004396 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4397 attr->opa.src_path_bits = src_path_bits;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004398}
4399
4400static inline u8 rdma_ah_get_path_bits(const struct rdma_ah_attr *attr)
4401{
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004402 if (attr->type == RDMA_AH_ATTR_TYPE_IB)
4403 return attr->ib.src_path_bits;
Dasaratharaman Chandramouli64b46462017-04-29 14:41:30 -04004404 else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4405 return attr->opa.src_path_bits;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004406 return 0;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004407}
4408
Don Hiattd98bb7f2017-08-04 13:54:16 -07004409static inline void rdma_ah_set_make_grd(struct rdma_ah_attr *attr,
4410 bool make_grd)
4411{
4412 if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4413 attr->opa.make_grd = make_grd;
4414}
4415
4416static inline bool rdma_ah_get_make_grd(const struct rdma_ah_attr *attr)
4417{
4418 if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
4419 return attr->opa.make_grd;
4420 return false;
4421}
4422
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004423static inline void rdma_ah_set_port_num(struct rdma_ah_attr *attr, u8 port_num)
4424{
4425 attr->port_num = port_num;
4426}
4427
4428static inline u8 rdma_ah_get_port_num(const struct rdma_ah_attr *attr)
4429{
4430 return attr->port_num;
4431}
4432
4433static inline void rdma_ah_set_static_rate(struct rdma_ah_attr *attr,
4434 u8 static_rate)
4435{
4436 attr->static_rate = static_rate;
4437}
4438
4439static inline u8 rdma_ah_get_static_rate(const struct rdma_ah_attr *attr)
4440{
4441 return attr->static_rate;
4442}
4443
4444static inline void rdma_ah_set_ah_flags(struct rdma_ah_attr *attr,
4445 enum ib_ah_flags flag)
4446{
4447 attr->ah_flags = flag;
4448}
4449
4450static inline enum ib_ah_flags
4451 rdma_ah_get_ah_flags(const struct rdma_ah_attr *attr)
4452{
4453 return attr->ah_flags;
4454}
4455
4456static inline const struct ib_global_route
4457 *rdma_ah_read_grh(const struct rdma_ah_attr *attr)
4458{
4459 return &attr->grh;
4460}
4461
4462/*To retrieve and modify the grh */
4463static inline struct ib_global_route
4464 *rdma_ah_retrieve_grh(struct rdma_ah_attr *attr)
4465{
4466 return &attr->grh;
4467}
4468
4469static inline void rdma_ah_set_dgid_raw(struct rdma_ah_attr *attr, void *dgid)
4470{
4471 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4472
4473 memcpy(grh->dgid.raw, dgid, sizeof(grh->dgid));
4474}
4475
4476static inline void rdma_ah_set_subnet_prefix(struct rdma_ah_attr *attr,
4477 __be64 prefix)
4478{
4479 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4480
4481 grh->dgid.global.subnet_prefix = prefix;
4482}
4483
4484static inline void rdma_ah_set_interface_id(struct rdma_ah_attr *attr,
4485 __be64 if_id)
4486{
4487 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4488
4489 grh->dgid.global.interface_id = if_id;
4490}
4491
4492static inline void rdma_ah_set_grh(struct rdma_ah_attr *attr,
4493 union ib_gid *dgid, u32 flow_label,
4494 u8 sgid_index, u8 hop_limit,
4495 u8 traffic_class)
4496{
4497 struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
4498
4499 attr->ah_flags = IB_AH_GRH;
4500 if (dgid)
4501 grh->dgid = *dgid;
4502 grh->flow_label = flow_label;
4503 grh->sgid_index = sgid_index;
4504 grh->hop_limit = hop_limit;
4505 grh->traffic_class = traffic_class;
Jason Gunthorpe8d9ec9a2018-06-13 10:22:03 +03004506 grh->sgid_attr = NULL;
Dasaratharaman Chandramouli2224c472017-04-29 14:41:27 -04004507}
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004508
/*
 * AH attribute lifetime helpers, implemented out of line.
 * NOTE(review): by their names and the sgid_attr parameter these presumably
 * manage the reference held through grh.sgid_attr when an attribute is
 * destroyed, copied, replaced or moved - confirm against the implementation.
 */
void rdma_destroy_ah_attr(struct rdma_ah_attr *ah_attr);
void rdma_move_grh_sgid_attr(struct rdma_ah_attr *attr, union ib_gid *dgid,
			     u32 flow_label, u8 hop_limit, u8 traffic_class,
			     const struct ib_gid_attr *sgid_attr);
void rdma_copy_ah_attr(struct rdma_ah_attr *dest,
		       const struct rdma_ah_attr *src);
void rdma_replace_ah_attr(struct rdma_ah_attr *old,
			  const struct rdma_ah_attr *new);
void rdma_move_ah_attr(struct rdma_ah_attr *dest, struct rdma_ah_attr *src);
Jason Gunthorpe8d9ec9a2018-06-13 10:22:03 +03004518
Don Hiatt87daac62018-02-01 10:57:03 -08004519/**
4520 * rdma_ah_find_type - Return address handle type.
4521 *
4522 * @dev: Device to be checked
4523 * @port_num: Port number
4524 */
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004525static inline enum rdma_ah_attr_type rdma_ah_find_type(struct ib_device *dev,
Don Hiatt87daac62018-02-01 10:57:03 -08004526 u8 port_num)
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004527{
Parav Pandita6532e72018-01-12 07:58:42 +02004528 if (rdma_protocol_roce(dev, port_num))
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004529 return RDMA_AH_ATTR_TYPE_ROCE;
Don Hiatt87daac62018-02-01 10:57:03 -08004530 if (rdma_protocol_ib(dev, port_num)) {
4531 if (rdma_cap_opa_ah(dev, port_num))
4532 return RDMA_AH_ATTR_TYPE_OPA;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004533 return RDMA_AH_ATTR_TYPE_IB;
Don Hiatt87daac62018-02-01 10:57:03 -08004534 }
4535
4536 return RDMA_AH_ATTR_TYPE_UNDEFINED;
Dasaratharaman Chandramouli44c58482017-04-29 14:41:29 -04004537}
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004538
Hiatt, Don62ede772017-08-14 14:17:43 -04004539/**
4540 * ib_lid_cpu16 - Return lid in 16bit CPU encoding.
4541 * In the current implementation the only way to get
4542 * get the 32bit lid is from other sources for OPA.
4543 * For IB, lids will always be 16bits so cast the
4544 * value accordingly.
4545 *
4546 * @lid: A 32bit LID
4547 */
4548static inline u16 ib_lid_cpu16(u32 lid)
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004549{
Hiatt, Don62ede772017-08-14 14:17:43 -04004550 WARN_ON_ONCE(lid & 0xFFFF0000);
4551 return (u16)lid;
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004552}
4553
Hiatt, Don62ede772017-08-14 14:17:43 -04004554/**
4555 * ib_lid_be16 - Return lid in 16bit BE encoding.
4556 *
4557 * @lid: A 32bit LID
4558 */
4559static inline __be16 ib_lid_be16(u32 lid)
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004560{
Hiatt, Don62ede772017-08-14 14:17:43 -04004561 WARN_ON_ONCE(lid & 0xFFFF0000);
4562 return cpu_to_be16((u16)lid);
Hiatt, Don7db20ec2017-06-08 13:37:49 -04004563}
Doug Ledford32043832017-08-10 14:31:29 -04004564
Sagi Grimbergc66cd352017-07-13 11:09:41 +03004565/**
4566 * ib_get_vector_affinity - Get the affinity mappings of a given completion
4567 * vector
4568 * @device: the rdma device
4569 * @comp_vector: index of completion vector
4570 *
4571 * Returns NULL on failure, otherwise a corresponding cpu map of the
4572 * completion vector (returns all-cpus map if the device driver doesn't
4573 * implement get_vector_affinity).
4574 */
4575static inline const struct cpumask *
4576ib_get_vector_affinity(struct ib_device *device, int comp_vector)
4577{
4578 if (comp_vector < 0 || comp_vector >= device->num_comp_vectors ||
Kamal Heib3023a1e2018-12-10 21:09:48 +02004579 !device->ops.get_vector_affinity)
Sagi Grimbergc66cd352017-07-13 11:09:41 +03004580 return NULL;
4581
Kamal Heib3023a1e2018-12-10 21:09:48 +02004582 return device->ops.get_vector_affinity(device, comp_vector);
Sagi Grimbergc66cd352017-07-13 11:09:41 +03004583
4584}
4585
/**
 * rdma_roce_rescan_device - Rescan all of the network devices in the system
 * and add their gids, as needed, to the relevant RoCE devices.
 *
 * @ibdev:         the rdma device
 */
void rdma_roce_rescan_device(struct ib_device *ibdev);
4593
/*
 * Declared here, implemented out of line.
 * NOTE(review): presumably returns the ucontext associated with @ufile -
 * confirm error convention (NULL vs ERR_PTR) against the implementation.
 */
struct ib_ucontext *ib_uverbs_get_ucontext_file(struct ib_uverbs_file *ufile);
Yishai Hadas7dc08dc2018-06-17 12:59:59 +03004595
/*
 * Declared here, implemented out of line.
 * NOTE(review): by its name presumably the default handler for uverbs
 * destroy methods - confirm against the implementation.
 */
int uverbs_destroy_def_handler(struct uverbs_attr_bundle *attrs);
Denis Drozdovf6a8a192018-08-14 14:08:51 +03004597
/*
 * Declared here, implemented out of line. Returns a struct net_device
 * pointer; @setup is a caller supplied callback that receives a net_device.
 * NOTE(review): presumably allocates a netdev of @type for port @port_num
 * of @device - confirm error convention against the implementation.
 */
struct net_device *rdma_alloc_netdev(struct ib_device *device, u8 port_num,
				     enum rdma_netdev_t type, const char *name,
				     unsigned char name_assign_type,
				     void (*setup)(struct net_device *));
Denis Drozdov5d6b0cb2018-08-14 14:22:35 +03004602
/*
 * Declared here, implemented out of line. Takes the same arguments as
 * rdma_alloc_netdev() plus an existing @netdev, and returns an int.
 * NOTE(review): presumably initialises a caller allocated @netdev instead
 * of allocating one - confirm against the implementation.
 */
int rdma_init_netdev(struct ib_device *device, u8 port_num,
		     enum rdma_netdev_t type, const char *name,
		     unsigned char name_assign_type,
		     void (*setup)(struct net_device *),
		     struct net_device *netdev);
4608
Parav Panditd4122f52018-10-11 22:31:53 +03004609/**
4610 * rdma_set_device_sysfs_group - Set device attributes group to have
4611 * driver specific sysfs entries at
4612 * for infiniband class.
4613 *
4614 * @device: device pointer for which attributes to be created
4615 * @group: Pointer to group which should be added when device
4616 * is registered with sysfs.
4617 * rdma_set_device_sysfs_group() allows existing drivers to expose one
4618 * group per device to have sysfs attributes.
4619 *
4620 * NOTE: New drivers should not make use of this API; instead new device
4621 * parameter should be exposed via netlink command. This API and mechanism
4622 * exist only for existing drivers.
4623 */
4624static inline void
4625rdma_set_device_sysfs_group(struct ib_device *dev,
4626 const struct attribute_group *group)
4627{
4628 dev->groups[1] = group;
4629}
4630
Parav Pandit54747232018-12-18 14:15:56 +02004631/**
4632 * rdma_device_to_ibdev - Get ib_device pointer from device pointer
4633 *
4634 * @device: device pointer for which ib_device pointer to retrieve
4635 *
4636 * rdma_device_to_ibdev() retrieves ib_device pointer from device.
4637 *
4638 */
4639static inline struct ib_device *rdma_device_to_ibdev(struct device *device)
4640{
Parav Panditcebe5562019-02-26 13:56:11 +02004641 struct ib_core_device *coredev =
4642 container_of(device, struct ib_core_device, dev);
4643
4644 return coredev->owner;
Parav Pandit54747232018-12-18 14:15:56 +02004645}
4646
/**
 * rdma_device_to_drv_device - Helper macro to reach back to driver's
 *			       ib_device holder structure from device pointer.
 *
 * @dev:		device pointer, handed to rdma_device_to_ibdev()
 * @drv_dev_struct:	type of the driver structure that embeds the ib_device
 * @ibdev_member:	name of the ib_device member inside @drv_dev_struct
 *
 * Expands to a container_of() on the ib_device obtained from @dev, so the
 * result is a pointer to the enclosing @drv_dev_struct.
 *
 * NOTE: New drivers should not make use of this API; This API is only for
 * existing drivers who have exposed sysfs entries using
 * rdma_set_device_sysfs_group().
 */
#define rdma_device_to_drv_device(dev, drv_dev_struct, ibdev_member)           \
	container_of(rdma_device_to_ibdev(dev), drv_dev_struct, ibdev_member)
Parav Pandit41c61402019-02-26 14:01:46 +02004657
/*
 * Declared here, implemented out of line.
 * NOTE(review): by its name presumably reports whether @device may be
 * accessed from network namespace @net - confirm against the implementation.
 */
bool rdma_dev_access_netns(const struct ib_device *device,
			   const struct net *net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07004660#endif /* IB_VERBS_H */