1 /*
2 * Copyright (c) 2004 Mellanox Technologies Ltd. All rights reserved.
3 * Copyright (c) 2004 Infinicon Corporation. All rights reserved.
4 * Copyright (c) 2004 Intel Corporation. All rights reserved.
5 * Copyright (c) 2004 Topspin Corporation. All rights reserved.
6 * Copyright (c) 2004 Voltaire Corporation. All rights reserved.
7 * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
8 * Copyright (c) 2005, 2006, 2007 Cisco Systems. All rights reserved.
9 *
10 * This software is available to you under a choice of one of two
11 * licenses. You may choose to be licensed under the terms of the GNU
12 * General Public License (GPL) Version 2, available from the file
13 * COPYING in the main directory of this source tree, or the
14 * OpenIB.org BSD license below:
15 *
16 * Redistribution and use in source and binary forms, with or
17 * without modification, are permitted provided that the following
18 * conditions are met:
19 *
20 * - Redistributions of source code must retain the above
21 * copyright notice, this list of conditions and the following
22 * disclaimer.
23 *
24 * - Redistributions in binary form must reproduce the above
25 * copyright notice, this list of conditions and the following
26 * disclaimer in the documentation and/or other materials
27 * provided with the distribution.
28 *
29 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
30 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
31 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
32 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
33 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
34 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
35 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
36 * SOFTWARE.
37 */
38
39 #if !defined(IB_VERBS_H)
40 #define IB_VERBS_H
41
42 #include <linux/types.h>
43 #include <linux/device.h>
44 #include <linux/mm.h>
45 #include <linux/dma-mapping.h>
46 #include <linux/kref.h>
47 #include <linux/list.h>
48 #include <linux/rwsem.h>
49 #include <linux/scatterlist.h>
50 #include <linux/workqueue.h>
51
52 #include <asm/uaccess.h>
53 #include <linux/rbtree.h>
54 #include <linux/mutex.h>
55
56 extern struct workqueue_struct *ib_wq;
57
58 union ib_gid {
59 u8 raw[16];
60 struct {
61 __be64 subnet_prefix;
62 __be64 interface_id;
63 } global;
64 };
65
66 enum rdma_node_type {
67 /* IB values map to NodeInfo:NodeType. */
68 RDMA_NODE_IB_CA = 1,
69 RDMA_NODE_IB_SWITCH,
70 RDMA_NODE_IB_ROUTER,
71 RDMA_NODE_RNIC
72 };
73
74 enum rdma_transport_type {
75 RDMA_TRANSPORT_IB,
76 RDMA_TRANSPORT_IWARP
77 };
78
79 enum rdma_transport_type
80 rdma_node_get_transport(enum rdma_node_type node_type) __attribute_const__;
81
82 enum rdma_link_layer {
83 IB_LINK_LAYER_UNSPECIFIED,
84 IB_LINK_LAYER_INFINIBAND,
85 IB_LINK_LAYER_ETHERNET,
86 };
87
88 enum ib_device_cap_flags {
89 IB_DEVICE_RESIZE_MAX_WR = 1,
90 IB_DEVICE_BAD_PKEY_CNTR = (1<<1),
91 IB_DEVICE_BAD_QKEY_CNTR = (1<<2),
92 IB_DEVICE_RAW_MULTI = (1<<3),
93 IB_DEVICE_AUTO_PATH_MIG = (1<<4),
94 IB_DEVICE_CHANGE_PHY_PORT = (1<<5),
95 IB_DEVICE_UD_AV_PORT_ENFORCE = (1<<6),
96 IB_DEVICE_CURR_QP_STATE_MOD = (1<<7),
97 IB_DEVICE_SHUTDOWN_PORT = (1<<8),
98 IB_DEVICE_INIT_TYPE = (1<<9),
99 IB_DEVICE_PORT_ACTIVE_EVENT = (1<<10),
100 IB_DEVICE_SYS_IMAGE_GUID = (1<<11),
101 IB_DEVICE_RC_RNR_NAK_GEN = (1<<12),
102 IB_DEVICE_SRQ_RESIZE = (1<<13),
103 IB_DEVICE_N_NOTIFY_CQ = (1<<14),
104 IB_DEVICE_LOCAL_DMA_LKEY = (1<<15),
105 IB_DEVICE_RESERVED = (1<<16), /* old SEND_W_INV */
106 IB_DEVICE_MEM_WINDOW = (1<<17),
107 /*
108 * Devices should set IB_DEVICE_UD_IP_SUM if they support
109 * insertion of UDP and TCP checksum on outgoing UD IPoIB
110 * messages and can verify the validity of checksum for
111 * incoming messages. Setting this flag implies that the
112 * IPoIB driver may set NETIF_F_IP_CSUM for datagram mode.
113 */
114 IB_DEVICE_UD_IP_CSUM = (1<<18),
115 IB_DEVICE_UD_TSO = (1<<19),
116 IB_DEVICE_XRC = (1<<20),
117 IB_DEVICE_MEM_MGT_EXTENSIONS = (1<<21),
118 IB_DEVICE_BLOCK_MULTICAST_LOOPBACK = (1<<22),
119 IB_DEVICE_MR_ALLOCATE = (1<<23),
120 IB_DEVICE_SHARED_MR = (1<<24),
121 IB_DEVICE_QPG = (1<<25),
122 IB_DEVICE_UD_RSS = (1<<26),
123 IB_DEVICE_UD_TSS = (1<<27)
124 };
125
126 enum ib_atomic_cap {
127 IB_ATOMIC_NONE,
128 IB_ATOMIC_HCA,
129 IB_ATOMIC_GLOB
130 };
131
132 struct ib_device_attr {
133 u64 fw_ver;
134 __be64 sys_image_guid;
135 u64 max_mr_size;
136 u64 page_size_cap;
137 u32 vendor_id;
138 u32 vendor_part_id;
139 u32 hw_ver;
140 int max_qp;
141 int max_qp_wr;
142 int device_cap_flags;
143 int max_sge;
144 int max_sge_rd;
145 int max_cq;
146 int max_cqe;
147 int max_mr;
148 int max_pd;
149 int max_qp_rd_atom;
150 int max_ee_rd_atom;
151 int max_res_rd_atom;
152 int max_qp_init_rd_atom;
153 int max_ee_init_rd_atom;
154 enum ib_atomic_cap atomic_cap;
155 enum ib_atomic_cap masked_atomic_cap;
156 int max_ee;
157 int max_rdd;
158 int max_mw;
159 int max_raw_ipv6_qp;
160 int max_raw_ethy_qp;
161 int max_mcast_grp;
162 int max_mcast_qp_attach;
163 int max_total_mcast_qp_attach;
164 int max_ah;
165 int max_fmr;
166 int max_map_per_fmr;
167 int max_srq;
168 int max_srq_wr;
169 int max_srq_sge;
170 unsigned int max_fast_reg_page_list_len;
171 int max_rss_tbl_sz;
172 u16 max_pkeys;
173 u8 local_ca_ack_delay;
174 };
175
176 enum ib_mtu {
177 IB_MTU_256 = 1,
178 IB_MTU_512 = 2,
179 IB_MTU_1024 = 3,
180 IB_MTU_2048 = 4,
181 IB_MTU_4096 = 5
182 };
183
ib_mtu_enum_to_int(enum ib_mtu mtu)184 static inline int ib_mtu_enum_to_int(enum ib_mtu mtu)
185 {
186 switch (mtu) {
187 case IB_MTU_256: return 256;
188 case IB_MTU_512: return 512;
189 case IB_MTU_1024: return 1024;
190 case IB_MTU_2048: return 2048;
191 case IB_MTU_4096: return 4096;
192 default: return -1;
193 }
194 }
195
196 enum ib_port_state {
197 IB_PORT_NOP = 0,
198 IB_PORT_DOWN = 1,
199 IB_PORT_INIT = 2,
200 IB_PORT_ARMED = 3,
201 IB_PORT_ACTIVE = 4,
202 IB_PORT_ACTIVE_DEFER = 5
203 };
204
205 enum ib_port_cap_flags {
206 IB_PORT_SM = 1 << 1,
207 IB_PORT_NOTICE_SUP = 1 << 2,
208 IB_PORT_TRAP_SUP = 1 << 3,
209 IB_PORT_OPT_IPD_SUP = 1 << 4,
210 IB_PORT_AUTO_MIGR_SUP = 1 << 5,
211 IB_PORT_SL_MAP_SUP = 1 << 6,
212 IB_PORT_MKEY_NVRAM = 1 << 7,
213 IB_PORT_PKEY_NVRAM = 1 << 8,
214 IB_PORT_LED_INFO_SUP = 1 << 9,
215 IB_PORT_SM_DISABLED = 1 << 10,
216 IB_PORT_SYS_IMAGE_GUID_SUP = 1 << 11,
217 IB_PORT_PKEY_SW_EXT_PORT_TRAP_SUP = 1 << 12,
218 IB_PORT_EXTENDED_SPEEDS_SUP = 1 << 14,
219 IB_PORT_CM_SUP = 1 << 16,
220 IB_PORT_SNMP_TUNNEL_SUP = 1 << 17,
221 IB_PORT_REINIT_SUP = 1 << 18,
222 IB_PORT_DEVICE_MGMT_SUP = 1 << 19,
223 IB_PORT_VENDOR_CLASS_SUP = 1 << 20,
224 IB_PORT_DR_NOTICE_SUP = 1 << 21,
225 IB_PORT_CAP_MASK_NOTICE_SUP = 1 << 22,
226 IB_PORT_BOOT_MGMT_SUP = 1 << 23,
227 IB_PORT_LINK_LATENCY_SUP = 1 << 24,
228 IB_PORT_CLIENT_REG_SUP = 1 << 25
229 };
230
231 enum ib_port_width {
232 IB_WIDTH_1X = 1,
233 IB_WIDTH_4X = 2,
234 IB_WIDTH_8X = 4,
235 IB_WIDTH_12X = 8
236 };
237
ib_width_enum_to_int(enum ib_port_width width)238 static inline int ib_width_enum_to_int(enum ib_port_width width)
239 {
240 switch (width) {
241 case IB_WIDTH_1X: return 1;
242 case IB_WIDTH_4X: return 4;
243 case IB_WIDTH_8X: return 8;
244 case IB_WIDTH_12X: return 12;
245 default: return -1;
246 }
247 }
248
249 enum ib_port_speed {
250 IB_SPEED_SDR = 1,
251 IB_SPEED_DDR = 2,
252 IB_SPEED_QDR = 4,
253 IB_SPEED_FDR10 = 8,
254 IB_SPEED_FDR = 16,
255 IB_SPEED_EDR = 32
256 };
257
258 struct ib_protocol_stats {
259 /* TBD... */
260 };
261
262 struct iw_protocol_stats {
263 u64 ipInReceives;
264 u64 ipInHdrErrors;
265 u64 ipInTooBigErrors;
266 u64 ipInNoRoutes;
267 u64 ipInAddrErrors;
268 u64 ipInUnknownProtos;
269 u64 ipInTruncatedPkts;
270 u64 ipInDiscards;
271 u64 ipInDelivers;
272 u64 ipOutForwDatagrams;
273 u64 ipOutRequests;
274 u64 ipOutDiscards;
275 u64 ipOutNoRoutes;
276 u64 ipReasmTimeout;
277 u64 ipReasmReqds;
278 u64 ipReasmOKs;
279 u64 ipReasmFails;
280 u64 ipFragOKs;
281 u64 ipFragFails;
282 u64 ipFragCreates;
283 u64 ipInMcastPkts;
284 u64 ipOutMcastPkts;
285 u64 ipInBcastPkts;
286 u64 ipOutBcastPkts;
287
288 u64 tcpRtoAlgorithm;
289 u64 tcpRtoMin;
290 u64 tcpRtoMax;
291 u64 tcpMaxConn;
292 u64 tcpActiveOpens;
293 u64 tcpPassiveOpens;
294 u64 tcpAttemptFails;
295 u64 tcpEstabResets;
296 u64 tcpCurrEstab;
297 u64 tcpInSegs;
298 u64 tcpOutSegs;
299 u64 tcpRetransSegs;
300 u64 tcpInErrs;
301 u64 tcpOutRsts;
302 };
303
304 union rdma_protocol_stats {
305 struct ib_protocol_stats ib;
306 struct iw_protocol_stats iw;
307 };
308
309 /* Define bits for the various functionality this port needs to be supported by
310 * the core.
311 */
312 /* Management 0x00000FFF */
313 #define RDMA_CORE_CAP_IB_MAD 0x00000001
314 #define RDMA_CORE_CAP_IB_SMI 0x00000002
315 #define RDMA_CORE_CAP_IB_CM 0x00000004
316 #define RDMA_CORE_CAP_IW_CM 0x00000008
317 #define RDMA_CORE_CAP_IB_SA 0x00000010
318 #define RDMA_CORE_CAP_OPA_MAD 0x00000020
319
320 /* Address format 0x000FF000 */
321 #define RDMA_CORE_CAP_AF_IB 0x00001000
322 #define RDMA_CORE_CAP_ETH_AH 0x00002000
323 #define RDMA_CORE_CAP_OPA_AH 0x00004000
324
325 /* Protocol 0xFFF00000 */
326 #define RDMA_CORE_CAP_PROT_IB 0x00100000
327 #define RDMA_CORE_CAP_PROT_ROCE 0x00200000
328 #define RDMA_CORE_CAP_PROT_IWARP 0x00400000
329 #define RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP 0x00800000
330 #define RDMA_CORE_CAP_PROT_RAW_PACKET 0x01000000
331 #define RDMA_CORE_CAP_PROT_USNIC 0x02000000
332
333 #define RDMA_CORE_PORT_IBA_IB (RDMA_CORE_CAP_PROT_IB \
334 | RDMA_CORE_CAP_IB_MAD \
335 | RDMA_CORE_CAP_IB_SMI \
336 | RDMA_CORE_CAP_IB_CM \
337 | RDMA_CORE_CAP_IB_SA \
338 | RDMA_CORE_CAP_AF_IB)
339 #define RDMA_CORE_PORT_IBA_ROCE (RDMA_CORE_CAP_PROT_ROCE \
340 | RDMA_CORE_CAP_IB_MAD \
341 | RDMA_CORE_CAP_IB_CM \
342 | RDMA_CORE_CAP_AF_IB \
343 | RDMA_CORE_CAP_ETH_AH)
344 #define RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP \
345 (RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP \
346 | RDMA_CORE_CAP_IB_MAD \
347 | RDMA_CORE_CAP_IB_CM \
348 | RDMA_CORE_CAP_AF_IB \
349 | RDMA_CORE_CAP_ETH_AH)
350 #define RDMA_CORE_PORT_IWARP (RDMA_CORE_CAP_PROT_IWARP \
351 | RDMA_CORE_CAP_IW_CM)
352 #define RDMA_CORE_PORT_INTEL_OPA (RDMA_CORE_PORT_IBA_IB \
353 | RDMA_CORE_CAP_OPA_MAD)
354
355 #define RDMA_CORE_PORT_RAW_PACKET (RDMA_CORE_CAP_PROT_RAW_PACKET)
356
357 #define RDMA_CORE_PORT_USNIC (RDMA_CORE_CAP_PROT_USNIC)
358
359 struct ib_port_attr {
360 enum ib_port_state state;
361 enum ib_mtu max_mtu;
362 enum ib_mtu active_mtu;
363 int gid_tbl_len;
364 u32 port_cap_flags;
365 u32 max_msg_sz;
366 u32 bad_pkey_cntr;
367 u32 qkey_viol_cntr;
368 u16 pkey_tbl_len;
369 u16 lid;
370 u16 sm_lid;
371 u8 lmc;
372 u8 max_vl_num;
373 u8 sm_sl;
374 u8 subnet_timeout;
375 u8 init_type_reply;
376 u8 active_width;
377 u8 active_speed;
378 u8 phys_state;
379 enum rdma_link_layer link_layer;
380 };
381
382 enum ib_device_modify_flags {
383 IB_DEVICE_MODIFY_SYS_IMAGE_GUID = 1 << 0,
384 IB_DEVICE_MODIFY_NODE_DESC = 1 << 1
385 };
386
387 struct ib_device_modify {
388 u64 sys_image_guid;
389 char node_desc[64];
390 };
391
392 enum ib_port_modify_flags {
393 IB_PORT_SHUTDOWN = 1,
394 IB_PORT_INIT_TYPE = (1<<2),
395 IB_PORT_RESET_QKEY_CNTR = (1<<3)
396 };
397
398 struct ib_port_modify {
399 u32 set_port_cap_mask;
400 u32 clr_port_cap_mask;
401 u8 init_type;
402 };
403
404 enum ib_event_type {
405 IB_EVENT_CQ_ERR,
406 IB_EVENT_QP_FATAL,
407 IB_EVENT_QP_REQ_ERR,
408 IB_EVENT_QP_ACCESS_ERR,
409 IB_EVENT_COMM_EST,
410 IB_EVENT_SQ_DRAINED,
411 IB_EVENT_PATH_MIG,
412 IB_EVENT_PATH_MIG_ERR,
413 IB_EVENT_DEVICE_FATAL,
414 IB_EVENT_PORT_ACTIVE,
415 IB_EVENT_PORT_ERR,
416 IB_EVENT_LID_CHANGE,
417 IB_EVENT_PKEY_CHANGE,
418 IB_EVENT_SM_CHANGE,
419 IB_EVENT_SRQ_ERR,
420 IB_EVENT_SRQ_LIMIT_REACHED,
421 IB_EVENT_QP_LAST_WQE_REACHED,
422 IB_EVENT_CLIENT_REREGISTER,
423 IB_EVENT_GID_CHANGE,
424 };
425
426 enum ib_event_flags {
427 IB_XRC_QP_EVENT_FLAG = 0x80000000,
428 };
429
430 struct ib_event {
431 struct ib_device *device;
432 union {
433 struct ib_cq *cq;
434 struct ib_qp *qp;
435 struct ib_srq *srq;
436 u8 port_num;
437 u32 xrc_qp_num;
438 } element;
439 enum ib_event_type event;
440 };
441
442 struct ib_event_handler {
443 struct ib_device *device;
444 void (*handler)(struct ib_event_handler *, struct ib_event *);
445 struct list_head list;
446 };
447
448 #define INIT_IB_EVENT_HANDLER(_ptr, _device, _handler) \
449 do { \
450 (_ptr)->device = _device; \
451 (_ptr)->handler = _handler; \
452 INIT_LIST_HEAD(&(_ptr)->list); \
453 } while (0)
454
455 struct ib_global_route {
456 union ib_gid dgid;
457 u32 flow_label;
458 u8 sgid_index;
459 u8 hop_limit;
460 u8 traffic_class;
461 };
462
463 struct ib_grh {
464 __be32 version_tclass_flow;
465 __be16 paylen;
466 u8 next_hdr;
467 u8 hop_limit;
468 union ib_gid sgid;
469 union ib_gid dgid;
470 };
471
472 enum {
473 IB_MULTICAST_QPN = 0xffffff
474 };
475
476 #define IB_LID_PERMISSIVE cpu_to_be16(0xFFFF)
477
478 enum ib_ah_flags {
479 IB_AH_GRH = 1
480 };
481
482 enum ib_rate {
483 IB_RATE_PORT_CURRENT = 0,
484 IB_RATE_2_5_GBPS = 2,
485 IB_RATE_5_GBPS = 5,
486 IB_RATE_10_GBPS = 3,
487 IB_RATE_20_GBPS = 6,
488 IB_RATE_30_GBPS = 4,
489 IB_RATE_40_GBPS = 7,
490 IB_RATE_60_GBPS = 8,
491 IB_RATE_80_GBPS = 9,
492 IB_RATE_120_GBPS = 10,
493 IB_RATE_14_GBPS = 11,
494 IB_RATE_56_GBPS = 12,
495 IB_RATE_112_GBPS = 13,
496 IB_RATE_168_GBPS = 14,
497 IB_RATE_25_GBPS = 15,
498 IB_RATE_100_GBPS = 16,
499 IB_RATE_200_GBPS = 17,
500 IB_RATE_300_GBPS = 18
501 };
502
503 /**
504 * ib_rate_to_mult - Convert the IB rate enum to a multiple of the
505 * base rate of 2.5 Gbit/sec. For example, IB_RATE_5_GBPS will be
506 * converted to 2, since 5 Gbit/sec is 2 * 2.5 Gbit/sec.
507 * @rate: rate to convert.
508 */
509 int ib_rate_to_mult(enum ib_rate rate) __attribute_const__;
510
511 /**
512 * ib_rate_to_mbps - Convert the IB rate enum to Mbps.
513 * For example, IB_RATE_2_5_GBPS will be converted to 2500.
514 * @rate: rate to convert.
515 */
516 int ib_rate_to_mbps(enum ib_rate rate) __attribute_const__;
517
518 /**
519 * mult_to_ib_rate - Convert a multiple of 2.5 Gbit/sec to an IB rate
520 * enum.
521 * @mult: multiple to convert.
522 */
523 enum ib_rate mult_to_ib_rate(int mult) __attribute_const__;
524
525 struct ib_ah_attr {
526 struct ib_global_route grh;
527 u16 dlid;
528 u8 sl;
529 u8 src_path_bits;
530 u8 static_rate;
531 u8 ah_flags;
532 u8 port_num;
533 };
534
535 enum ib_wc_status {
536 IB_WC_SUCCESS,
537 IB_WC_LOC_LEN_ERR,
538 IB_WC_LOC_QP_OP_ERR,
539 IB_WC_LOC_EEC_OP_ERR,
540 IB_WC_LOC_PROT_ERR,
541 IB_WC_WR_FLUSH_ERR,
542 IB_WC_MW_BIND_ERR,
543 IB_WC_BAD_RESP_ERR,
544 IB_WC_LOC_ACCESS_ERR,
545 IB_WC_REM_INV_REQ_ERR,
546 IB_WC_REM_ACCESS_ERR,
547 IB_WC_REM_OP_ERR,
548 IB_WC_RETRY_EXC_ERR,
549 IB_WC_RNR_RETRY_EXC_ERR,
550 IB_WC_LOC_RDD_VIOL_ERR,
551 IB_WC_REM_INV_RD_REQ_ERR,
552 IB_WC_REM_ABORT_ERR,
553 IB_WC_INV_EECN_ERR,
554 IB_WC_INV_EEC_STATE_ERR,
555 IB_WC_FATAL_ERR,
556 IB_WC_RESP_TIMEOUT_ERR,
557 IB_WC_GENERAL_ERR
558 };
559
560 enum ib_wc_opcode {
561 IB_WC_SEND,
562 IB_WC_RDMA_WRITE,
563 IB_WC_RDMA_READ,
564 IB_WC_COMP_SWAP,
565 IB_WC_FETCH_ADD,
566 IB_WC_BIND_MW,
567 IB_WC_LSO,
568 IB_WC_LOCAL_INV,
569 IB_WC_FAST_REG_MR,
570 IB_WC_MASKED_COMP_SWAP,
571 IB_WC_MASKED_FETCH_ADD,
572 /*
573 * Set value of IB_WC_RECV so consumers can test if a completion is a
574 * receive by testing (opcode & IB_WC_RECV).
575 */
576 IB_WC_RECV = 1 << 7,
577 IB_WC_RECV_RDMA_WITH_IMM
578 };
579
580 enum ib_wc_flags {
581 IB_WC_GRH = 1,
582 IB_WC_WITH_IMM = (1<<1),
583 IB_WC_WITH_INVALIDATE = (1<<2),
584 IB_WC_IP_CSUM_OK = (1<<3),
585 };
586
587 struct ib_wc {
588 u64 wr_id;
589 enum ib_wc_status status;
590 enum ib_wc_opcode opcode;
591 u32 vendor_err;
592 u32 byte_len;
593 struct ib_qp *qp;
594 union {
595 __be32 imm_data;
596 u32 invalidate_rkey;
597 } ex;
598 u32 src_qp;
599 int wc_flags;
600 u16 pkey_index;
601 u16 slid;
602 u8 sl;
603 u8 dlid_path_bits;
604 u8 port_num; /* valid only for DR SMPs on switches */
605 int csum_ok;
606 };
607
608 enum ib_cq_notify_flags {
609 IB_CQ_SOLICITED = 1 << 0,
610 IB_CQ_NEXT_COMP = 1 << 1,
611 IB_CQ_SOLICITED_MASK = IB_CQ_SOLICITED | IB_CQ_NEXT_COMP,
612 IB_CQ_REPORT_MISSED_EVENTS = 1 << 2,
613 };
614
615 enum ib_srq_type {
616 IB_SRQT_BASIC,
617 IB_SRQT_XRC
618 };
619
620 enum ib_srq_attr_mask {
621 IB_SRQ_MAX_WR = 1 << 0,
622 IB_SRQ_LIMIT = 1 << 1,
623 };
624
625 struct ib_srq_attr {
626 u32 max_wr;
627 u32 max_sge;
628 u32 srq_limit;
629 };
630
631 struct ib_srq_init_attr {
632 void (*event_handler)(struct ib_event *, void *);
633 void *srq_context;
634 struct ib_srq_attr attr;
635 enum ib_srq_type srq_type;
636
637 union {
638 struct {
639 struct ib_xrcd *xrcd;
640 struct ib_cq *cq;
641 } xrc;
642 } ext;
643 };
644
645 struct ib_qp_cap {
646 u32 max_send_wr;
647 u32 max_recv_wr;
648 u32 max_send_sge;
649 u32 max_recv_sge;
650 u32 max_inline_data;
651 u32 qpg_tss_mask_sz;
652 };
653
654 enum ib_sig_type {
655 IB_SIGNAL_ALL_WR,
656 IB_SIGNAL_REQ_WR
657 };
658
659 enum ib_qp_type {
660 /*
661 * IB_QPT_SMI and IB_QPT_GSI have to be the first two entries
662 * here (and in that order) since the MAD layer uses them as
663 * indices into a 2-entry table.
664 */
665 IB_QPT_SMI,
666 IB_QPT_GSI,
667
668 IB_QPT_RC,
669 IB_QPT_UC,
670 IB_QPT_UD,
671 IB_QPT_XRC,
672 IB_QPT_RAW_IPV6,
673 IB_QPT_RAW_ETHERTYPE,
674 IB_QPT_RAW_PACKET = 8,
675 IB_QPT_XRC_INI = 9,
676 IB_QPT_XRC_TGT,
677 IB_QPT_MAX,
678 };
679
680 enum ib_qp_create_flags {
681 IB_QP_CREATE_IPOIB_UD_LSO = 1 << 0,
682 IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK = 1 << 1,
683 IB_QP_CREATE_NETIF_QP = 1 << 2,
684 /* reserve bits 26-31 for low level drivers' internal use */
685 IB_QP_CREATE_RESERVED_START = 1 << 26,
686 IB_QP_CREATE_RESERVED_END = 1 << 31,
687 };
688
689 enum ib_qpg_type {
690 IB_QPG_NONE = 0,
691 IB_QPG_PARENT = (1<<0),
692 IB_QPG_CHILD_RX = (1<<1),
693 IB_QPG_CHILD_TX = (1<<2)
694 };
695
696 struct ib_qpg_init_attrib {
697 u32 tss_child_count;
698 u32 rss_child_count;
699 };
700
701 struct ib_qp_init_attr {
702 void (*event_handler)(struct ib_event *, void *);
703 void *qp_context;
704 struct ib_cq *send_cq;
705 struct ib_cq *recv_cq;
706 struct ib_srq *srq;
707 struct ib_xrcd *xrcd; /* XRC TGT QPs only */
708 struct ib_qp_cap cap;
709 union {
710 struct ib_qp *qpg_parent; /* see qpg_type */
711 struct ib_qpg_init_attrib parent_attrib;
712 } pp;
713 enum ib_sig_type sq_sig_type;
714 enum ib_qp_type qp_type;
715 enum ib_qp_create_flags create_flags;
716 enum ib_qpg_type qpg_type;
717 u8 port_num; /* special QP types only */
718 };
719
720 struct ib_qp_open_attr {
721 void (*event_handler)(struct ib_event *, void *);
722 void *qp_context;
723 u32 qp_num;
724 enum ib_qp_type qp_type;
725 };
726
727 enum ib_rnr_timeout {
728 IB_RNR_TIMER_655_36 = 0,
729 IB_RNR_TIMER_000_01 = 1,
730 IB_RNR_TIMER_000_02 = 2,
731 IB_RNR_TIMER_000_03 = 3,
732 IB_RNR_TIMER_000_04 = 4,
733 IB_RNR_TIMER_000_06 = 5,
734 IB_RNR_TIMER_000_08 = 6,
735 IB_RNR_TIMER_000_12 = 7,
736 IB_RNR_TIMER_000_16 = 8,
737 IB_RNR_TIMER_000_24 = 9,
738 IB_RNR_TIMER_000_32 = 10,
739 IB_RNR_TIMER_000_48 = 11,
740 IB_RNR_TIMER_000_64 = 12,
741 IB_RNR_TIMER_000_96 = 13,
742 IB_RNR_TIMER_001_28 = 14,
743 IB_RNR_TIMER_001_92 = 15,
744 IB_RNR_TIMER_002_56 = 16,
745 IB_RNR_TIMER_003_84 = 17,
746 IB_RNR_TIMER_005_12 = 18,
747 IB_RNR_TIMER_007_68 = 19,
748 IB_RNR_TIMER_010_24 = 20,
749 IB_RNR_TIMER_015_36 = 21,
750 IB_RNR_TIMER_020_48 = 22,
751 IB_RNR_TIMER_030_72 = 23,
752 IB_RNR_TIMER_040_96 = 24,
753 IB_RNR_TIMER_061_44 = 25,
754 IB_RNR_TIMER_081_92 = 26,
755 IB_RNR_TIMER_122_88 = 27,
756 IB_RNR_TIMER_163_84 = 28,
757 IB_RNR_TIMER_245_76 = 29,
758 IB_RNR_TIMER_327_68 = 30,
759 IB_RNR_TIMER_491_52 = 31
760 };
761
762 enum ib_qp_attr_mask {
763 IB_QP_STATE = 1,
764 IB_QP_CUR_STATE = (1<<1),
765 IB_QP_EN_SQD_ASYNC_NOTIFY = (1<<2),
766 IB_QP_ACCESS_FLAGS = (1<<3),
767 IB_QP_PKEY_INDEX = (1<<4),
768 IB_QP_PORT = (1<<5),
769 IB_QP_QKEY = (1<<6),
770 IB_QP_AV = (1<<7),
771 IB_QP_PATH_MTU = (1<<8),
772 IB_QP_TIMEOUT = (1<<9),
773 IB_QP_RETRY_CNT = (1<<10),
774 IB_QP_RNR_RETRY = (1<<11),
775 IB_QP_RQ_PSN = (1<<12),
776 IB_QP_MAX_QP_RD_ATOMIC = (1<<13),
777 IB_QP_ALT_PATH = (1<<14),
778 IB_QP_MIN_RNR_TIMER = (1<<15),
779 IB_QP_SQ_PSN = (1<<16),
780 IB_QP_MAX_DEST_RD_ATOMIC = (1<<17),
781 IB_QP_PATH_MIG_STATE = (1<<18),
782 IB_QP_CAP = (1<<19),
783 IB_QP_DEST_QPN = (1<<20),
784 IB_QP_GROUP_RSS = (1<<21)
785 };
786
787 enum ib_qp_state {
788 IB_QPS_RESET,
789 IB_QPS_INIT,
790 IB_QPS_RTR,
791 IB_QPS_RTS,
792 IB_QPS_SQD,
793 IB_QPS_SQE,
794 IB_QPS_ERR
795 };
796
797 enum ib_mig_state {
798 IB_MIG_MIGRATED,
799 IB_MIG_REARM,
800 IB_MIG_ARMED
801 };
802
803 struct ib_qp_attr {
804 enum ib_qp_state qp_state;
805 enum ib_qp_state cur_qp_state;
806 enum ib_mtu path_mtu;
807 enum ib_mig_state path_mig_state;
808 u32 qkey;
809 u32 rq_psn;
810 u32 sq_psn;
811 u32 dest_qp_num;
812 int qp_access_flags;
813 struct ib_qp_cap cap;
814 struct ib_ah_attr ah_attr;
815 struct ib_ah_attr alt_ah_attr;
816 u16 pkey_index;
817 u16 alt_pkey_index;
818 u8 en_sqd_async_notify;
819 u8 sq_draining;
820 u8 max_rd_atomic;
821 u8 max_dest_rd_atomic;
822 u8 min_rnr_timer;
823 u8 port_num;
824 u8 timeout;
825 u8 retry_cnt;
826 u8 rnr_retry;
827 u8 alt_port_num;
828 u8 alt_timeout;
829 };
830
831 enum ib_wr_opcode {
832 IB_WR_RDMA_WRITE,
833 IB_WR_RDMA_WRITE_WITH_IMM,
834 IB_WR_SEND,
835 IB_WR_SEND_WITH_IMM,
836 IB_WR_RDMA_READ,
837 IB_WR_ATOMIC_CMP_AND_SWP,
838 IB_WR_ATOMIC_FETCH_AND_ADD,
839 IB_WR_LSO,
840 IB_WR_BIG_LSO,
841 IB_WR_SEND_WITH_INV,
842 IB_WR_RDMA_READ_WITH_INV,
843 IB_WR_LOCAL_INV,
844 IB_WR_FAST_REG_MR,
845 IB_WR_MASKED_ATOMIC_CMP_AND_SWP,
846 IB_WR_MASKED_ATOMIC_FETCH_AND_ADD,
847 };
848
849 enum ib_send_flags {
850 IB_SEND_FENCE = 1,
851 IB_SEND_SIGNALED = (1<<1),
852 IB_SEND_SOLICITED = (1<<2),
853 IB_SEND_INLINE = (1<<3),
854 IB_SEND_IP_CSUM = (1<<4)
855 };
856
857 enum ib_flow_types {
858 IB_FLOW_ETH = 0,
859 IB_FLOW_IB_UC = 1,
860 IB_FLOW_IB_MC_IPV4 = 2,
861 IB_FLOW_IB_MC_IPV6 = 3
862 };
863
864 enum {
865 IB_FLOW_L4_NONE = 0,
866 IB_FLOW_L4_OTHER = 3,
867 IB_FLOW_L4_UDP = 5,
868 IB_FLOW_L4_TCP = 6
869 };
870
871 struct ib_sge {
872 u64 addr;
873 u32 length;
874 u32 lkey;
875 };
876
877 struct ib_fast_reg_page_list {
878 struct ib_device *device;
879 u64 *page_list;
880 unsigned int max_page_list_len;
881 };
882
883 struct ib_send_wr {
884 struct ib_send_wr *next;
885 u64 wr_id;
886 struct ib_sge *sg_list;
887 int num_sge;
888 enum ib_wr_opcode opcode;
889 int send_flags;
890 union {
891 __be32 imm_data;
892 u32 invalidate_rkey;
893 } ex;
894 union {
895 struct {
896 u64 remote_addr;
897 u32 rkey;
898 } rdma;
899 struct {
900 u64 remote_addr;
901 u64 compare_add;
902 u64 swap;
903 u64 compare_add_mask;
904 u64 swap_mask;
905 u32 rkey;
906 } atomic;
907 struct {
908 struct ib_ah *ah;
909 void *header;
910 int hlen;
911 int mss;
912 u32 remote_qpn;
913 u32 remote_qkey;
914 u16 pkey_index; /* valid for GSI only */
915 u8 port_num; /* valid for DR SMPs on switch only */
916 } ud;
917 struct {
918 u64 iova_start;
919 struct ib_fast_reg_page_list *page_list;
920 unsigned int page_shift;
921 unsigned int page_list_len;
922 u32 length;
923 int access_flags;
924 u32 rkey;
925 } fast_reg;
926 struct {
927 struct ib_unpacked_lrh *lrh;
928 u32 eth_type;
929 u8 static_rate;
930 } raw_ety;
931 } wr;
932 u32 xrc_remote_srq_num; /* XRC TGT QPs only */
933 };
934
935 struct ib_recv_wr {
936 struct ib_recv_wr *next;
937 u64 wr_id;
938 struct ib_sge *sg_list;
939 int num_sge;
940 };
941
942 enum ib_access_flags {
943 IB_ACCESS_LOCAL_WRITE = 1,
944 IB_ACCESS_REMOTE_WRITE = (1<<1),
945 IB_ACCESS_REMOTE_READ = (1<<2),
946 IB_ACCESS_REMOTE_ATOMIC = (1<<3),
947 IB_ACCESS_MW_BIND = (1<<4),
948 IB_ACCESS_ALLOCATE_MR = (1<<5),
949 IB_ACCESS_SHARED_MR_USER_READ = (1<<6),
950 IB_ACCESS_SHARED_MR_USER_WRITE = (1<<7),
951 IB_ACCESS_SHARED_MR_GROUP_READ = (1<<8),
952 IB_ACCESS_SHARED_MR_GROUP_WRITE = (1<<9),
953 IB_ACCESS_SHARED_MR_OTHER_READ = (1<<10),
954 IB_ACCESS_SHARED_MR_OTHER_WRITE = (1<<11)
955
956 };
957
958 struct ib_phys_buf {
959 u64 addr;
960 u64 size;
961 };
962
963 struct ib_mr_attr {
964 struct ib_pd *pd;
965 u64 device_virt_addr;
966 u64 size;
967 int mr_access_flags;
968 u32 lkey;
969 u32 rkey;
970 };
971
972 enum ib_mr_rereg_flags {
973 IB_MR_REREG_TRANS = 1,
974 IB_MR_REREG_PD = (1<<1),
975 IB_MR_REREG_ACCESS = (1<<2)
976 };
977
978 struct ib_mw_bind {
979 struct ib_mr *mr;
980 u64 wr_id;
981 u64 addr;
982 u32 length;
983 int send_flags;
984 int mw_access_flags;
985 };
986
987 struct ib_fmr_attr {
988 int max_pages;
989 int max_maps;
990 u8 page_shift;
991 };
992
993 struct ib_ucontext {
994 struct ib_device *device;
995 struct list_head pd_list;
996 struct list_head mr_list;
997 struct list_head mw_list;
998 struct list_head cq_list;
999 struct list_head qp_list;
1000 struct list_head srq_list;
1001 struct list_head ah_list;
1002 struct list_head xrcd_list;
1003 int closing;
1004 };
1005
1006 struct ib_uobject {
1007 u64 user_handle; /* handle given to us by userspace */
1008 struct ib_ucontext *context; /* associated user context */
1009 void *object; /* containing object */
1010 struct list_head list; /* link to context's list */
1011 int id; /* index into kernel idr */
1012 struct kref ref;
1013 struct rw_semaphore mutex; /* protects .live */
1014 int live;
1015 };
1016
1017 struct ib_udata {
1018 void __user *inbuf;
1019 void __user *outbuf;
1020 size_t inlen;
1021 size_t outlen;
1022 };
1023
1024 struct ib_uxrc_rcv_object {
1025 struct list_head list; /* link to context's list */
1026 u32 qp_num;
1027 u32 domain_handle;
1028 };
1029
1030 struct ib_pd {
1031 struct ib_device *device;
1032 struct ib_uobject *uobject;
1033 atomic_t usecnt; /* count all resources */
1034 };
1035
1036 struct ib_xrcd {
1037 struct ib_device *device;
1038 struct ib_uobject *uobject;
1039 atomic_t usecnt; /* count all exposed resources */
1040 struct inode *inode;
1041 struct rb_node node;
1042
1043 struct mutex tgt_qp_mutex;
1044 struct list_head tgt_qp_list;
1045 };
1046
1047 struct ib_ah {
1048 struct ib_device *device;
1049 struct ib_pd *pd;
1050 struct ib_uobject *uobject;
1051 };
1052
1053 typedef void (*ib_comp_handler)(struct ib_cq *cq, void *cq_context);
1054
1055 struct ib_cq {
1056 struct ib_device *device;
1057 struct ib_uobject *uobject;
1058 ib_comp_handler comp_handler;
1059 void (*event_handler)(struct ib_event *, void *);
1060 void *cq_context;
1061 int cqe;
1062 atomic_t usecnt; /* count number of work queues */
1063 };
1064
1065 struct ib_srq {
1066 struct ib_device *device;
1067 struct ib_pd *pd;
1068 struct ib_uobject *uobject;
1069 void (*event_handler)(struct ib_event *, void *);
1070 void *srq_context;
1071 enum ib_srq_type srq_type;
1072 atomic_t usecnt;
1073
1074 union {
1075 struct {
1076 struct ib_xrcd *xrcd;
1077 struct ib_cq *cq;
1078 u32 srq_num;
1079 } xrc;
1080 } ext;
1081 };
1082
1083 struct ib_qp {
1084 struct ib_device *device;
1085 struct ib_pd *pd;
1086 struct ib_cq *send_cq;
1087 struct ib_cq *recv_cq;
1088 struct ib_srq *srq;
1089 struct ib_xrcd *xrcd; /* XRC TGT QPs only */
1090 struct list_head xrcd_list;
1091 atomic_t usecnt; /* count times opened, mcast attaches */
1092 struct list_head open_list;
1093 struct ib_qp *real_qp;
1094 struct ib_uobject *uobject;
1095 void (*event_handler)(struct ib_event *, void *);
1096 void *qp_context;
1097 u32 qp_num;
1098 enum ib_qp_type qp_type;
1099 enum ib_qpg_type qpg_type;
1100 };
1101
1102 struct ib_mr {
1103 struct ib_device *device;
1104 struct ib_pd *pd;
1105 struct ib_uobject *uobject;
1106 u32 lkey;
1107 u32 rkey;
1108 atomic_t usecnt; /* count number of MWs */
1109 };
1110
1111 struct ib_mw {
1112 struct ib_device *device;
1113 struct ib_pd *pd;
1114 struct ib_uobject *uobject;
1115 u32 rkey;
1116 };
1117
1118 struct ib_fmr {
1119 struct ib_device *device;
1120 struct ib_pd *pd;
1121 struct list_head list;
1122 u32 lkey;
1123 u32 rkey;
1124 };
1125
1126 struct ib_flow_spec {
1127 enum ib_flow_types type;
1128 union {
1129 struct {
1130 __be16 ethertype;
1131 __be16 vlan;
1132 u8 vlan_present;
1133 u8 mac[6];
1134 u8 port;
1135 } eth;
1136 struct {
1137 __be32 qpn;
1138 } ib_uc;
1139 struct {
1140 u8 mgid[16];
1141 } ib_mc;
1142 } l2_id;
1143 __be32 src_ip;
1144 __be32 dst_ip;
1145 __be16 src_port;
1146 __be16 dst_port;
1147 u8 l4_protocol;
1148 u8 block_mc_loopback;
1149 u8 rule_type;
1150 };
1151
1152 struct ib_mad;
1153 struct ib_grh;
1154
1155 enum ib_process_mad_flags {
1156 IB_MAD_IGNORE_MKEY = 1,
1157 IB_MAD_IGNORE_BKEY = 2,
1158 IB_MAD_IGNORE_ALL = IB_MAD_IGNORE_MKEY | IB_MAD_IGNORE_BKEY
1159 };
1160
1161 enum ib_mad_result {
1162 IB_MAD_RESULT_FAILURE = 0, /* (!SUCCESS is the important flag) */
1163 IB_MAD_RESULT_SUCCESS = 1 << 0, /* MAD was successfully processed */
1164 IB_MAD_RESULT_REPLY = 1 << 1, /* Reply packet needs to be sent */
1165 IB_MAD_RESULT_CONSUMED = 1 << 2 /* Packet consumed: stop processing */
1166 };
1167
1168 #define IB_DEVICE_NAME_MAX 64
1169
1170 struct ib_cache {
1171 rwlock_t lock;
1172 struct ib_event_handler event_handler;
1173 struct ib_pkey_cache **pkey_cache;
1174 struct ib_gid_cache **gid_cache;
1175 u8 *lmc_cache;
1176 };
1177
1178 struct ib_dma_mapping_ops {
1179 int (*mapping_error)(struct ib_device *dev,
1180 u64 dma_addr);
1181 u64 (*map_single)(struct ib_device *dev,
1182 void *ptr, size_t size,
1183 enum dma_data_direction direction);
1184 void (*unmap_single)(struct ib_device *dev,
1185 u64 addr, size_t size,
1186 enum dma_data_direction direction);
1187 u64 (*map_page)(struct ib_device *dev,
1188 struct page *page, unsigned long offset,
1189 size_t size,
1190 enum dma_data_direction direction);
1191 void (*unmap_page)(struct ib_device *dev,
1192 u64 addr, size_t size,
1193 enum dma_data_direction direction);
1194 int (*map_sg)(struct ib_device *dev,
1195 struct scatterlist *sg, int nents,
1196 enum dma_data_direction direction);
1197 void (*unmap_sg)(struct ib_device *dev,
1198 struct scatterlist *sg, int nents,
1199 enum dma_data_direction direction);
1200 u64 (*dma_address)(struct ib_device *dev,
1201 struct scatterlist *sg);
1202 unsigned int (*dma_len)(struct ib_device *dev,
1203 struct scatterlist *sg);
1204 void (*sync_single_for_cpu)(struct ib_device *dev,
1205 u64 dma_handle,
1206 size_t size,
1207 enum dma_data_direction dir);
1208 void (*sync_single_for_device)(struct ib_device *dev,
1209 u64 dma_handle,
1210 size_t size,
1211 enum dma_data_direction dir);
1212 void *(*alloc_coherent)(struct ib_device *dev,
1213 size_t size,
1214 u64 *dma_handle,
1215 gfp_t flag);
1216 void (*free_coherent)(struct ib_device *dev,
1217 size_t size, void *cpu_addr,
1218 u64 dma_handle);
1219 };
1220
1221 struct iw_cm_verbs;
1222
1223 struct ib_port_immutable {
1224 int pkey_tbl_len;
1225 int gid_tbl_len;
1226 u32 core_cap_flags;
1227 u32 max_mad_size;
1228 };
1229
1230 struct ib_device {
1231 struct device *dma_device;
1232
1233 char name[IB_DEVICE_NAME_MAX];
1234
1235 struct list_head event_handler_list;
1236 spinlock_t event_handler_lock;
1237
1238 spinlock_t client_data_lock;
1239 struct list_head core_list;
1240 struct list_head client_data_list;
1241
1242 struct ib_cache cache;
1243 /**
1244 * port_immutable is indexed by port number
1245 */
1246 struct ib_port_immutable *port_immutable;
1247
1248 int num_comp_vectors;
1249
1250 struct iw_cm_verbs *iwcm;
1251
1252 int (*get_protocol_stats)(struct ib_device *device,
1253 union rdma_protocol_stats *stats);
1254 int (*query_device)(struct ib_device *device,
1255 struct ib_device_attr *device_attr);
1256 int (*query_port)(struct ib_device *device,
1257 u8 port_num,
1258 struct ib_port_attr *port_attr);
1259 enum rdma_link_layer (*get_link_layer)(struct ib_device *device,
1260 u8 port_num);
1261 int (*query_gid)(struct ib_device *device,
1262 u8 port_num, int index,
1263 union ib_gid *gid);
1264 int (*query_pkey)(struct ib_device *device,
1265 u8 port_num, u16 index, u16 *pkey);
1266 int (*modify_device)(struct ib_device *device,
1267 int device_modify_mask,
1268 struct ib_device_modify *device_modify);
1269 int (*modify_port)(struct ib_device *device,
1270 u8 port_num, int port_modify_mask,
1271 struct ib_port_modify *port_modify);
1272 struct ib_ucontext * (*alloc_ucontext)(struct ib_device *device,
1273 struct ib_udata *udata);
1274 int (*dealloc_ucontext)(struct ib_ucontext *context);
1275 int (*mmap)(struct ib_ucontext *context,
1276 struct vm_area_struct *vma);
1277 struct ib_pd * (*alloc_pd)(struct ib_device *device,
1278 struct ib_ucontext *context,
1279 struct ib_udata *udata);
1280 int (*dealloc_pd)(struct ib_pd *pd);
1281 struct ib_ah * (*create_ah)(struct ib_pd *pd,
1282 struct ib_ah_attr *ah_attr);
1283 int (*modify_ah)(struct ib_ah *ah,
1284 struct ib_ah_attr *ah_attr);
1285 int (*query_ah)(struct ib_ah *ah,
1286 struct ib_ah_attr *ah_attr);
1287 int (*destroy_ah)(struct ib_ah *ah);
1288 struct ib_srq * (*create_srq)(struct ib_pd *pd,
1289 struct ib_srq_init_attr *srq_init_attr,
1290 struct ib_udata *udata);
1291 int (*modify_srq)(struct ib_srq *srq,
1292 struct ib_srq_attr *srq_attr,
1293 enum ib_srq_attr_mask srq_attr_mask,
1294 struct ib_udata *udata);
1295 int (*query_srq)(struct ib_srq *srq,
1296 struct ib_srq_attr *srq_attr);
1297 int (*destroy_srq)(struct ib_srq *srq);
1298 int (*post_srq_recv)(struct ib_srq *srq,
1299 struct ib_recv_wr *recv_wr,
1300 struct ib_recv_wr **bad_recv_wr);
1301 struct ib_qp * (*create_qp)(struct ib_pd *pd,
1302 struct ib_qp_init_attr *qp_init_attr,
1303 struct ib_udata *udata);
1304 int (*modify_qp)(struct ib_qp *qp,
1305 struct ib_qp_attr *qp_attr,
1306 int qp_attr_mask,
1307 struct ib_udata *udata);
1308 int (*query_qp)(struct ib_qp *qp,
1309 struct ib_qp_attr *qp_attr,
1310 int qp_attr_mask,
1311 struct ib_qp_init_attr *qp_init_attr);
1312 int (*destroy_qp)(struct ib_qp *qp);
1313 int (*post_send)(struct ib_qp *qp,
1314 struct ib_send_wr *send_wr,
1315 struct ib_send_wr **bad_send_wr);
1316 int (*post_recv)(struct ib_qp *qp,
1317 struct ib_recv_wr *recv_wr,
1318 struct ib_recv_wr **bad_recv_wr);
1319 struct ib_cq * (*create_cq)(struct ib_device *device, int cqe,
1320 int comp_vector,
1321 struct ib_ucontext *context,
1322 struct ib_udata *udata);
1323 int (*modify_cq)(struct ib_cq *cq, u16 cq_count,
1324 u16 cq_period);
1325 int (*destroy_cq)(struct ib_cq *cq);
1326 int (*resize_cq)(struct ib_cq *cq, int cqe,
1327 struct ib_udata *udata);
1328 int (*poll_cq)(struct ib_cq *cq, int num_entries,
1329 struct ib_wc *wc);
1330 int (*peek_cq)(struct ib_cq *cq, int wc_cnt);
1331 int (*req_notify_cq)(struct ib_cq *cq,
1332 enum ib_cq_notify_flags flags);
1333 int (*req_ncomp_notif)(struct ib_cq *cq,
1334 int wc_cnt);
1335 struct ib_mr * (*get_dma_mr)(struct ib_pd *pd,
1336 int mr_access_flags);
1337 struct ib_mr * (*reg_phys_mr)(struct ib_pd *pd,
1338 struct ib_phys_buf *phys_buf_array,
1339 int num_phys_buf,
1340 int mr_access_flags,
1341 u64 *iova_start);
1342 struct ib_mr * (*reg_user_mr)(struct ib_pd *pd,
1343 u64 start, u64 length,
1344 u64 virt_addr,
1345 int mr_access_flags,
1346 struct ib_udata *udata,
1347 int mr_id);
1348 int (*query_mr)(struct ib_mr *mr,
1349 struct ib_mr_attr *mr_attr);
1350 int (*dereg_mr)(struct ib_mr *mr);
1351 struct ib_mr * (*alloc_fast_reg_mr)(struct ib_pd *pd,
1352 int max_page_list_len);
1353 struct ib_fast_reg_page_list * (*alloc_fast_reg_page_list)(struct ib_device *device,
1354 int page_list_len);
1355 void (*free_fast_reg_page_list)(struct ib_fast_reg_page_list *page_list);
1356 int (*rereg_phys_mr)(struct ib_mr *mr,
1357 int mr_rereg_mask,
1358 struct ib_pd *pd,
1359 struct ib_phys_buf *phys_buf_array,
1360 int num_phys_buf,
1361 int mr_access_flags,
1362 u64 *iova_start);
1363 struct ib_mw * (*alloc_mw)(struct ib_pd *pd);
1364 int (*bind_mw)(struct ib_qp *qp,
1365 struct ib_mw *mw,
1366 struct ib_mw_bind *mw_bind);
1367 int (*dealloc_mw)(struct ib_mw *mw);
1368 struct ib_fmr * (*alloc_fmr)(struct ib_pd *pd,
1369 int mr_access_flags,
1370 struct ib_fmr_attr *fmr_attr);
1371 int (*map_phys_fmr)(struct ib_fmr *fmr,
1372 u64 *page_list, int list_len,
1373 u64 iova);
1374 int (*unmap_fmr)(struct list_head *fmr_list);
1375 int (*dealloc_fmr)(struct ib_fmr *fmr);
1376 int (*attach_mcast)(struct ib_qp *qp,
1377 union ib_gid *gid,
1378 u16 lid);
1379 int (*detach_mcast)(struct ib_qp *qp,
1380 union ib_gid *gid,
1381 u16 lid);
1382 int (*process_mad)(struct ib_device *device,
1383 int process_mad_flags,
1384 u8 port_num,
1385 struct ib_wc *in_wc,
1386 struct ib_grh *in_grh,
1387 struct ib_mad *in_mad,
1388 struct ib_mad *out_mad);
1389 struct ib_srq * (*create_xrc_srq)(struct ib_pd *pd,
1390 struct ib_cq *xrc_cq,
1391 struct ib_xrcd *xrcd,
1392 struct ib_srq_init_attr *srq_init_attr,
1393 struct ib_udata *udata);
1394 struct ib_xrcd * (*alloc_xrcd)(struct ib_device *device,
1395 struct ib_ucontext *ucontext,
1396 struct ib_udata *udata);
1397 int (*dealloc_xrcd)(struct ib_xrcd *xrcd);
1398 int (*create_xrc_rcv_qp)(struct ib_qp_init_attr *init_attr,
1399 u32 *qp_num);
1400 int (*modify_xrc_rcv_qp)(struct ib_xrcd *xrcd,
1401 u32 qp_num,
1402 struct ib_qp_attr *attr,
1403 int attr_mask);
1404 int (*query_xrc_rcv_qp)(struct ib_xrcd *xrcd,
1405 u32 qp_num,
1406 struct ib_qp_attr *attr,
1407 int attr_mask,
1408 struct ib_qp_init_attr *init_attr);
1409 int (*reg_xrc_rcv_qp)(struct ib_xrcd *xrcd,
1410 void *context,
1411 u32 qp_num);
1412 int (*unreg_xrc_rcv_qp)(struct ib_xrcd *xrcd,
1413 void *context,
1414 u32 qp_num);
1415 int (*attach_flow)(struct ib_qp *qp,
1416 struct ib_flow_spec *spec,
1417 int priority);
1418 int (*detach_flow)(struct ib_qp *qp,
1419 struct ib_flow_spec *spec,
1420 int priority);
1421
1422 unsigned long (*get_unmapped_area)(struct file *file,
1423 unsigned long addr,
1424 unsigned long len, unsigned long pgoff,
1425 unsigned long flags);
1426 struct ib_dma_mapping_ops *dma_ops;
1427
1428 struct module *owner;
1429 struct device dev;
1430 struct kobject *ports_parent;
1431 struct list_head port_list;
1432
1433 enum {
1434 IB_DEV_UNINITIALIZED,
1435 IB_DEV_REGISTERED,
1436 IB_DEV_UNREGISTERED
1437 } reg_state;
1438
1439 int uverbs_abi_ver;
1440 u64 uverbs_cmd_mask;
1441
1442 char node_desc[64];
1443 __be64 node_guid;
1444 u32 local_dma_lkey;
1445 u8 node_type;
1446 u8 phys_port_cnt;
1447 struct rb_root ib_uverbs_xrcd_table;
1448 struct mutex xrcd_table_mutex;
1449
1450 /**
1451 * The following mandatory functions are used only at device
1452 * registration. Keep functions such as these at the end of this
1453 * structure to avoid cache line misses when accessing struct ib_device
1454 * in fast paths.
1455 */
1456 int (*get_port_immutable)(struct ib_device *, u8, struct ib_port_immutable *);
1457 };
1458
1459 struct ib_client {
1460 char *name;
1461 void (*add) (struct ib_device *);
1462 void (*remove)(struct ib_device *);
1463
1464 struct list_head list;
1465 };
1466
1467 struct ib_device *ib_alloc_device(size_t size);
1468 void ib_dealloc_device(struct ib_device *device);
1469
1470 int ib_register_device(struct ib_device *device,
1471 int (*port_callback)(struct ib_device *,
1472 u8, struct kobject *));
1473 void ib_unregister_device(struct ib_device *device);
1474
1475 int ib_register_client (struct ib_client *client);
1476 void ib_unregister_client(struct ib_client *client);
1477
1478 void *ib_get_client_data(struct ib_device *device, struct ib_client *client);
1479 void ib_set_client_data(struct ib_device *device, struct ib_client *client,
1480 void *data);
1481
ib_copy_from_udata(void * dest,struct ib_udata * udata,size_t len)1482 static inline int ib_copy_from_udata(void *dest, struct ib_udata *udata, size_t len)
1483 {
1484 return copy_from_user(dest, udata->inbuf, len) ? -EFAULT : 0;
1485 }
1486
ib_copy_to_udata(struct ib_udata * udata,void * src,size_t len)1487 static inline int ib_copy_to_udata(struct ib_udata *udata, void *src, size_t len)
1488 {
1489 return copy_to_user(udata->outbuf, src, len) ? -EFAULT : 0;
1490 }
1491
1492 /**
1493 * ib_modify_qp_is_ok - Check that the supplied attribute mask
1494 * contains all required attributes and no attributes not allowed for
1495 * the given QP state transition.
1496 * @cur_state: Current QP state
1497 * @next_state: Next QP state
1498 * @type: QP type
1499 * @mask: Mask of supplied QP attributes
1500 *
1501 * This function is a helper function that a low-level driver's
1502 * modify_qp method can use to validate the consumer's input. It
1503 * checks that cur_state and next_state are valid QP states, that a
1504 * transition from cur_state to next_state is allowed by the IB spec,
1505 * and that the attribute mask supplied is allowed for the transition.
1506 */
1507 int ib_modify_qp_is_ok(enum ib_qp_state cur_state, enum ib_qp_state next_state,
1508 enum ib_qp_type type, enum ib_qp_attr_mask mask);
1509
1510 int ib_register_event_handler (struct ib_event_handler *event_handler);
1511 int ib_unregister_event_handler(struct ib_event_handler *event_handler);
1512 void ib_dispatch_event(struct ib_event *event);
1513
1514 int ib_query_device(struct ib_device *device,
1515 struct ib_device_attr *device_attr);
1516
1517 int ib_query_port(struct ib_device *device,
1518 u8 port_num, struct ib_port_attr *port_attr);
1519
1520 enum rdma_link_layer rdma_port_get_link_layer(struct ib_device *device,
1521 u8 port_num);
1522
rdma_protocol_ib(const struct ib_device * device,u8 port_num)1523 static inline bool rdma_protocol_ib(const struct ib_device *device, u8 port_num)
1524 {
1525 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_IB;
1526 }
1527
rdma_protocol_roce(const struct ib_device * device,u8 port_num)1528 static inline bool rdma_protocol_roce(const struct ib_device *device, u8 port_num)
1529 {
1530 return device->port_immutable[port_num].core_cap_flags &
1531 (RDMA_CORE_CAP_PROT_ROCE | RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP);
1532 }
1533
rdma_protocol_roce_udp_encap(const struct ib_device * device,u8 port_num)1534 static inline bool rdma_protocol_roce_udp_encap(const struct ib_device *device, u8 port_num)
1535 {
1536 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP;
1537 }
1538
rdma_protocol_roce_eth_encap(const struct ib_device * device,u8 port_num)1539 static inline bool rdma_protocol_roce_eth_encap(const struct ib_device *device, u8 port_num)
1540 {
1541 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_ROCE;
1542 }
1543
rdma_protocol_iwarp(const struct ib_device * device,u8 port_num)1544 static inline bool rdma_protocol_iwarp(const struct ib_device *device, u8 port_num)
1545 {
1546 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_IWARP;
1547 }
1548
rdma_ib_or_roce(const struct ib_device * device,u8 port_num)1549 static inline bool rdma_ib_or_roce(const struct ib_device *device, u8 port_num)
1550 {
1551 return rdma_protocol_ib(device, port_num) ||
1552 rdma_protocol_roce(device, port_num);
1553 }
1554
1555 /**
1556 * rdma_cap_ib_mad - Check if the port of a device supports Infiniband
1557 * Management Datagrams.
1558 * @device: Device to check
1559 * @port_num: Port number to check
1560 *
1561 * Management Datagrams (MAD) are a required part of the InfiniBand
1562 * specification and are supported on all InfiniBand devices. A slightly
1563 * extended version are also supported on OPA interfaces.
1564 *
1565 * Return: true if the port supports sending/receiving of MAD packets.
1566 */
rdma_cap_ib_mad(const struct ib_device * device,u8 port_num)1567 static inline bool rdma_cap_ib_mad(const struct ib_device *device, u8 port_num)
1568 {
1569 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_MAD;
1570 }
1571
1572 /**
1573 * rdma_cap_opa_mad - Check if the port of device provides support for OPA
1574 * Management Datagrams.
1575 * @device: Device to check
1576 * @port_num: Port number to check
1577 *
1578 * Intel OmniPath devices extend and/or replace the InfiniBand Management
1579 * datagrams with their own versions. These OPA MADs share many but not all of
1580 * the characteristics of InfiniBand MADs.
1581 *
1582 * OPA MADs differ in the following ways:
1583 *
1584 * 1) MADs are variable size up to 2K
1585 * IBTA defined MADs remain fixed at 256 bytes
1586 * 2) OPA SMPs must carry valid PKeys
1587 * 3) OPA SMP packets are a different format
1588 *
1589 * Return: true if the port supports OPA MAD packet formats.
1590 */
rdma_cap_opa_mad(struct ib_device * device,u8 port_num)1591 static inline bool rdma_cap_opa_mad(struct ib_device *device, u8 port_num)
1592 {
1593 return (device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_OPA_MAD)
1594 == RDMA_CORE_CAP_OPA_MAD;
1595 }
1596
1597 /**
1598 * rdma_cap_ib_smi - Check if the port of a device provides an Infiniband
1599 * Subnet Management Agent (SMA) on the Subnet Management Interface (SMI).
1600 * @device: Device to check
1601 * @port_num: Port number to check
1602 *
1603 * Each InfiniBand node is required to provide a Subnet Management Agent
1604 * that the subnet manager can access. Prior to the fabric being fully
1605 * configured by the subnet manager, the SMA is accessed via a well known
1606 * interface called the Subnet Management Interface (SMI). This interface
1607 * uses directed route packets to communicate with the SM to get around the
1608 * chicken and egg problem of the SM needing to know what's on the fabric
1609 * in order to configure the fabric, and needing to configure the fabric in
1610 * order to send packets to the devices on the fabric. These directed
1611 * route packets do not need the fabric fully configured in order to reach
1612 * their destination. The SMI is the only method allowed to send
1613 * directed route packets on an InfiniBand fabric.
1614 *
1615 * Return: true if the port provides an SMI.
1616 */
rdma_cap_ib_smi(const struct ib_device * device,u8 port_num)1617 static inline bool rdma_cap_ib_smi(const struct ib_device *device, u8 port_num)
1618 {
1619 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_SMI;
1620 }
1621
1622 /**
1623 * rdma_cap_ib_cm - Check if the port of device has the capability Infiniband
1624 * Communication Manager.
1625 * @device: Device to check
1626 * @port_num: Port number to check
1627 *
1628 * The InfiniBand Communication Manager is one of many pre-defined General
1629 * Service Agents (GSA) that are accessed via the General Service
1630 * Interface (GSI). It's role is to facilitate establishment of connections
1631 * between nodes as well as other management related tasks for established
1632 * connections.
1633 *
1634 * Return: true if the port supports an IB CM (this does not guarantee that
1635 * a CM is actually running however).
1636 */
rdma_cap_ib_cm(const struct ib_device * device,u8 port_num)1637 static inline bool rdma_cap_ib_cm(const struct ib_device *device, u8 port_num)
1638 {
1639 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_CM;
1640 }
1641
1642 /**
1643 * rdma_cap_iw_cm - Check if the port of device has the capability IWARP
1644 * Communication Manager.
1645 * @device: Device to check
1646 * @port_num: Port number to check
1647 *
1648 * Similar to above, but specific to iWARP connections which have a different
1649 * managment protocol than InfiniBand.
1650 *
1651 * Return: true if the port supports an iWARP CM (this does not guarantee that
1652 * a CM is actually running however).
1653 */
rdma_cap_iw_cm(const struct ib_device * device,u8 port_num)1654 static inline bool rdma_cap_iw_cm(const struct ib_device *device, u8 port_num)
1655 {
1656 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IW_CM;
1657 }
1658
1659 /**
1660 * rdma_cap_ib_sa - Check if the port of device has the capability Infiniband
1661 * Subnet Administration.
1662 * @device: Device to check
1663 * @port_num: Port number to check
1664 *
1665 * An InfiniBand Subnet Administration (SA) service is a pre-defined General
1666 * Service Agent (GSA) provided by the Subnet Manager (SM). On InfiniBand
1667 * fabrics, devices should resolve routes to other hosts by contacting the
1668 * SA to query the proper route.
1669 *
1670 * Return: true if the port should act as a client to the fabric Subnet
1671 * Administration interface. This does not imply that the SA service is
1672 * running locally.
1673 */
rdma_cap_ib_sa(const struct ib_device * device,u8 port_num)1674 static inline bool rdma_cap_ib_sa(const struct ib_device *device, u8 port_num)
1675 {
1676 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_SA;
1677 }
1678
1679 /**
1680 * rdma_cap_ib_mcast - Check if the port of device has the capability Infiniband
1681 * Multicast.
1682 * @device: Device to check
1683 * @port_num: Port number to check
1684 *
1685 * InfiniBand multicast registration is more complex than normal IPv4 or
1686 * IPv6 multicast registration. Each Host Channel Adapter must register
1687 * with the Subnet Manager when it wishes to join a multicast group. It
1688 * should do so only once regardless of how many queue pairs it subscribes
1689 * to this group. And it should leave the group only after all queue pairs
1690 * attached to the group have been detached.
1691 *
1692 * Return: true if the port must undertake the additional adminstrative
1693 * overhead of registering/unregistering with the SM and tracking of the
1694 * total number of queue pairs attached to the multicast group.
1695 */
rdma_cap_ib_mcast(const struct ib_device * device,u8 port_num)1696 static inline bool rdma_cap_ib_mcast(const struct ib_device *device, u8 port_num)
1697 {
1698 return rdma_cap_ib_sa(device, port_num);
1699 }
1700
1701 /**
1702 * rdma_cap_af_ib - Check if the port of device has the capability
1703 * Native Infiniband Address.
1704 * @device: Device to check
1705 * @port_num: Port number to check
1706 *
1707 * InfiniBand addressing uses a port's GUID + Subnet Prefix to make a default
1708 * GID. RoCE uses a different mechanism, but still generates a GID via
1709 * a prescribed mechanism and port specific data.
1710 *
1711 * Return: true if the port uses a GID address to identify devices on the
1712 * network.
1713 */
rdma_cap_af_ib(const struct ib_device * device,u8 port_num)1714 static inline bool rdma_cap_af_ib(const struct ib_device *device, u8 port_num)
1715 {
1716 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_AF_IB;
1717 }
1718
1719 /**
1720 * rdma_cap_eth_ah - Check if the port of device has the capability
1721 * Ethernet Address Handle.
1722 * @device: Device to check
1723 * @port_num: Port number to check
1724 *
1725 * RoCE is InfiniBand over Ethernet, and it uses a well defined technique
1726 * to fabricate GIDs over Ethernet/IP specific addresses native to the
1727 * port. Normally, packet headers are generated by the sending host
1728 * adapter, but when sending connectionless datagrams, we must manually
1729 * inject the proper headers for the fabric we are communicating over.
1730 *
1731 * Return: true if we are running as a RoCE port and must force the
1732 * addition of a Global Route Header built from our Ethernet Address
1733 * Handle into our header list for connectionless packets.
1734 */
rdma_cap_eth_ah(const struct ib_device * device,u8 port_num)1735 static inline bool rdma_cap_eth_ah(const struct ib_device *device, u8 port_num)
1736 {
1737 return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_ETH_AH;
1738 }
1739
1740 /**
1741 * rdma_max_mad_size - Return the max MAD size required by this RDMA Port.
1742 *
1743 * @device: Device
1744 * @port_num: Port number
1745 *
1746 * This MAD size includes the MAD headers and MAD payload. No other headers
1747 * are included.
1748 *
1749 * Return the max MAD size required by the Port. Will return 0 if the port
1750 * does not support MADs
1751 */
rdma_max_mad_size(const struct ib_device * device,u8 port_num)1752 static inline size_t rdma_max_mad_size(const struct ib_device *device, u8 port_num)
1753 {
1754 return device->port_immutable[port_num].max_mad_size;
1755 }
1756
1757 /*
1758 * Check if the device supports READ W/ INVALIDATE.
1759 */
rdma_cap_read_inv(struct ib_device * dev,u32 port_num)1760 static inline bool rdma_cap_read_inv(struct ib_device *dev, u32 port_num)
1761 {
1762 /*
1763 * iWarp drivers must support READ W/ INVALIDATE. No other protocol
1764 * has support for it yet.
1765 */
1766 return rdma_protocol_iwarp(dev, port_num);
1767 }
1768
1769 int ib_query_gid(struct ib_device *device,
1770 u8 port_num, int index, union ib_gid *gid);
1771
1772 int ib_query_pkey(struct ib_device *device,
1773 u8 port_num, u16 index, u16 *pkey);
1774
1775 int ib_modify_device(struct ib_device *device,
1776 int device_modify_mask,
1777 struct ib_device_modify *device_modify);
1778
1779 int ib_modify_port(struct ib_device *device,
1780 u8 port_num, int port_modify_mask,
1781 struct ib_port_modify *port_modify);
1782
1783 int ib_find_gid(struct ib_device *device, union ib_gid *gid,
1784 u8 *port_num, u16 *index);
1785
1786 int ib_find_pkey(struct ib_device *device,
1787 u8 port_num, u16 pkey, u16 *index);
1788
1789 /**
1790 * ib_alloc_pd - Allocates an unused protection domain.
1791 * @device: The device on which to allocate the protection domain.
1792 *
1793 * A protection domain object provides an association between QPs, shared
1794 * receive queues, address handles, memory regions, and memory windows.
1795 */
1796 struct ib_pd *ib_alloc_pd(struct ib_device *device);
1797
1798 /**
1799 * ib_dealloc_pd - Deallocates a protection domain.
1800 * @pd: The protection domain to deallocate.
1801 */
1802 int ib_dealloc_pd(struct ib_pd *pd);
1803
1804 /**
1805 * ib_create_ah - Creates an address handle for the given address vector.
1806 * @pd: The protection domain associated with the address handle.
1807 * @ah_attr: The attributes of the address vector.
1808 *
1809 * The address handle is used to reference a local or global destination
1810 * in all UD QP post sends.
1811 */
1812 struct ib_ah *ib_create_ah(struct ib_pd *pd, struct ib_ah_attr *ah_attr);
1813
1814 /**
1815 * ib_init_ah_from_wc - Initializes address handle attributes from a
1816 * work completion.
1817 * @device: Device on which the received message arrived.
1818 * @port_num: Port on which the received message arrived.
1819 * @wc: Work completion associated with the received message.
1820 * @grh: References the received global route header. This parameter is
1821 * ignored unless the work completion indicates that the GRH is valid.
1822 * @ah_attr: Returned attributes that can be used when creating an address
1823 * handle for replying to the message.
1824 */
1825 int ib_init_ah_from_wc(struct ib_device *device, u8 port_num, struct ib_wc *wc,
1826 struct ib_grh *grh, struct ib_ah_attr *ah_attr);
1827
1828 /**
1829 * ib_create_ah_from_wc - Creates an address handle associated with the
1830 * sender of the specified work completion.
1831 * @pd: The protection domain associated with the address handle.
1832 * @wc: Work completion information associated with a received message.
1833 * @grh: References the received global route header. This parameter is
1834 * ignored unless the work completion indicates that the GRH is valid.
1835 * @port_num: The outbound port number to associate with the address.
1836 *
1837 * The address handle is used to reference a local or global destination
1838 * in all UD QP post sends.
1839 */
1840 struct ib_ah *ib_create_ah_from_wc(struct ib_pd *pd, struct ib_wc *wc,
1841 struct ib_grh *grh, u8 port_num);
1842
1843 /**
1844 * ib_modify_ah - Modifies the address vector associated with an address
1845 * handle.
1846 * @ah: The address handle to modify.
1847 * @ah_attr: The new address vector attributes to associate with the
1848 * address handle.
1849 */
1850 int ib_modify_ah(struct ib_ah *ah, struct ib_ah_attr *ah_attr);
1851
1852 /**
1853 * ib_query_ah - Queries the address vector associated with an address
1854 * handle.
1855 * @ah: The address handle to query.
1856 * @ah_attr: The address vector attributes associated with the address
1857 * handle.
1858 */
1859 int ib_query_ah(struct ib_ah *ah, struct ib_ah_attr *ah_attr);
1860
1861 /**
1862 * ib_destroy_ah - Destroys an address handle.
1863 * @ah: The address handle to destroy.
1864 */
1865 int ib_destroy_ah(struct ib_ah *ah);
1866
1867 /**
1868 * ib_create_xrc_srq - Creates an XRC SRQ associated with the specified
1869 * protection domain, cq, and xrc domain.
1870 * @pd: The protection domain associated with the SRQ.
1871 * @xrc_cq: The cq to be associated with the XRC SRQ.
1872 * @xrcd: The XRC domain to be associated with the XRC SRQ.
1873 * @srq_init_attr: A list of initial attributes required to create the
1874 * XRC SRQ. If XRC SRQ creation succeeds, then the attributes are updated
1875 * to the actual capabilities of the created XRC SRQ.
1876 *
1877 * srq_attr->max_wr and srq_attr->max_sge are read the determine the
1878 * requested size of the XRC SRQ, and set to the actual values allocated
1879 * on return. If ib_create_xrc_srq() succeeds, then max_wr and max_sge
1880 * will always be at least as large as the requested values.
1881 */
1882 struct ib_srq *ib_create_xrc_srq(struct ib_pd *pd,
1883 struct ib_cq *xrc_cq,
1884 struct ib_xrcd *xrcd,
1885 struct ib_srq_init_attr *srq_init_attr);
1886
1887 /**
1888 * ib_create_srq - Creates a SRQ associated with the specified protection
1889 * domain.
1890 * @pd: The protection domain associated with the SRQ.
1891 * @srq_init_attr: A list of initial attributes required to create the
1892 * SRQ. If SRQ creation succeeds, then the attributes are updated to
1893 * the actual capabilities of the created SRQ.
1894 *
1895 * srq_attr->max_wr and srq_attr->max_sge are read the determine the
1896 * requested size of the SRQ, and set to the actual values allocated
1897 * on return. If ib_create_srq() succeeds, then max_wr and max_sge
1898 * will always be at least as large as the requested values.
1899 */
1900 struct ib_srq *ib_create_srq(struct ib_pd *pd,
1901 struct ib_srq_init_attr *srq_init_attr);
1902
1903 /**
1904 * ib_modify_srq - Modifies the attributes for the specified SRQ.
1905 * @srq: The SRQ to modify.
1906 * @srq_attr: On input, specifies the SRQ attributes to modify. On output,
1907 * the current values of selected SRQ attributes are returned.
1908 * @srq_attr_mask: A bit-mask used to specify which attributes of the SRQ
1909 * are being modified.
1910 *
1911 * The mask may contain IB_SRQ_MAX_WR to resize the SRQ and/or
1912 * IB_SRQ_LIMIT to set the SRQ's limit and request notification when
1913 * the number of receives queued drops below the limit.
1914 */
1915 int ib_modify_srq(struct ib_srq *srq,
1916 struct ib_srq_attr *srq_attr,
1917 enum ib_srq_attr_mask srq_attr_mask);
1918
1919 /**
1920 * ib_query_srq - Returns the attribute list and current values for the
1921 * specified SRQ.
1922 * @srq: The SRQ to query.
1923 * @srq_attr: The attributes of the specified SRQ.
1924 */
1925 int ib_query_srq(struct ib_srq *srq,
1926 struct ib_srq_attr *srq_attr);
1927
1928 /**
1929 * ib_destroy_srq - Destroys the specified SRQ.
1930 * @srq: The SRQ to destroy.
1931 */
1932 int ib_destroy_srq(struct ib_srq *srq);
1933
1934 /**
1935 * ib_post_srq_recv - Posts a list of work requests to the specified SRQ.
1936 * @srq: The SRQ to post the work request on.
1937 * @recv_wr: A list of work requests to post on the receive queue.
1938 * @bad_recv_wr: On an immediate failure, this parameter will reference
1939 * the work request that failed to be posted on the QP.
1940 */
ib_post_srq_recv(struct ib_srq * srq,struct ib_recv_wr * recv_wr,struct ib_recv_wr ** bad_recv_wr)1941 static inline int ib_post_srq_recv(struct ib_srq *srq,
1942 struct ib_recv_wr *recv_wr,
1943 struct ib_recv_wr **bad_recv_wr)
1944 {
1945 return srq->device->post_srq_recv(srq, recv_wr, bad_recv_wr);
1946 }
1947
1948 /**
1949 * ib_create_qp - Creates a QP associated with the specified protection
1950 * domain.
1951 * @pd: The protection domain associated with the QP.
1952 * @qp_init_attr: A list of initial attributes required to create the
1953 * QP. If QP creation succeeds, then the attributes are updated to
1954 * the actual capabilities of the created QP.
1955 */
1956 struct ib_qp *ib_create_qp(struct ib_pd *pd,
1957 struct ib_qp_init_attr *qp_init_attr);
1958
1959 /**
1960 * ib_modify_qp - Modifies the attributes for the specified QP and then
1961 * transitions the QP to the given state.
1962 * @qp: The QP to modify.
1963 * @qp_attr: On input, specifies the QP attributes to modify. On output,
1964 * the current values of selected QP attributes are returned.
1965 * @qp_attr_mask: A bit-mask used to specify which attributes of the QP
1966 * are being modified.
1967 */
1968 int ib_modify_qp(struct ib_qp *qp,
1969 struct ib_qp_attr *qp_attr,
1970 int qp_attr_mask);
1971
1972 /**
1973 * ib_query_qp - Returns the attribute list and current values for the
1974 * specified QP.
1975 * @qp: The QP to query.
1976 * @qp_attr: The attributes of the specified QP.
1977 * @qp_attr_mask: A bit-mask used to select specific attributes to query.
1978 * @qp_init_attr: Additional attributes of the selected QP.
1979 *
1980 * The qp_attr_mask may be used to limit the query to gathering only the
1981 * selected attributes.
1982 */
1983 int ib_query_qp(struct ib_qp *qp,
1984 struct ib_qp_attr *qp_attr,
1985 int qp_attr_mask,
1986 struct ib_qp_init_attr *qp_init_attr);
1987
1988 /**
1989 * ib_destroy_qp - Destroys the specified QP.
1990 * @qp: The QP to destroy.
1991 */
1992 int ib_destroy_qp(struct ib_qp *qp);
1993
1994 /**
1995 * ib_open_qp - Obtain a reference to an existing sharable QP.
1996 * @xrcd - XRC domain
1997 * @qp_open_attr: Attributes identifying the QP to open.
1998 *
1999 * Returns a reference to a sharable QP.
2000 */
2001 struct ib_qp *ib_open_qp(struct ib_xrcd *xrcd,
2002 struct ib_qp_open_attr *qp_open_attr);
2003
2004 /**
2005 * ib_close_qp - Release an external reference to a QP.
2006 * @qp: The QP handle to release
2007 *
2008 * The opened QP handle is released by the caller. The underlying
2009 * shared QP is not destroyed until all internal references are released.
2010 */
2011 int ib_close_qp(struct ib_qp *qp);
2012
2013 /**
2014 * ib_post_send - Posts a list of work requests to the send queue of
2015 * the specified QP.
2016 * @qp: The QP to post the work request on.
2017 * @send_wr: A list of work requests to post on the send queue.
2018 * @bad_send_wr: On an immediate failure, this parameter will reference
2019 * the work request that failed to be posted on the QP.
2020 *
2021 * While IBA Vol. 1 section 11.4.1.1 specifies that if an immediate
2022 * error is returned, the QP state shall not be affected,
2023 * ib_post_send() will return an immediate error after queueing any
2024 * earlier work requests in the list.
2025 */
ib_post_send(struct ib_qp * qp,struct ib_send_wr * send_wr,struct ib_send_wr ** bad_send_wr)2026 static inline int ib_post_send(struct ib_qp *qp,
2027 struct ib_send_wr *send_wr,
2028 struct ib_send_wr **bad_send_wr)
2029 {
2030 return qp->device->post_send(qp, send_wr, bad_send_wr);
2031 }
2032
2033 /**
2034 * ib_post_recv - Posts a list of work requests to the receive queue of
2035 * the specified QP.
2036 * @qp: The QP to post the work request on.
2037 * @recv_wr: A list of work requests to post on the receive queue.
2038 * @bad_recv_wr: On an immediate failure, this parameter will reference
2039 * the work request that failed to be posted on the QP.
2040 */
ib_post_recv(struct ib_qp * qp,struct ib_recv_wr * recv_wr,struct ib_recv_wr ** bad_recv_wr)2041 static inline int ib_post_recv(struct ib_qp *qp,
2042 struct ib_recv_wr *recv_wr,
2043 struct ib_recv_wr **bad_recv_wr)
2044 {
2045 return qp->device->post_recv(qp, recv_wr, bad_recv_wr);
2046 }
2047
2048 /*
2049 * IB_CQ_VECTOR_LEAST_ATTACHED: The constant specifies that
2050 * the CQ will be attached to the completion vector that has
2051 * the least number of CQs already attached to it.
2052 */
2053 #define IB_CQ_VECTOR_LEAST_ATTACHED 0xffffffff
2054
2055 /**
2056 * ib_create_cq - Creates a CQ on the specified device.
2057 * @device: The device on which to create the CQ.
2058 * @comp_handler: A user-specified callback that is invoked when a
2059 * completion event occurs on the CQ.
2060 * @event_handler: A user-specified callback that is invoked when an
2061 * asynchronous event not associated with a completion occurs on the CQ.
2062 * @cq_context: Context associated with the CQ returned to the user via
2063 * the associated completion and event handlers.
2064 * @cqe: The minimum size of the CQ.
2065 * @comp_vector - Completion vector used to signal completion events.
2066 * Must be >= 0 and < context->num_comp_vectors.
2067 *
2068 * Users can examine the cq structure to determine the actual CQ size.
2069 */
2070 struct ib_cq *ib_create_cq(struct ib_device *device,
2071 ib_comp_handler comp_handler,
2072 void (*event_handler)(struct ib_event *, void *),
2073 void *cq_context, int cqe, int comp_vector);
2074
2075 /**
2076 * ib_resize_cq - Modifies the capacity of the CQ.
2077 * @cq: The CQ to resize.
2078 * @cqe: The minimum size of the CQ.
2079 *
2080 * Users can examine the cq structure to determine the actual CQ size.
2081 */
2082 int ib_resize_cq(struct ib_cq *cq, int cqe);
2083
2084 /**
2085 * ib_modify_cq - Modifies moderation params of the CQ
2086 * @cq: The CQ to modify.
2087 * @cq_count: number of CQEs that will trigger an event
2088 * @cq_period: max period of time in usec before triggering an event
2089 *
2090 */
2091 int ib_modify_cq(struct ib_cq *cq, u16 cq_count, u16 cq_period);
2092
2093 /**
2094 * ib_destroy_cq - Destroys the specified CQ.
2095 * @cq: The CQ to destroy.
2096 */
2097 int ib_destroy_cq(struct ib_cq *cq);
2098
2099 /**
2100 * ib_poll_cq - poll a CQ for completion(s)
2101 * @cq:the CQ being polled
2102 * @num_entries:maximum number of completions to return
2103 * @wc:array of at least @num_entries &struct ib_wc where completions
2104 * will be returned
2105 *
2106 * Poll a CQ for (possibly multiple) completions. If the return value
2107 * is < 0, an error occurred. If the return value is >= 0, it is the
2108 * number of completions returned. If the return value is
2109 * non-negative and < num_entries, then the CQ was emptied.
2110 */
ib_poll_cq(struct ib_cq * cq,int num_entries,struct ib_wc * wc)2111 static inline int ib_poll_cq(struct ib_cq *cq, int num_entries,
2112 struct ib_wc *wc)
2113 {
2114 return cq->device->poll_cq(cq, num_entries, wc);
2115 }
2116
2117 /**
2118 * ib_peek_cq - Returns the number of unreaped completions currently
2119 * on the specified CQ.
2120 * @cq: The CQ to peek.
2121 * @wc_cnt: A minimum number of unreaped completions to check for.
2122 *
2123 * If the number of unreaped completions is greater than or equal to wc_cnt,
2124 * this function returns wc_cnt, otherwise, it returns the actual number of
2125 * unreaped completions.
2126 */
2127 int ib_peek_cq(struct ib_cq *cq, int wc_cnt);
2128
2129 /**
2130 * ib_req_notify_cq - Request completion notification on a CQ.
2131 * @cq: The CQ to generate an event for.
2132 * @flags:
2133 * Must contain exactly one of %IB_CQ_SOLICITED or %IB_CQ_NEXT_COMP
2134 * to request an event on the next solicited event or next work
2135 * completion at any type, respectively. %IB_CQ_REPORT_MISSED_EVENTS
2136 * may also be |ed in to request a hint about missed events, as
2137 * described below.
2138 *
2139 * Return Value:
2140 * < 0 means an error occurred while requesting notification
2141 * == 0 means notification was requested successfully, and if
2142 * IB_CQ_REPORT_MISSED_EVENTS was passed in, then no events
2143 * were missed and it is safe to wait for another event. In
2144 * this case is it guaranteed that any work completions added
2145 * to the CQ since the last CQ poll will trigger a completion
2146 * notification event.
2147 * > 0 is only returned if IB_CQ_REPORT_MISSED_EVENTS was passed
2148 * in. It means that the consumer must poll the CQ again to
2149 * make sure it is empty to avoid missing an event because of a
2150 * race between requesting notification and an entry being
2151 * added to the CQ. This return value means it is possible
2152 * (but not guaranteed) that a work completion has been added
2153 * to the CQ since the last poll without triggering a
2154 * completion notification event.
2155 */
ib_req_notify_cq(struct ib_cq * cq,enum ib_cq_notify_flags flags)2156 static inline int ib_req_notify_cq(struct ib_cq *cq,
2157 enum ib_cq_notify_flags flags)
2158 {
2159 return cq->device->req_notify_cq(cq, flags);
2160 }
2161
2162 /**
2163 * ib_req_ncomp_notif - Request completion notification when there are
2164 * at least the specified number of unreaped completions on the CQ.
2165 * @cq: The CQ to generate an event for.
2166 * @wc_cnt: The number of unreaped completions that should be on the
2167 * CQ before an event is generated.
2168 */
ib_req_ncomp_notif(struct ib_cq * cq,int wc_cnt)2169 static inline int ib_req_ncomp_notif(struct ib_cq *cq, int wc_cnt)
2170 {
2171 return cq->device->req_ncomp_notif ?
2172 cq->device->req_ncomp_notif(cq, wc_cnt) :
2173 -ENOSYS;
2174 }
2175
2176 /**
2177 * ib_get_dma_mr - Returns a memory region for system memory that is
2178 * usable for DMA.
2179 * @pd: The protection domain associated with the memory region.
2180 * @mr_access_flags: Specifies the memory access rights.
2181 *
2182 * Note that the ib_dma_*() functions defined below must be used
2183 * to create/destroy addresses used with the Lkey or Rkey returned
2184 * by ib_get_dma_mr().
2185 */
2186 struct ib_mr *ib_get_dma_mr(struct ib_pd *pd, int mr_access_flags);
2187
2188 /**
2189 * ib_dma_mapping_error - check a DMA addr for error
2190 * @dev: The device for which the dma_addr was created
2191 * @dma_addr: The DMA address to check
2192 */
ib_dma_mapping_error(struct ib_device * dev,u64 dma_addr)2193 static inline int ib_dma_mapping_error(struct ib_device *dev, u64 dma_addr)
2194 {
2195 if (dev->dma_ops)
2196 return dev->dma_ops->mapping_error(dev, dma_addr);
2197 return dma_mapping_error(dev->dma_device, dma_addr);
2198 }
2199
2200 /**
2201 * ib_dma_map_single - Map a kernel virtual address to DMA address
2202 * @dev: The device for which the dma_addr is to be created
2203 * @cpu_addr: The kernel virtual address
2204 * @size: The size of the region in bytes
2205 * @direction: The direction of the DMA
2206 */
ib_dma_map_single(struct ib_device * dev,void * cpu_addr,size_t size,enum dma_data_direction direction)2207 static inline u64 ib_dma_map_single(struct ib_device *dev,
2208 void *cpu_addr, size_t size,
2209 enum dma_data_direction direction)
2210 {
2211 if (dev->dma_ops)
2212 return dev->dma_ops->map_single(dev, cpu_addr, size, direction);
2213 return dma_map_single(dev->dma_device, cpu_addr, size, direction);
2214 }
2215
2216 /**
2217 * ib_dma_unmap_single - Destroy a mapping created by ib_dma_map_single()
2218 * @dev: The device for which the DMA address was created
2219 * @addr: The DMA address
2220 * @size: The size of the region in bytes
2221 * @direction: The direction of the DMA
2222 */
ib_dma_unmap_single(struct ib_device * dev,u64 addr,size_t size,enum dma_data_direction direction)2223 static inline void ib_dma_unmap_single(struct ib_device *dev,
2224 u64 addr, size_t size,
2225 enum dma_data_direction direction)
2226 {
2227 if (dev->dma_ops)
2228 dev->dma_ops->unmap_single(dev, addr, size, direction);
2229 else
2230 dma_unmap_single(dev->dma_device, addr, size, direction);
2231 }
2232
ib_dma_map_single_attrs(struct ib_device * dev,void * cpu_addr,size_t size,enum dma_data_direction direction,struct dma_attrs * attrs)2233 static inline u64 ib_dma_map_single_attrs(struct ib_device *dev,
2234 void *cpu_addr, size_t size,
2235 enum dma_data_direction direction,
2236 struct dma_attrs *attrs)
2237 {
2238 return dma_map_single_attrs(dev->dma_device, cpu_addr, size,
2239 direction, attrs);
2240 }
2241
ib_dma_unmap_single_attrs(struct ib_device * dev,u64 addr,size_t size,enum dma_data_direction direction,struct dma_attrs * attrs)2242 static inline void ib_dma_unmap_single_attrs(struct ib_device *dev,
2243 u64 addr, size_t size,
2244 enum dma_data_direction direction,
2245 struct dma_attrs *attrs)
2246 {
2247 return dma_unmap_single_attrs(dev->dma_device, addr, size,
2248 direction, attrs);
2249 }
2250
2251 /**
2252 * ib_dma_map_page - Map a physical page to DMA address
2253 * @dev: The device for which the dma_addr is to be created
2254 * @page: The page to be mapped
2255 * @offset: The offset within the page
2256 * @size: The size of the region in bytes
2257 * @direction: The direction of the DMA
2258 */
ib_dma_map_page(struct ib_device * dev,struct page * page,unsigned long offset,size_t size,enum dma_data_direction direction)2259 static inline u64 ib_dma_map_page(struct ib_device *dev,
2260 struct page *page,
2261 unsigned long offset,
2262 size_t size,
2263 enum dma_data_direction direction)
2264 {
2265 if (dev->dma_ops)
2266 return dev->dma_ops->map_page(dev, page, offset, size, direction);
2267 return dma_map_page(dev->dma_device, page, offset, size, direction);
2268 }
2269
2270 /**
2271 * ib_dma_unmap_page - Destroy a mapping created by ib_dma_map_page()
2272 * @dev: The device for which the DMA address was created
2273 * @addr: The DMA address
2274 * @size: The size of the region in bytes
2275 * @direction: The direction of the DMA
2276 */
ib_dma_unmap_page(struct ib_device * dev,u64 addr,size_t size,enum dma_data_direction direction)2277 static inline void ib_dma_unmap_page(struct ib_device *dev,
2278 u64 addr, size_t size,
2279 enum dma_data_direction direction)
2280 {
2281 if (dev->dma_ops)
2282 dev->dma_ops->unmap_page(dev, addr, size, direction);
2283 else
2284 dma_unmap_page(dev->dma_device, addr, size, direction);
2285 }
2286
2287 /**
2288 * ib_dma_map_sg - Map a scatter/gather list to DMA addresses
2289 * @dev: The device for which the DMA addresses are to be created
2290 * @sg: The array of scatter/gather entries
2291 * @nents: The number of scatter/gather entries
2292 * @direction: The direction of the DMA
2293 */
ib_dma_map_sg(struct ib_device * dev,struct scatterlist * sg,int nents,enum dma_data_direction direction)2294 static inline int ib_dma_map_sg(struct ib_device *dev,
2295 struct scatterlist *sg, int nents,
2296 enum dma_data_direction direction)
2297 {
2298 if (dev->dma_ops)
2299 return dev->dma_ops->map_sg(dev, sg, nents, direction);
2300 return dma_map_sg(dev->dma_device, sg, nents, direction);
2301 }
2302
2303 /**
2304 * ib_dma_unmap_sg - Unmap a scatter/gather list of DMA addresses
2305 * @dev: The device for which the DMA addresses were created
2306 * @sg: The array of scatter/gather entries
2307 * @nents: The number of scatter/gather entries
2308 * @direction: The direction of the DMA
2309 */
ib_dma_unmap_sg(struct ib_device * dev,struct scatterlist * sg,int nents,enum dma_data_direction direction)2310 static inline void ib_dma_unmap_sg(struct ib_device *dev,
2311 struct scatterlist *sg, int nents,
2312 enum dma_data_direction direction)
2313 {
2314 if (dev->dma_ops)
2315 dev->dma_ops->unmap_sg(dev, sg, nents, direction);
2316 else
2317 dma_unmap_sg(dev->dma_device, sg, nents, direction);
2318 }
2319
ib_dma_map_sg_attrs(struct ib_device * dev,struct scatterlist * sg,int nents,enum dma_data_direction direction,struct dma_attrs * attrs)2320 static inline int ib_dma_map_sg_attrs(struct ib_device *dev,
2321 struct scatterlist *sg, int nents,
2322 enum dma_data_direction direction,
2323 struct dma_attrs *attrs)
2324 {
2325 return dma_map_sg_attrs(dev->dma_device, sg, nents, direction, attrs);
2326 }
2327
ib_dma_unmap_sg_attrs(struct ib_device * dev,struct scatterlist * sg,int nents,enum dma_data_direction direction,struct dma_attrs * attrs)2328 static inline void ib_dma_unmap_sg_attrs(struct ib_device *dev,
2329 struct scatterlist *sg, int nents,
2330 enum dma_data_direction direction,
2331 struct dma_attrs *attrs)
2332 {
2333 dma_unmap_sg_attrs(dev->dma_device, sg, nents, direction, attrs);
2334 }
2335 /**
2336 * ib_sg_dma_address - Return the DMA address from a scatter/gather entry
2337 * @dev: The device for which the DMA addresses were created
2338 * @sg: The scatter/gather entry
2339 */
ib_sg_dma_address(struct ib_device * dev,struct scatterlist * sg)2340 static inline u64 ib_sg_dma_address(struct ib_device *dev,
2341 struct scatterlist *sg)
2342 {
2343 if (dev->dma_ops)
2344 return dev->dma_ops->dma_address(dev, sg);
2345 return sg_dma_address(sg);
2346 }
2347
2348 /**
2349 * ib_sg_dma_len - Return the DMA length from a scatter/gather entry
2350 * @dev: The device for which the DMA addresses were created
2351 * @sg: The scatter/gather entry
2352 */
ib_sg_dma_len(struct ib_device * dev,struct scatterlist * sg)2353 static inline unsigned int ib_sg_dma_len(struct ib_device *dev,
2354 struct scatterlist *sg)
2355 {
2356 if (dev->dma_ops)
2357 return dev->dma_ops->dma_len(dev, sg);
2358 return sg_dma_len(sg);
2359 }
2360
2361 /**
2362 * ib_dma_sync_single_for_cpu - Prepare DMA region to be accessed by CPU
2363 * @dev: The device for which the DMA address was created
2364 * @addr: The DMA address
2365 * @size: The size of the region in bytes
2366 * @dir: The direction of the DMA
2367 */
ib_dma_sync_single_for_cpu(struct ib_device * dev,u64 addr,size_t size,enum dma_data_direction dir)2368 static inline void ib_dma_sync_single_for_cpu(struct ib_device *dev,
2369 u64 addr,
2370 size_t size,
2371 enum dma_data_direction dir)
2372 {
2373 if (dev->dma_ops)
2374 dev->dma_ops->sync_single_for_cpu(dev, addr, size, dir);
2375 else
2376 dma_sync_single_for_cpu(dev->dma_device, addr, size, dir);
2377 }
2378
2379 /**
2380 * ib_dma_sync_single_for_device - Prepare DMA region to be accessed by device
2381 * @dev: The device for which the DMA address was created
2382 * @addr: The DMA address
2383 * @size: The size of the region in bytes
2384 * @dir: The direction of the DMA
2385 */
ib_dma_sync_single_for_device(struct ib_device * dev,u64 addr,size_t size,enum dma_data_direction dir)2386 static inline void ib_dma_sync_single_for_device(struct ib_device *dev,
2387 u64 addr,
2388 size_t size,
2389 enum dma_data_direction dir)
2390 {
2391 if (dev->dma_ops)
2392 dev->dma_ops->sync_single_for_device(dev, addr, size, dir);
2393 else
2394 dma_sync_single_for_device(dev->dma_device, addr, size, dir);
2395 }
2396
2397 /**
2398 * ib_dma_alloc_coherent - Allocate memory and map it for DMA
2399 * @dev: The device for which the DMA address is requested
2400 * @size: The size of the region to allocate in bytes
2401 * @dma_handle: A pointer for returning the DMA address of the region
2402 * @flag: memory allocator flags
2403 */
ib_dma_alloc_coherent(struct ib_device * dev,size_t size,u64 * dma_handle,gfp_t flag)2404 static inline void *ib_dma_alloc_coherent(struct ib_device *dev,
2405 size_t size,
2406 u64 *dma_handle,
2407 gfp_t flag)
2408 {
2409 if (dev->dma_ops)
2410 return dev->dma_ops->alloc_coherent(dev, size, dma_handle, flag);
2411 else {
2412 dma_addr_t handle;
2413 void *ret;
2414
2415 ret = dma_alloc_coherent(dev->dma_device, size, &handle, flag);
2416 *dma_handle = handle;
2417 return ret;
2418 }
2419 }
2420
2421 /**
2422 * ib_dma_free_coherent - Free memory allocated by ib_dma_alloc_coherent()
2423 * @dev: The device for which the DMA addresses were allocated
2424 * @size: The size of the region
2425 * @cpu_addr: the address returned by ib_dma_alloc_coherent()
2426 * @dma_handle: the DMA address returned by ib_dma_alloc_coherent()
2427 */
ib_dma_free_coherent(struct ib_device * dev,size_t size,void * cpu_addr,u64 dma_handle)2428 static inline void ib_dma_free_coherent(struct ib_device *dev,
2429 size_t size, void *cpu_addr,
2430 u64 dma_handle)
2431 {
2432 if (dev->dma_ops)
2433 dev->dma_ops->free_coherent(dev, size, cpu_addr, dma_handle);
2434 else
2435 dma_free_coherent(dev->dma_device, size, cpu_addr, dma_handle);
2436 }
2437
2438 /**
2439 * ib_reg_phys_mr - Prepares a virtually addressed memory region for use
2440 * by an HCA.
2441 * @pd: The protection domain associated assigned to the registered region.
2442 * @phys_buf_array: Specifies a list of physical buffers to use in the
2443 * memory region.
2444 * @num_phys_buf: Specifies the size of the phys_buf_array.
2445 * @mr_access_flags: Specifies the memory access rights.
2446 * @iova_start: The offset of the region's starting I/O virtual address.
2447 */
2448 struct ib_mr *ib_reg_phys_mr(struct ib_pd *pd,
2449 struct ib_phys_buf *phys_buf_array,
2450 int num_phys_buf,
2451 int mr_access_flags,
2452 u64 *iova_start);
2453
2454 /**
2455 * ib_rereg_phys_mr - Modifies the attributes of an existing memory region.
2456 * Conceptually, this call performs the functions deregister memory region
2457 * followed by register physical memory region. Where possible,
2458 * resources are reused instead of deallocated and reallocated.
2459 * @mr: The memory region to modify.
2460 * @mr_rereg_mask: A bit-mask used to indicate which of the following
2461 * properties of the memory region are being modified.
2462 * @pd: If %IB_MR_REREG_PD is set in mr_rereg_mask, this field specifies
2463 * the new protection domain to associated with the memory region,
2464 * otherwise, this parameter is ignored.
2465 * @phys_buf_array: If %IB_MR_REREG_TRANS is set in mr_rereg_mask, this
2466 * field specifies a list of physical buffers to use in the new
2467 * translation, otherwise, this parameter is ignored.
2468 * @num_phys_buf: If %IB_MR_REREG_TRANS is set in mr_rereg_mask, this
2469 * field specifies the size of the phys_buf_array, otherwise, this
2470 * parameter is ignored.
2471 * @mr_access_flags: If %IB_MR_REREG_ACCESS is set in mr_rereg_mask, this
2472 * field specifies the new memory access rights, otherwise, this
2473 * parameter is ignored.
2474 * @iova_start: The offset of the region's starting I/O virtual address.
2475 */
2476 int ib_rereg_phys_mr(struct ib_mr *mr,
2477 int mr_rereg_mask,
2478 struct ib_pd *pd,
2479 struct ib_phys_buf *phys_buf_array,
2480 int num_phys_buf,
2481 int mr_access_flags,
2482 u64 *iova_start);
2483
2484 /**
2485 * ib_query_mr - Retrieves information about a specific memory region.
2486 * @mr: The memory region to retrieve information about.
2487 * @mr_attr: The attributes of the specified memory region.
2488 */
2489 int ib_query_mr(struct ib_mr *mr, struct ib_mr_attr *mr_attr);
2490
2491 /**
2492 * ib_dereg_mr - Deregisters a memory region and removes it from the
2493 * HCA translation table.
2494 * @mr: The memory region to deregister.
2495 */
2496 int ib_dereg_mr(struct ib_mr *mr);
2497
2498 /**
2499 * ib_alloc_fast_reg_mr - Allocates memory region usable with the
2500 * IB_WR_FAST_REG_MR send work request.
2501 * @pd: The protection domain associated with the region.
2502 * @max_page_list_len: requested max physical buffer list length to be
2503 * used with fast register work requests for this MR.
2504 */
2505 struct ib_mr *ib_alloc_fast_reg_mr(struct ib_pd *pd, int max_page_list_len);
2506
2507 /**
2508 * ib_alloc_fast_reg_page_list - Allocates a page list array
2509 * @device - ib device pointer.
2510 * @page_list_len - size of the page list array to be allocated.
2511 *
2512 * This allocates and returns a struct ib_fast_reg_page_list * and a
2513 * page_list array that is at least page_list_len in size. The actual
2514 * size is returned in max_page_list_len. The caller is responsible
2515 * for initializing the contents of the page_list array before posting
2516 * a send work request with the IB_WC_FAST_REG_MR opcode.
2517 *
2518 * The page_list array entries must be translated using one of the
2519 * ib_dma_*() functions just like the addresses passed to
2520 * ib_map_phys_fmr(). Once the ib_post_send() is issued, the struct
2521 * ib_fast_reg_page_list must not be modified by the caller until the
2522 * IB_WC_FAST_REG_MR work request completes.
2523 */
2524 struct ib_fast_reg_page_list *ib_alloc_fast_reg_page_list(
2525 struct ib_device *device, int page_list_len);
2526
2527 /**
2528 * ib_free_fast_reg_page_list - Deallocates a previously allocated
2529 * page list array.
2530 * @page_list - struct ib_fast_reg_page_list pointer to be deallocated.
2531 */
2532 void ib_free_fast_reg_page_list(struct ib_fast_reg_page_list *page_list);
2533
2534 /**
2535 * ib_update_fast_reg_key - updates the key portion of the fast_reg MR
2536 * R_Key and L_Key.
2537 * @mr - struct ib_mr pointer to be updated.
2538 * @newkey - new key to be used.
2539 */
ib_update_fast_reg_key(struct ib_mr * mr,u8 newkey)2540 static inline void ib_update_fast_reg_key(struct ib_mr *mr, u8 newkey)
2541 {
2542 mr->lkey = (mr->lkey & 0xffffff00) | newkey;
2543 mr->rkey = (mr->rkey & 0xffffff00) | newkey;
2544 }
2545
2546 /**
2547 * ib_alloc_mw - Allocates a memory window.
2548 * @pd: The protection domain associated with the memory window.
2549 */
2550 struct ib_mw *ib_alloc_mw(struct ib_pd *pd);
2551
2552 /**
2553 * ib_bind_mw - Posts a work request to the send queue of the specified
2554 * QP, which binds the memory window to the given address range and
2555 * remote access attributes.
2556 * @qp: QP to post the bind work request on.
2557 * @mw: The memory window to bind.
2558 * @mw_bind: Specifies information about the memory window, including
2559 * its address range, remote access rights, and associated memory region.
2560 */
ib_bind_mw(struct ib_qp * qp,struct ib_mw * mw,struct ib_mw_bind * mw_bind)2561 static inline int ib_bind_mw(struct ib_qp *qp,
2562 struct ib_mw *mw,
2563 struct ib_mw_bind *mw_bind)
2564 {
2565 /* XXX reference counting in corresponding MR? */
2566 return mw->device->bind_mw ?
2567 mw->device->bind_mw(qp, mw, mw_bind) :
2568 -ENOSYS;
2569 }
2570
2571 /**
2572 * ib_dealloc_mw - Deallocates a memory window.
2573 * @mw: The memory window to deallocate.
2574 */
2575 int ib_dealloc_mw(struct ib_mw *mw);
2576
2577 /**
2578 * ib_alloc_fmr - Allocates a unmapped fast memory region.
2579 * @pd: The protection domain associated with the unmapped region.
2580 * @mr_access_flags: Specifies the memory access rights.
2581 * @fmr_attr: Attributes of the unmapped region.
2582 *
2583 * A fast memory region must be mapped before it can be used as part of
2584 * a work request.
2585 */
2586 struct ib_fmr *ib_alloc_fmr(struct ib_pd *pd,
2587 int mr_access_flags,
2588 struct ib_fmr_attr *fmr_attr);
2589
2590 /**
2591 * ib_map_phys_fmr - Maps a list of physical pages to a fast memory region.
2592 * @fmr: The fast memory region to associate with the pages.
2593 * @page_list: An array of physical pages to map to the fast memory region.
2594 * @list_len: The number of pages in page_list.
2595 * @iova: The I/O virtual address to use with the mapped region.
2596 */
ib_map_phys_fmr(struct ib_fmr * fmr,u64 * page_list,int list_len,u64 iova)2597 static inline int ib_map_phys_fmr(struct ib_fmr *fmr,
2598 u64 *page_list, int list_len,
2599 u64 iova)
2600 {
2601 return fmr->device->map_phys_fmr(fmr, page_list, list_len, iova);
2602 }
2603
2604 /**
2605 * ib_unmap_fmr - Removes the mapping from a list of fast memory regions.
2606 * @fmr_list: A linked list of fast memory regions to unmap.
2607 */
2608 int ib_unmap_fmr(struct list_head *fmr_list);
2609
2610 /**
2611 * ib_dealloc_fmr - Deallocates a fast memory region.
2612 * @fmr: The fast memory region to deallocate.
2613 */
2614 int ib_dealloc_fmr(struct ib_fmr *fmr);
2615
2616 /**
2617 * ib_attach_mcast - Attaches the specified QP to a multicast group.
2618 * @qp: QP to attach to the multicast group. The QP must be type
2619 * IB_QPT_UD.
2620 * @gid: Multicast group GID.
2621 * @lid: Multicast group LID in host byte order.
2622 *
2623 * In order to send and receive multicast packets, subnet
2624 * administration must have created the multicast group and configured
2625 * the fabric appropriately. The port associated with the specified
2626 * QP must also be a member of the multicast group.
2627 */
2628 int ib_attach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);
2629
2630 /**
2631 * ib_detach_mcast - Detaches the specified QP from a multicast group.
2632 * @qp: QP to detach from the multicast group.
2633 * @gid: Multicast group GID.
2634 * @lid: Multicast group LID in host byte order.
2635 */
2636 int ib_detach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);
2637
2638 /**
2639 * ib_alloc_xrcd - Allocates an XRC domain.
2640 * @device: The device on which to allocate the XRC domain.
2641 */
2642 struct ib_xrcd *ib_alloc_xrcd(struct ib_device *device);
2643
2644 /**
2645 * ib_dealloc_xrcd - Deallocates an XRC domain.
2646 * @xrcd: The XRC domain to deallocate.
2647 */
2648 int ib_dealloc_xrcd(struct ib_xrcd *xrcd);
2649
2650 int ib_attach_flow(struct ib_qp *qp, struct ib_flow_spec *spec, int priority);
2651 int ib_detach_flow(struct ib_qp *qp, struct ib_flow_spec *spec, int priority);
2652
2653 #endif /* IB_VERBS_H */
2654