1 /*-
2 * Copyright (c) 2013-2020, Mellanox Technologies, Ltd. All rights reserved.
3 *
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions
6 * are met:
7 * 1. Redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer.
9 * 2. Redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution.
12 *
13 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS `AS IS' AND
14 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
16 * ARE DISCLAIMED. IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
17 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
18 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
19 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
20 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
21 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
22 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
23 * SUCH DAMAGE.
24 *
25 * $FreeBSD$
26 */
27
28 #ifndef MLX5_IB_H
29 #define MLX5_IB_H
30
31 #include <linux/kernel.h>
32 #include <linux/sched.h>
33 #include <linux/printk.h>
34 #include <linux/netdevice.h>
35 #include <rdma/ib_verbs.h>
36 #include <rdma/ib_umem.h>
37 #include <rdma/ib_smi.h>
38 #include <dev/mlx5/cq.h>
39 #include <dev/mlx5/qp.h>
40 #include <dev/mlx5/srq.h>
41 #include <linux/types.h>
42 #include <dev/mlx5/mlx5_core/transobj.h>
43 #include <rdma/ib_user_verbs.h>
44 #include <rdma/mlx5-abi.h>
45 #include <rdma/uverbs_ioctl.h>
46
47 #define mlx5_ib_dbg(dev, format, arg...) \
48 pr_debug("%s:%s:%d:(pid %d): " format, (dev)->ib_dev.name, __func__, \
49 __LINE__, current->pid, ##arg)
50
51 #define mlx5_ib_err(dev, format, arg...) \
52 pr_err("%s: ERR: %s:%d:(pid %d): " format, (dev)->ib_dev.name, __func__, \
53 __LINE__, current->pid, ##arg)
54
55 #define mlx5_ib_warn(dev, format, arg...) \
56 pr_warn("%s: WARN: %s:%d:(pid %d): " format, (dev)->ib_dev.name, __func__, \
57 __LINE__, current->pid, ##arg)
58
59 #define field_avail(type, fld, sz) (offsetof(type, fld) + \
60 sizeof(((type *)0)->fld) <= (sz))
61 #define MLX5_IB_DEFAULT_UIDX 0xffffff
62 #define MLX5_USER_ASSIGNED_UIDX_MASK __mlx5_mask(qpc, user_index)
63
64 #define MLX5_MKEY_PAGE_SHIFT_MASK __mlx5_mask(mkc, log_page_size)
65
66 enum {
67 MLX5_IB_MMAP_CMD_SHIFT = 8,
68 MLX5_IB_MMAP_CMD_MASK = 0xff,
69 };
70
71 enum {
72 MLX5_RES_SCAT_DATA32_CQE = 0x1,
73 MLX5_RES_SCAT_DATA64_CQE = 0x2,
74 MLX5_REQ_SCAT_DATA32_CQE = 0x11,
75 MLX5_REQ_SCAT_DATA64_CQE = 0x22,
76 };
77
78 enum mlx5_ib_latency_class {
79 MLX5_IB_LATENCY_CLASS_LOW,
80 MLX5_IB_LATENCY_CLASS_MEDIUM,
81 MLX5_IB_LATENCY_CLASS_HIGH,
82 MLX5_IB_LATENCY_CLASS_FAST_PATH
83 };
84
85 enum mlx5_ib_mad_ifc_flags {
86 MLX5_MAD_IFC_IGNORE_MKEY = 1,
87 MLX5_MAD_IFC_IGNORE_BKEY = 2,
88 MLX5_MAD_IFC_NET_VIEW = 4,
89 };
90
91 enum {
92 MLX5_CROSS_CHANNEL_BFREG = 0,
93 };
94
95 enum {
96 MLX5_CQE_VERSION_V0,
97 MLX5_CQE_VERSION_V1,
98 };
99
100 enum {
101 MLX5_IB_INVALID_UAR_INDEX = BIT(31),
102 MLX5_IB_INVALID_BFREG = BIT(31),
103 };
104
105 enum mlx5_ib_mmap_type {
106 MLX5_IB_MMAP_TYPE_MEMIC = 1,
107 MLX5_IB_MMAP_TYPE_VAR = 2,
108 MLX5_IB_MMAP_TYPE_UAR_WC = 3,
109 MLX5_IB_MMAP_TYPE_UAR_NC = 4,
110 };
111
112 struct mlx5_bfreg_info {
113 u32 *sys_pages;
114 int num_low_latency_bfregs;
115 unsigned int *count;
116
117 /*
118 * protect bfreg allocation data structs
119 */
120 struct mutex lock;
121 u32 ver;
122 u8 lib_uar_4k : 1;
123 u8 lib_uar_dyn : 1;
124 u32 num_sys_pages;
125 u32 num_static_sys_pages;
126 u32 total_num_bfregs;
127 u32 num_dyn_bfregs;
128 };
129
130 struct mlx5_ib_ucontext {
131 struct ib_ucontext ibucontext;
132 struct list_head db_page_list;
133
134 /* protect doorbell record alloc/free
135 */
136 struct mutex db_page_mutex;
137 struct mlx5_bfreg_info bfregi;
138 u8 cqe_version;
139 /* Transport Domain number */
140 u32 tdn;
141
142 u64 lib_caps;
143 u16 devx_uid;
144 };
145
146 static inline struct mlx5_ib_ucontext *to_mucontext(struct ib_ucontext *ibucontext)
147 {
148 return container_of(ibucontext, struct mlx5_ib_ucontext, ibucontext);
149 }
150
151 struct mlx5_ib_pd {
152 struct ib_pd ibpd;
153 u32 pdn;
154 u16 uid;
155 };
156
157 #define MLX5_IB_FLOW_MCAST_PRIO (MLX5_BY_PASS_NUM_PRIOS - 1)
158 #define MLX5_IB_FLOW_LAST_PRIO (MLX5_BY_PASS_NUM_REGULAR_PRIOS - 1)
159 #if (MLX5_IB_FLOW_LAST_PRIO <= 0)
160 #error "Invalid number of bypass priorities"
161 #endif
162 #define MLX5_IB_FLOW_LEFTOVERS_PRIO (MLX5_IB_FLOW_MCAST_PRIO + 1)
163
164 #define MLX5_IB_NUM_FLOW_FT (MLX5_IB_FLOW_LEFTOVERS_PRIO + 1)
165 #define MLX5_IB_NUM_SNIFFER_FTS 2
166 struct mlx5_ib_flow_prio {
167 struct mlx5_flow_table *flow_table;
168 unsigned int refcount;
169 };
170
171 struct mlx5_ib_flow_handler {
172 struct list_head list;
173 struct ib_flow ibflow;
174 struct mlx5_ib_flow_prio *prio;
175 struct mlx5_flow_rule *rule;
176 };
177
178 struct mlx5_ib_flow_db {
179 struct mlx5_ib_flow_prio prios[MLX5_IB_NUM_FLOW_FT];
180 struct mlx5_ib_flow_prio sniffer[MLX5_IB_NUM_SNIFFER_FTS];
181 struct mlx5_flow_table *lag_demux_ft;
182 /* Protect flow steering bypass flow tables
183 * when add/del flow rules.
184 * only single add/removal of flow steering rule could be done
185 * simultaneously.
186 */
187 struct mutex lock;
188 };
189
190 /* Use macros here so that don't have to duplicate
191 * enum ib_send_flags and enum ib_qp_type for low-level driver
192 */
193
194 #define MLX5_IB_SEND_UMR_UNREG IB_SEND_RESERVED_START
195 #define MLX5_IB_SEND_UMR_FAIL_IF_FREE (IB_SEND_RESERVED_START << 1)
196 #define MLX5_IB_SEND_UMR_UPDATE_MTT (IB_SEND_RESERVED_START << 2)
197
198 #define MLX5_IB_SEND_UMR_UPDATE_TRANSLATION (IB_SEND_RESERVED_START << 3)
199 #define MLX5_IB_SEND_UMR_UPDATE_PD (IB_SEND_RESERVED_START << 4)
200 #define MLX5_IB_SEND_UMR_UPDATE_ACCESS IB_SEND_RESERVED_END
201
202 #define MLX5_IB_QPT_REG_UMR IB_QPT_RESERVED1
203 /*
204 * IB_QPT_GSI creates the software wrapper around GSI, and MLX5_IB_QPT_HW_GSI
205 * creates the actual hardware QP.
206 */
207 #define MLX5_IB_QPT_HW_GSI IB_QPT_RESERVED2
208 #define MLX5_IB_QPT_DCI IB_QPT_RESERVED3
209 #define MLX5_IB_QPT_DCT IB_QPT_RESERVED4
210 #define MLX5_IB_WR_UMR IB_WR_RESERVED1
211
212 /* Private QP creation flags to be passed in ib_qp_init_attr.create_flags.
213 *
214 * These flags are intended for internal use by the mlx5_ib driver, and they
215 * rely on the range reserved for that use in the ib_qp_create_flags enum.
216 */
217 #define MLX5_IB_QP_CREATE_SQPN_QP1 IB_QP_CREATE_RESERVED_START
218 #define MLX5_IB_QP_CREATE_WC_TEST (IB_QP_CREATE_RESERVED_START << 1)
219
220 struct wr_list {
221 u16 opcode;
222 u16 next;
223 };
224
225 struct mlx5_ib_wq {
226 u64 *wrid;
227 u32 *wr_data;
228 struct wr_list *w_list;
229 unsigned *wqe_head;
230 u16 unsig_count;
231
232 /* serialize post to the work queue
233 */
234 spinlock_t lock;
235 int wqe_cnt;
236 int max_post;
237 int max_gs;
238 int offset;
239 int wqe_shift;
240 unsigned head;
241 unsigned tail;
242 u16 cur_post;
243 u16 last_poll;
244 void *qend;
245 };
246
247 struct mlx5_ib_rwq {
248 struct ib_wq ibwq;
249 struct mlx5_core_qp core_qp;
250 u32 rq_num_pas;
251 u32 log_rq_stride;
252 u32 log_rq_size;
253 u32 rq_page_offset;
254 u32 log_page_size;
255 struct ib_umem *umem;
256 size_t buf_size;
257 unsigned int page_shift;
258 int create_type;
259 struct mlx5_db db;
260 u32 user_index;
261 u32 wqe_count;
262 u32 wqe_shift;
263 int wq_sig;
264 };
265
266 enum {
267 MLX5_QP_USER,
268 MLX5_QP_KERNEL,
269 MLX5_QP_EMPTY
270 };
271
272 enum {
273 MLX5_WQ_USER,
274 MLX5_WQ_KERNEL
275 };
276
277 struct mlx5_ib_rwq_ind_table {
278 struct ib_rwq_ind_table ib_rwq_ind_tbl;
279 u32 rqtn;
280 u16 uid;
281 };
282
283 /*
284 * Connect-IB can trigger up to four concurrent pagefaults
285 * per-QP.
286 */
287 enum mlx5_ib_pagefault_context {
288 MLX5_IB_PAGEFAULT_RESPONDER_READ,
289 MLX5_IB_PAGEFAULT_REQUESTOR_READ,
290 MLX5_IB_PAGEFAULT_RESPONDER_WRITE,
291 MLX5_IB_PAGEFAULT_REQUESTOR_WRITE,
292 MLX5_IB_PAGEFAULT_CONTEXTS
293 };
294
295 static inline enum mlx5_ib_pagefault_context
296 mlx5_ib_get_pagefault_context(struct mlx5_pagefault *pagefault)
297 {
298 return pagefault->flags & (MLX5_PFAULT_REQUESTOR | MLX5_PFAULT_WRITE);
299 }
300
301 struct mlx5_ib_pfault {
302 struct work_struct work;
303 struct mlx5_pagefault mpfault;
304 };
305
306 struct mlx5_ib_ubuffer {
307 struct ib_umem *umem;
308 int buf_size;
309 u64 buf_addr;
310 };
311
312 struct mlx5_ib_qp_base {
313 struct mlx5_ib_qp *container_mibqp;
314 struct mlx5_core_qp mqp;
315 struct mlx5_ib_ubuffer ubuffer;
316 };
317
318 struct mlx5_ib_qp_trans {
319 struct mlx5_ib_qp_base base;
320 u16 xrcdn;
321 u8 alt_port;
322 u8 atomic_rd_en;
323 u8 resp_depth;
324 };
325
326 struct mlx5_ib_rss_qp {
327 u32 tirn;
328 };
329
330 struct mlx5_ib_rq {
331 struct mlx5_ib_qp_base base;
332 struct mlx5_ib_wq *rq;
333 struct mlx5_ib_ubuffer ubuffer;
334 struct mlx5_db *doorbell;
335 u32 tirn;
336 u8 state;
337 };
338
339 struct mlx5_ib_sq {
340 struct mlx5_ib_qp_base base;
341 struct mlx5_ib_wq *sq;
342 struct mlx5_ib_ubuffer ubuffer;
343 struct mlx5_db *doorbell;
344 u32 tisn;
345 u8 state;
346 };
347
348 struct mlx5_ib_raw_packet_qp {
349 struct mlx5_ib_sq sq;
350 struct mlx5_ib_rq rq;
351 };
352
353 struct mlx5_bf {
354 int buf_size;
355 unsigned long offset;
356 struct mlx5_sq_bfreg *bfreg;
357 spinlock_t lock32;
358 };
359
360 struct mlx5_ib_dct {
361 struct mlx5_core_dct mdct;
362 u32 *in;
363 };
364
365 struct mlx5_ib_qp {
366 struct ib_qp ibqp;
367 union {
368 struct mlx5_ib_qp_trans trans_qp;
369 struct mlx5_ib_raw_packet_qp raw_packet_qp;
370 struct mlx5_ib_rss_qp rss_qp;
371 struct mlx5_ib_dct dct;
372 };
373 struct mlx5_buf buf;
374
375 struct mlx5_db db;
376 struct mlx5_ib_wq rq;
377
378 u8 sq_signal_bits;
379 u8 fm_cache;
380 struct mlx5_ib_wq sq;
381
382 /* serialize qp state modifications
383 */
384 struct mutex mutex;
385 u32 flags;
386 u8 port;
387 u8 state;
388 int wq_sig;
389 int scat_cqe;
390 int max_inline_data;
391 struct mlx5_bf bf;
392 int has_rq;
393
394 /* only for user space QPs. For kernel
395 * we have it from the bf object
396 */
397 int bfregn;
398
399 int create_type;
400
401 /* Store signature errors */
402 bool signature_en;
403
404 #ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
405 /*
406 * A flag that is true for QP's that are in a state that doesn't
407 * allow page faults, and shouldn't schedule any more faults.
408 */
409 int disable_page_faults;
410 /*
411 * The disable_page_faults_lock protects a QP's disable_page_faults
412 * field, allowing for a thread to atomically check whether the QP
413 * allows page faults, and if so schedule a page fault.
414 */
415 spinlock_t disable_page_faults_lock;
416 struct mlx5_ib_pfault pagefaults[MLX5_IB_PAGEFAULT_CONTEXTS];
417 #endif
418 struct list_head qps_list;
419 struct list_head cq_recv_list;
420 struct list_head cq_send_list;
421 };
422
423 struct mlx5_ib_cq_buf {
424 struct mlx5_buf buf;
425 struct ib_umem *umem;
426 int cqe_size;
427 int nent;
428 };
429
430 enum mlx5_ib_qp_flags {
431 MLX5_IB_QP_LSO = IB_QP_CREATE_IPOIB_UD_LSO,
432 MLX5_IB_QP_BLOCK_MULTICAST_LOOPBACK = IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK,
433 MLX5_IB_QP_CROSS_CHANNEL = IB_QP_CREATE_CROSS_CHANNEL,
434 MLX5_IB_QP_MANAGED_SEND = IB_QP_CREATE_MANAGED_SEND,
435 MLX5_IB_QP_MANAGED_RECV = IB_QP_CREATE_MANAGED_RECV,
436 MLX5_IB_QP_SIGNATURE_HANDLING = 1 << 5,
437 /* QP uses 1 as its source QP number */
438 MLX5_IB_QP_SQPN_QP1 = 1 << 6,
439 MLX5_IB_QP_CAP_SCATTER_FCS = 1 << 7,
440 MLX5_IB_QP_RSS = 1 << 8,
441 MLX5_IB_QP_UNDERLAY = 1 << 10,
442 };
443
444 struct mlx5_umr_wr {
445 struct ib_send_wr wr;
446 union {
447 u64 virt_addr;
448 u64 offset;
449 } target;
450 struct ib_pd *pd;
451 unsigned int page_shift;
452 unsigned int npages;
453 u32 length;
454 int access_flags;
455 u32 mkey;
456 };
457
458 static inline const struct mlx5_umr_wr *umr_wr(const struct ib_send_wr *wr)
459 {
460 return container_of(wr, struct mlx5_umr_wr, wr);
461 }
462
463 struct mlx5_shared_mr_info {
464 int mr_id;
465 struct ib_umem *umem;
466 };
467
468 struct mlx5_ib_cq {
469 struct ib_cq ibcq;
470 struct mlx5_core_cq mcq;
471 struct mlx5_ib_cq_buf buf;
472 struct mlx5_db db;
473
474 /* serialize access to the CQ
475 */
476 spinlock_t lock;
477
478 /* protect resize cq
479 */
480 struct mutex resize_mutex;
481 struct mlx5_ib_cq_buf *resize_buf;
482 struct ib_umem *resize_umem;
483 int cqe_size;
484 struct list_head list_send_qp;
485 struct list_head list_recv_qp;
486 u32 create_flags;
487 struct list_head wc_list;
488 enum ib_cq_notify_flags notify_flags;
489 struct work_struct notify_work;
490 };
491
492 struct mlx5_ib_wc {
493 struct ib_wc wc;
494 struct list_head list;
495 };
496
497 struct mlx5_ib_srq {
498 struct ib_srq ibsrq;
499 struct mlx5_core_srq msrq;
500 struct mlx5_buf buf;
501 struct mlx5_db db;
502 u64 *wrid;
503 /* protect SRQ hanlding
504 */
505 spinlock_t lock;
506 int head;
507 int tail;
508 u16 wqe_ctr;
509 struct ib_umem *umem;
510 /* serialize arming a SRQ
511 */
512 struct mutex mutex;
513 int wq_sig;
514 };
515
516 struct mlx5_ib_xrcd {
517 struct ib_xrcd ibxrcd;
518 u32 xrcdn;
519 };
520
521 enum mlx5_ib_mtt_access_flags {
522 MLX5_IB_MTT_READ = (1 << 0),
523 MLX5_IB_MTT_WRITE = (1 << 1),
524 };
525
526 struct mlx5_user_mmap_entry {
527 struct rdma_user_mmap_entry rdma_entry;
528 u8 mmap_flag;
529 u64 address;
530 u32 page_idx;
531 };
532
533 #define MLX5_IB_MTT_PRESENT (MLX5_IB_MTT_READ | MLX5_IB_MTT_WRITE)
534
535 struct mlx5_ib_mr {
536 struct ib_mr ibmr;
537 void *descs;
538 dma_addr_t desc_map;
539 int ndescs;
540 int max_descs;
541 int desc_size;
542 int access_mode;
543 struct mlx5_core_mkey mmkey;
544 struct ib_umem *umem;
545 struct mlx5_shared_mr_info *smr_info;
546 struct list_head list;
547 int order;
548 int umred;
549 int npages;
550 struct mlx5_ib_dev *dev;
551 u32 out[MLX5_ST_SZ_DW(create_mkey_out)];
552 struct mlx5_core_sig_ctx *sig;
553 int live;
554 void *descs_alloc;
555 int access_flags; /* Needed for rereg MR */
556 struct mlx5_async_work cb_work;
557 };
558
559 struct mlx5_ib_mw {
560 struct ib_mw ibmw;
561 struct mlx5_core_mkey mmkey;
562 };
563
564 struct mlx5_ib_devx_mr {
565 struct mlx5_core_mkey mmkey;
566 int ndescs;
567 };
568
569 struct mlx5_ib_umr_context {
570 struct ib_cqe cqe;
571 enum ib_wc_status status;
572 struct completion done;
573 };
574
575 struct umr_common {
576 struct ib_pd *pd;
577 struct ib_cq *cq;
578 struct ib_qp *qp;
579 /* control access to UMR QP
580 */
581 struct semaphore sem;
582 };
583
584 enum {
585 MLX5_FMR_INVALID,
586 MLX5_FMR_VALID,
587 MLX5_FMR_BUSY,
588 };
589
590 struct mlx5_cache_ent {
591 struct list_head head;
592 /* sync access to the cahce entry
593 */
594 spinlock_t lock;
595
596
597 struct dentry *dir;
598 char name[4];
599 u32 order;
600 u32 size;
601 u32 cur;
602 u32 miss;
603 u32 limit;
604
605 struct dentry *fsize;
606 struct dentry *fcur;
607 struct dentry *fmiss;
608 struct dentry *flimit;
609
610 struct mlx5_ib_dev *dev;
611 struct work_struct work;
612 struct delayed_work dwork;
613 int pending;
614 };
615
616 struct mlx5_mr_cache {
617 struct workqueue_struct *wq;
618 struct mlx5_cache_ent ent[MAX_MR_CACHE_ENTRIES];
619 int stopped;
620 struct dentry *root;
621 unsigned long last_add;
622 };
623
624 struct mlx5_ib_gsi_qp;
625
626 struct mlx5_ib_port_resources {
627 struct mlx5_ib_resources *devr;
628 struct mlx5_ib_gsi_qp *gsi;
629 struct work_struct pkey_change_work;
630 };
631
632 struct mlx5_ib_resources {
633 struct ib_cq *c0;
634 struct ib_xrcd *x0;
635 struct ib_xrcd *x1;
636 struct ib_pd *p0;
637 struct ib_srq *s0;
638 struct ib_srq *s1;
639 struct mlx5_ib_port_resources ports[2];
640 /* Protects changes to the port resources */
641 struct mutex mutex;
642 };
643
644 struct mlx5_ib_port {
645 u16 q_cnt_id;
646 };
647
648 struct mlx5_roce {
649 /* Protect mlx5_ib_get_netdev from invoking dev_hold() with a NULL
650 * netdev pointer
651 */
652 rwlock_t netdev_lock;
653 struct ifnet *netdev;
654 struct notifier_block nb;
655 atomic_t next_port;
656 };
657
658 #define MLX5_IB_STATS_COUNT(a,...) a
659 #define MLX5_IB_STATS_VAR(a,b,c,...) b c;
660 #define MLX5_IB_STATS_DESC(a,b,c,d,e,...) d, e,
661
662 #define MLX5_IB_CONG_PARAMS(m) \
663 /* ECN RP */ \
664 m(+1, u64, rp_clamp_tgt_rate, "rp_clamp_tgt_rate", "If set, whenever a CNP is processed, the target rate is updated to be the current rate") \
665 m(+1, u64, rp_clamp_tgt_rate_ati, "rp_clamp_tgt_rate_ati", "If set, when receiving a CNP, the target rate should be updated if the transission rate was increased due to the timer, and not only due to the byte counter") \
666 m(+1, u64, rp_time_reset, "rp_time_reset", "Time in microseconds between rate increases if no CNPs are received") \
667 m(+1, u64, rp_byte_reset, "rp_byte_reset", "Transmitted data in bytes between rate increases if no CNP's are received. A value of zero means disabled.") \
668 m(+1, u64, rp_threshold, "rp_threshold", "The number of times rpByteStage or rpTimeStage can count before the RP rate control state machine advances states") \
669 m(+1, u64, rp_ai_rate, "rp_ai_rate", "The rate, in Mbits per second, used to increase rpTargetRate in the active increase state") \
670 m(+1, u64, rp_hai_rate, "rp_hai_rate", "The rate, in Mbits per second, used to increase rpTargetRate in the hyper increase state") \
671 m(+1, u64, rp_min_dec_fac, "rp_min_dec_fac", "The minimum factor by which the current transmit rate can be changed when processing a CNP. Value is given as a percentage, [1 .. 100]") \
672 m(+1, u64, rp_min_rate, "rp_min_rate", "The minimum value, in Mbps per second, for rate to limit") \
673 m(+1, u64, rp_rate_to_set_on_first_cnp, "rp_rate_to_set_on_first_cnp", "The rate that is set for the flow when a rate limiter is allocated to it upon first CNP received, in Mbps. A value of zero means use full port speed") \
674 m(+1, u64, rp_dce_tcp_g, "rp_dce_tcp_g", "Used to update the congestion estimator, alpha, once every dce_tcp_rtt once every dce_tcp_rtt microseconds") \
675 m(+1, u64, rp_dce_tcp_rtt, "rp_dce_tcp_rtt", "The time between updates of the aolpha value, in microseconds") \
676 m(+1, u64, rp_rate_reduce_monitor_period, "rp_rate_reduce_monitor_period", "The minimum time between two consecutive rate reductions for a single flow") \
677 m(+1, u64, rp_initial_alpha_value, "rp_initial_alpha_value", "The initial value of alpha to use when receiving the first CNP for a flow") \
678 m(+1, u64, rp_gd, "rp_gd", "If a CNP is received, the flow rate is reduced at the beginning of the next rate_reduce_monitor_period interval") \
679 /* ECN NP */ \
680 m(+1, u64, np_cnp_dscp, "np_cnp_dscp", "The DiffServ Code Point of the generated CNP for this port") \
681 m(+1, u64, np_cnp_prio_mode, "np_cnp_prio_mode", "The 802.1p priority value of the generated CNP for this port") \
682 m(+1, u64, np_cnp_prio, "np_cnp_prio", "The 802.1p priority value of the generated CNP for this port")
683
684 #define MLX5_IB_CONG_PARAMS_NUM (0 MLX5_IB_CONG_PARAMS(MLX5_IB_STATS_COUNT))
685
686 #define MLX5_IB_CONG_STATS(m) \
687 m(+1, u64, syndrome, "syndrome", "Syndrome number") \
688 m(+1, u64, rp_cur_flows, "rp_cur_flows", "Number of flows limited") \
689 m(+1, u64, sum_flows, "sum_flows", "Sum of the number of flows limited over time") \
690 m(+1, u64, rp_cnp_ignored, "rp_cnp_ignored", "Number of CNPs and CNMs ignored") \
691 m(+1, u64, rp_cnp_handled, "rp_cnp_handled", "Number of CNPs and CNMs successfully handled") \
692 m(+1, u64, time_stamp, "time_stamp", "Time stamp in microseconds") \
693 m(+1, u64, accumulators_period, "accumulators_period", "The value of X variable for accumulating counters") \
694 m(+1, u64, np_ecn_marked_roce_packets, "np_ecn_marked_roce_packets", "Number of ECN marked packets seen") \
695 m(+1, u64, np_cnp_sent, "np_cnp_sent", "Number of CNPs sent")
696
697 #define MLX5_IB_CONG_STATS_NUM (0 MLX5_IB_CONG_STATS(MLX5_IB_STATS_COUNT))
698
699 #define MLX5_IB_CONG_STATUS(m) \
700 /* ECN RP */ \
701 m(+1, u64, rp_0_enable, "rp_0_enable", "Enable reaction point, priority 0", MLX5_IB_RROCE_ECN_RP, 0, enable) \
702 m(+1, u64, rp_1_enable, "rp_1_enable", "Enable reaction point, priority 1", MLX5_IB_RROCE_ECN_RP, 1, enable) \
703 m(+1, u64, rp_2_enable, "rp_2_enable", "Enable reaction point, priority 2", MLX5_IB_RROCE_ECN_RP, 2, enable) \
704 m(+1, u64, rp_3_enable, "rp_3_enable", "Enable reaction point, priority 3", MLX5_IB_RROCE_ECN_RP, 3, enable) \
705 m(+1, u64, rp_4_enable, "rp_4_enable", "Enable reaction point, priority 4", MLX5_IB_RROCE_ECN_RP, 4, enable) \
706 m(+1, u64, rp_5_enable, "rp_5_enable", "Enable reaction point, priority 5", MLX5_IB_RROCE_ECN_RP, 5, enable) \
707 m(+1, u64, rp_6_enable, "rp_6_enable", "Enable reaction point, priority 6", MLX5_IB_RROCE_ECN_RP, 6, enable) \
708 m(+1, u64, rp_7_enable, "rp_7_enable", "Enable reaction point, priority 7", MLX5_IB_RROCE_ECN_RP, 7, enable) \
709 m(+1, u64, rp_8_enable, "rp_8_enable", "Enable reaction point, priority 8", MLX5_IB_RROCE_ECN_RP, 8, enable) \
710 m(+1, u64, rp_9_enable, "rp_9_enable", "Enable reaction point, priority 9", MLX5_IB_RROCE_ECN_RP, 9, enable) \
711 m(+1, u64, rp_10_enable, "rp_10_enable", "Enable reaction point, priority 10", MLX5_IB_RROCE_ECN_RP, 10, enable) \
712 m(+1, u64, rp_11_enable, "rp_11_enable", "Enable reaction point, priority 11", MLX5_IB_RROCE_ECN_RP, 11, enable) \
713 m(+1, u64, rp_12_enable, "rp_12_enable", "Enable reaction point, priority 12", MLX5_IB_RROCE_ECN_RP, 12, enable) \
714 m(+1, u64, rp_13_enable, "rp_13_enable", "Enable reaction point, priority 13", MLX5_IB_RROCE_ECN_RP, 13, enable) \
715 m(+1, u64, rp_14_enable, "rp_14_enable", "Enable reaction point, priority 14", MLX5_IB_RROCE_ECN_RP, 14, enable) \
716 m(+1, u64, rp_15_enable, "rp_15_enable", "Enable reaction point, priority 15", MLX5_IB_RROCE_ECN_RP, 15, enable) \
717 /* ECN NP */ \
718 m(+1, u64, np_0_enable, "np_0_enable", "Enable notification point, priority 0", MLX5_IB_RROCE_ECN_NP, 0, enable) \
719 m(+1, u64, np_1_enable, "np_1_enable", "Enable notification point, priority 1", MLX5_IB_RROCE_ECN_NP, 1, enable) \
720 m(+1, u64, np_2_enable, "np_2_enable", "Enable notification point, priority 2", MLX5_IB_RROCE_ECN_NP, 2, enable) \
721 m(+1, u64, np_3_enable, "np_3_enable", "Enable notification point, priority 3", MLX5_IB_RROCE_ECN_NP, 3, enable) \
722 m(+1, u64, np_4_enable, "np_4_enable", "Enable notification point, priority 4", MLX5_IB_RROCE_ECN_NP, 4, enable) \
723 m(+1, u64, np_5_enable, "np_5_enable", "Enable notification point, priority 5", MLX5_IB_RROCE_ECN_NP, 5, enable) \
724 m(+1, u64, np_6_enable, "np_6_enable", "Enable notification point, priority 6", MLX5_IB_RROCE_ECN_NP, 6, enable) \
725 m(+1, u64, np_7_enable, "np_7_enable", "Enable notification point, priority 7", MLX5_IB_RROCE_ECN_NP, 7, enable) \
726 m(+1, u64, np_8_enable, "np_8_enable", "Enable notification point, priority 8", MLX5_IB_RROCE_ECN_NP, 8, enable) \
727 m(+1, u64, np_9_enable, "np_9_enable", "Enable notification point, priority 9", MLX5_IB_RROCE_ECN_NP, 9, enable) \
728 m(+1, u64, np_10_enable, "np_10_enable", "Enable notification point, priority 10", MLX5_IB_RROCE_ECN_NP, 10, enable) \
729 m(+1, u64, np_11_enable, "np_11_enable", "Enable notification point, priority 11", MLX5_IB_RROCE_ECN_NP, 11, enable) \
730 m(+1, u64, np_12_enable, "np_12_enable", "Enable notification point, priority 12", MLX5_IB_RROCE_ECN_NP, 12, enable) \
731 m(+1, u64, np_13_enable, "np_13_enable", "Enable notification point, priority 13", MLX5_IB_RROCE_ECN_NP, 13, enable) \
732 m(+1, u64, np_14_enable, "np_14_enable", "Enable notification point, priority 14", MLX5_IB_RROCE_ECN_NP, 14, enable) \
733 m(+1, u64, np_15_enable, "np_15_enable", "Enable notification point, priority 15", MLX5_IB_RROCE_ECN_NP, 15, enable) \
734
735 #define MLX5_IB_CONG_STATUS_NUM (0 MLX5_IB_CONG_STATUS(MLX5_IB_STATS_COUNT))
736
737 struct mlx5_ib_congestion {
738 struct sysctl_ctx_list ctx;
739 struct sx lock;
740 struct delayed_work dwork;
741 union {
742 u64 arg[1];
743 struct {
744 MLX5_IB_CONG_PARAMS(MLX5_IB_STATS_VAR)
745 MLX5_IB_CONG_STATS(MLX5_IB_STATS_VAR)
746 MLX5_IB_CONG_STATUS(MLX5_IB_STATS_VAR)
747 };
748 };
749 };
750
751 struct mlx5_devx_event_table {
752 /* serialize updating the event_xa */
753 struct mutex event_xa_lock;
754 struct xarray event_xa;
755 };
756
757 struct mlx5_ib_dev {
758 struct ib_device ib_dev;
759 struct mlx5_core_dev *mdev;
760 struct mlx5_roce roce;
761 MLX5_DECLARE_DOORBELL_LOCK(uar_lock);
762 int num_ports;
763 /* serialize update of capability mask
764 */
765 struct mutex cap_mask_mutex;
766 u8 ib_active:1;
767 u8 wc_support:1;
768 struct umr_common umrc;
769 /* sync used page count stats
770 */
771 struct mlx5_ib_resources devr;
772 struct mlx5_mr_cache cache;
773 struct timer_list delay_timer;
774 /* Prevents soft lock on massive reg MRs */
775 struct mutex slow_path_mutex;
776 int fill_delay;
777 #ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
778 struct ib_odp_caps odp_caps;
779 /*
780 * Sleepable RCU that prevents destruction of MRs while they are still
781 * being used by a page fault handler.
782 */
783 struct srcu_struct mr_srcu;
784 #endif
785 struct mlx5_ib_flow_db flow_db;
786 /* protect resources needed as part of reset flow */
787 spinlock_t reset_flow_resource_lock;
788 struct list_head qp_list;
789 /* Array with num_ports elements */
790 struct mlx5_ib_port *port;
791 struct mlx5_sq_bfreg bfreg;
792 struct mlx5_sq_bfreg wc_bfreg;
793 struct mlx5_sq_bfreg fp_bfreg;
794 struct mlx5_devx_event_table devx_event_table;
795 struct mlx5_ib_congestion congestion;
796
797 struct mlx5_async_ctx async_ctx;
798
799 /* protect the user_td */
800 struct mutex lb_mutex;
801 u32 user_td;
802 };
803
804 static inline struct mlx5_ib_cq *to_mibcq(struct mlx5_core_cq *mcq)
805 {
806 return container_of(mcq, struct mlx5_ib_cq, mcq);
807 }
808
809 static inline struct mlx5_ib_xrcd *to_mxrcd(struct ib_xrcd *ibxrcd)
810 {
811 return container_of(ibxrcd, struct mlx5_ib_xrcd, ibxrcd);
812 }
813
814 static inline struct mlx5_ib_dev *to_mdev(struct ib_device *ibdev)
815 {
816 return container_of(ibdev, struct mlx5_ib_dev, ib_dev);
817 }
818
819 static inline struct mlx5_ib_dev *mlx5_udata_to_mdev(struct ib_udata *udata)
820 {
821 struct mlx5_ib_ucontext *context = rdma_udata_to_drv_context(
822 udata, struct mlx5_ib_ucontext, ibucontext);
823
824 return to_mdev(context->ibucontext.device);
825 }
826
827 static inline struct mlx5_ib_cq *to_mcq(struct ib_cq *ibcq)
828 {
829 return container_of(ibcq, struct mlx5_ib_cq, ibcq);
830 }
831
832 static inline struct mlx5_ib_qp *to_mibqp(struct mlx5_core_qp *mqp)
833 {
834 return container_of(mqp, struct mlx5_ib_qp_base, mqp)->container_mibqp;
835 }
836
837 static inline struct mlx5_ib_rwq *to_mibrwq(struct mlx5_core_qp *core_qp)
838 {
839 return container_of(core_qp, struct mlx5_ib_rwq, core_qp);
840 }
841
842 static inline struct mlx5_ib_mr *to_mibmr(struct mlx5_core_mkey *mmkey)
843 {
844 return container_of(mmkey, struct mlx5_ib_mr, mmkey);
845 }
846
847 static inline struct mlx5_ib_pd *to_mpd(struct ib_pd *ibpd)
848 {
849 return container_of(ibpd, struct mlx5_ib_pd, ibpd);
850 }
851
852 static inline struct mlx5_ib_srq *to_msrq(struct ib_srq *ibsrq)
853 {
854 return container_of(ibsrq, struct mlx5_ib_srq, ibsrq);
855 }
856
857 static inline struct mlx5_ib_qp *to_mqp(struct ib_qp *ibqp)
858 {
859 return container_of(ibqp, struct mlx5_ib_qp, ibqp);
860 }
861
862 static inline struct mlx5_ib_rwq *to_mrwq(struct ib_wq *ibwq)
863 {
864 return container_of(ibwq, struct mlx5_ib_rwq, ibwq);
865 }
866
867 static inline struct mlx5_ib_rwq_ind_table *to_mrwq_ind_table(struct ib_rwq_ind_table *ib_rwq_ind_tbl)
868 {
869 return container_of(ib_rwq_ind_tbl, struct mlx5_ib_rwq_ind_table, ib_rwq_ind_tbl);
870 }
871
872 static inline struct mlx5_ib_srq *to_mibsrq(struct mlx5_core_srq *msrq)
873 {
874 return container_of(msrq, struct mlx5_ib_srq, msrq);
875 }
876
877 static inline struct mlx5_ib_mr *to_mmr(struct ib_mr *ibmr)
878 {
879 return container_of(ibmr, struct mlx5_ib_mr, ibmr);
880 }
881
882 static inline struct mlx5_ib_mw *to_mmw(struct ib_mw *ibmw)
883 {
884 return container_of(ibmw, struct mlx5_ib_mw, ibmw);
885 }
886
887 struct mlx5_ib_ah {
888 struct ib_ah ibah;
889 struct mlx5_av av;
890 };
891
892 static inline struct mlx5_ib_ah *to_mah(struct ib_ah *ibah)
893 {
894 return container_of(ibah, struct mlx5_ib_ah, ibah);
895 }
896
897 static inline struct mlx5_user_mmap_entry *
898 to_mmmap(struct rdma_user_mmap_entry *rdma_entry)
899 {
900 return container_of(rdma_entry,
901 struct mlx5_user_mmap_entry, rdma_entry);
902 }
903
904 int mlx5_ib_db_map_user(struct mlx5_ib_ucontext *context, unsigned long virt,
905 struct mlx5_db *db);
906 void mlx5_ib_db_unmap_user(struct mlx5_ib_ucontext *context, struct mlx5_db *db);
907 void __mlx5_ib_cq_clean(struct mlx5_ib_cq *cq, u32 qpn, struct mlx5_ib_srq *srq);
908 void mlx5_ib_cq_clean(struct mlx5_ib_cq *cq, u32 qpn, struct mlx5_ib_srq *srq);
909 void mlx5_ib_free_srq_wqe(struct mlx5_ib_srq *srq, int wqe_index);
910 int mlx5_MAD_IFC(struct mlx5_ib_dev *dev, int ignore_mkey, int ignore_bkey,
911 u8 port, const struct ib_wc *in_wc, const struct ib_grh *in_grh,
912 const void *in_mad, void *response_mad);
913 int mlx5_ib_create_ah(struct ib_ah *ah, struct ib_ah_attr *ah_attr, u32 flags,
914 struct ib_udata *udata);
915 int mlx5_ib_query_ah(struct ib_ah *ibah, struct ib_ah_attr *ah_attr);
916 void mlx5_ib_destroy_ah(struct ib_ah *ah, u32 flags);
917 int mlx5_ib_create_srq(struct ib_srq *srq, struct ib_srq_init_attr *init_attr,
918 struct ib_udata *udata);
919 int mlx5_ib_modify_srq(struct ib_srq *ibsrq, struct ib_srq_attr *attr,
920 enum ib_srq_attr_mask attr_mask, struct ib_udata *udata);
921 int mlx5_ib_query_srq(struct ib_srq *ibsrq, struct ib_srq_attr *srq_attr);
922 void mlx5_ib_destroy_srq(struct ib_srq *srq, struct ib_udata *udata);
923 int mlx5_ib_post_srq_recv(struct ib_srq *ibsrq, const struct ib_recv_wr *wr,
924 const struct ib_recv_wr **bad_wr);
925 struct ib_qp *mlx5_ib_create_qp(struct ib_pd *pd,
926 struct ib_qp_init_attr *init_attr,
927 struct ib_udata *udata);
928 int mlx5_ib_modify_qp(struct ib_qp *ibqp, struct ib_qp_attr *attr,
929 int attr_mask, struct ib_udata *udata);
930 int mlx5_ib_query_qp(struct ib_qp *ibqp, struct ib_qp_attr *qp_attr, int qp_attr_mask,
931 struct ib_qp_init_attr *qp_init_attr);
932 int mlx5_ib_destroy_qp(struct ib_qp *qp, struct ib_udata *udata);
933 int mlx5_ib_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
934 const struct ib_send_wr **bad_wr);
935 int mlx5_ib_post_recv(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
936 const struct ib_recv_wr **bad_wr);
937 void *mlx5_get_send_wqe(struct mlx5_ib_qp *qp, int n);
938 int mlx5_ib_read_user_wqe(struct mlx5_ib_qp *qp, int send, int wqe_index,
939 void *buffer, u32 length,
940 struct mlx5_ib_qp_base *base);
941 int mlx5_ib_create_cq(struct ib_cq *ibcq, const struct ib_cq_init_attr *attr,
942 struct ib_udata *udata);
943 void mlx5_ib_destroy_cq(struct ib_cq *cq, struct ib_udata *udata);
944 int mlx5_ib_poll_cq(struct ib_cq *ibcq, int num_entries, struct ib_wc *wc);
945 int mlx5_ib_arm_cq(struct ib_cq *ibcq, enum ib_cq_notify_flags flags);
946 int mlx5_ib_modify_cq(struct ib_cq *cq, u16 cq_count, u16 cq_period);
947 int mlx5_ib_resize_cq(struct ib_cq *ibcq, int entries, struct ib_udata *udata);
948 struct ib_mr *mlx5_ib_get_dma_mr(struct ib_pd *pd, int acc);
949 struct ib_mr *mlx5_ib_reg_user_mr(struct ib_pd *pd, u64 start, u64 length,
950 u64 virt_addr, int access_flags,
951 struct ib_udata *udata);
952 struct ib_mw *mlx5_ib_alloc_mw(struct ib_pd *pd, enum ib_mw_type type,
953 struct ib_udata *udata);
954 int mlx5_ib_dealloc_mw(struct ib_mw *mw);
955 int mlx5_ib_update_mtt(struct mlx5_ib_mr *mr, u64 start_page_index,
956 int npages, int zap);
957 int mlx5_ib_rereg_user_mr(struct ib_mr *ib_mr, int flags, u64 start,
958 u64 length, u64 virt_addr, int access_flags,
959 struct ib_pd *pd, struct ib_udata *udata);
960 int mlx5_ib_dereg_mr(struct ib_mr *ibmr, struct ib_udata *udata);
961 struct ib_mr *mlx5_ib_alloc_mr(struct ib_pd *pd, enum ib_mr_type mr_type,
962 u32 max_num_sg, struct ib_udata *udata);
963 int mlx5_ib_map_mr_sg(struct ib_mr *ibmr, struct scatterlist *sg, int sg_nents,
964 unsigned int *sg_offset);
965 int mlx5_ib_process_mad(struct ib_device *ibdev, int mad_flags, u8 port_num,
966 const struct ib_wc *in_wc, const struct ib_grh *in_grh,
967 const struct ib_mad_hdr *in, size_t in_mad_size,
968 struct ib_mad_hdr *out, size_t *out_mad_size,
969 u16 *out_mad_pkey_index);
970 struct ib_xrcd *mlx5_ib_alloc_xrcd(struct ib_device *ibdev,
971 struct ib_udata *udata);
972 int mlx5_ib_dealloc_xrcd(struct ib_xrcd *xrcd, struct ib_udata *udata);
973 int mlx5_ib_get_buf_offset(u64 addr, int page_shift, u32 *offset);
974 int mlx5_query_ext_port_caps(struct mlx5_ib_dev *dev, u8 port);
975 int mlx5_query_mad_ifc_smp_attr_node_info(struct ib_device *ibdev,
976 struct ib_smp *out_mad);
977 int mlx5_query_mad_ifc_system_image_guid(struct ib_device *ibdev,
978 __be64 *sys_image_guid);
979 int mlx5_query_mad_ifc_max_pkeys(struct ib_device *ibdev,
980 u16 *max_pkeys);
981 int mlx5_query_mad_ifc_vendor_id(struct ib_device *ibdev,
982 u32 *vendor_id);
983 int mlx5_query_mad_ifc_node_desc(struct mlx5_ib_dev *dev, char *node_desc);
984 int mlx5_query_mad_ifc_node_guid(struct mlx5_ib_dev *dev, __be64 *node_guid);
985 int mlx5_query_mad_ifc_pkey(struct ib_device *ibdev, u8 port, u16 index,
986 u16 *pkey);
987 int mlx5_query_mad_ifc_gids(struct ib_device *ibdev, u8 port, int index,
988 union ib_gid *gid);
989 int mlx5_query_mad_ifc_port(struct ib_device *ibdev, u8 port,
990 struct ib_port_attr *props);
991 int mlx5_ib_query_port(struct ib_device *ibdev, u8 port,
992 struct ib_port_attr *props);
993 int mlx5_ib_init_fmr(struct mlx5_ib_dev *dev);
994 void mlx5_ib_cleanup_fmr(struct mlx5_ib_dev *dev);
995 void mlx5_ib_cont_pages(struct ib_umem *umem, u64 addr,
996 unsigned long max_page_shift,
997 int *count, int *shift,
998 int *ncont, int *order);
999 void __mlx5_ib_populate_pas(struct mlx5_ib_dev *dev, struct ib_umem *umem,
1000 int page_shift, size_t offset, size_t num_pages,
1001 __be64 *pas, int access_flags);
1002 void mlx5_ib_populate_pas(struct mlx5_ib_dev *dev, struct ib_umem *umem,
1003 int page_shift, __be64 *pas, int access_flags);
1004 void mlx5_ib_copy_pas(u64 *old, u64 *new, int step, int num);
1005 int mlx5_ib_get_cqe_size(struct mlx5_ib_dev *dev, struct ib_cq *ibcq);
1006 int mlx5_mr_cache_init(struct mlx5_ib_dev *dev);
1007 int mlx5_mr_cache_cleanup(struct mlx5_ib_dev *dev);
1008 int mlx5_mr_ib_cont_pages(struct ib_umem *umem, u64 addr, int *count, int *shift);
1009 int mlx5_ib_check_mr_status(struct ib_mr *ibmr, u32 check_mask,
1010 struct ib_mr_status *mr_status);
1011 struct ib_wq *mlx5_ib_create_wq(struct ib_pd *pd,
1012 struct ib_wq_init_attr *init_attr,
1013 struct ib_udata *udata);
1014 void mlx5_ib_destroy_wq(struct ib_wq *wq, struct ib_udata *udata);
1015 int mlx5_ib_modify_wq(struct ib_wq *wq, struct ib_wq_attr *wq_attr,
1016 u32 wq_attr_mask, struct ib_udata *udata);
1017 struct ib_rwq_ind_table *mlx5_ib_create_rwq_ind_table(struct ib_device *device,
1018 struct ib_rwq_ind_table_init_attr *init_attr,
1019 struct ib_udata *udata);
1020 int mlx5_ib_destroy_rwq_ind_table(struct ib_rwq_ind_table *wq_ind_table);
1021
1022 #ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
1023 extern struct workqueue_struct *mlx5_ib_page_fault_wq;
1024
1025 void mlx5_ib_internal_fill_odp_caps(struct mlx5_ib_dev *dev);
1026 void mlx5_ib_mr_pfault_handler(struct mlx5_ib_qp *qp,
1027 struct mlx5_ib_pfault *pfault);
1028 void mlx5_ib_odp_create_qp(struct mlx5_ib_qp *qp);
1029 int mlx5_ib_odp_init_one(struct mlx5_ib_dev *ibdev);
1030 void mlx5_ib_odp_remove_one(struct mlx5_ib_dev *ibdev);
1031 int __init mlx5_ib_odp_init(void);
1032 void mlx5_ib_odp_cleanup(void);
1033 void mlx5_ib_qp_disable_pagefaults(struct mlx5_ib_qp *qp);
1034 void mlx5_ib_qp_enable_pagefaults(struct mlx5_ib_qp *qp);
1035 void mlx5_ib_invalidate_range(struct ib_umem *umem, unsigned long start,
1036 unsigned long end);
1037 #else /* CONFIG_INFINIBAND_ON_DEMAND_PAGING */
1038 static inline void mlx5_ib_internal_fill_odp_caps(struct mlx5_ib_dev *dev)
1039 {
1040 return;
1041 }
1042
1043 static inline void mlx5_ib_odp_create_qp(struct mlx5_ib_qp *qp) {}
1044 static inline int mlx5_ib_odp_init_one(struct mlx5_ib_dev *ibdev) { return 0; }
1045 static inline void mlx5_ib_odp_remove_one(struct mlx5_ib_dev *ibdev) {}
1046 static inline int mlx5_ib_odp_init(void) { return 0; }
1047 static inline void mlx5_ib_odp_cleanup(void) {}
1048 static inline void mlx5_ib_qp_disable_pagefaults(struct mlx5_ib_qp *qp) {}
1049 static inline void mlx5_ib_qp_enable_pagefaults(struct mlx5_ib_qp *qp) {}
1050
1051 #endif /* CONFIG_INFINIBAND_ON_DEMAND_PAGING */
1052
1053 int mlx5_ib_get_vf_config(struct ib_device *device, int vf,
1054 u8 port, struct ifla_vf_info *info);
1055 int mlx5_ib_set_vf_link_state(struct ib_device *device, int vf,
1056 u8 port, int state);
1057 int mlx5_ib_get_vf_stats(struct ib_device *device, int vf,
1058 u8 port, struct ifla_vf_stats *stats);
1059 int mlx5_ib_set_vf_guid(struct ib_device *device, int vf, u8 port,
1060 u64 guid, int type);
1061
1062 __be16 mlx5_get_roce_udp_sport(struct mlx5_ib_dev *dev, u8 port_num,
1063 int index);
1064 int mlx5_get_roce_gid_type(struct mlx5_ib_dev *dev, u8 port_num,
1065 int index, enum ib_gid_type *gid_type);
1066
1067 /* GSI QP helper functions */
1068 struct ib_qp *mlx5_ib_gsi_create_qp(struct ib_pd *pd,
1069 struct ib_qp_init_attr *init_attr);
1070 int mlx5_ib_gsi_destroy_qp(struct ib_qp *qp);
1071 int mlx5_ib_gsi_modify_qp(struct ib_qp *qp, struct ib_qp_attr *attr,
1072 int attr_mask);
1073 int mlx5_ib_gsi_query_qp(struct ib_qp *qp, struct ib_qp_attr *qp_attr,
1074 int qp_attr_mask,
1075 struct ib_qp_init_attr *qp_init_attr);
1076 int mlx5_ib_gsi_post_send(struct ib_qp *qp, const struct ib_send_wr *wr,
1077 const struct ib_send_wr **bad_wr);
1078 int mlx5_ib_gsi_post_recv(struct ib_qp *qp, const struct ib_recv_wr *wr,
1079 const struct ib_recv_wr **bad_wr);
1080 void mlx5_ib_gsi_pkey_change(struct mlx5_ib_gsi_qp *gsi);
1081
1082 int mlx5_ib_generate_wc(struct ib_cq *ibcq, struct ib_wc *wc);
1083
1084 void mlx5_ib_free_bfreg(struct mlx5_ib_dev *dev, struct mlx5_bfreg_info *bfregi,
1085 int bfregn);
1086
1087 #if 1 /* IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS) */
1088 int mlx5_ib_devx_create(struct mlx5_ib_dev *dev, bool is_user);
1089 void mlx5_ib_devx_destroy(struct mlx5_ib_dev *dev, u16 uid);
1090 void mlx5_ib_devx_init_event_table(struct mlx5_ib_dev *dev);
1091 void mlx5_ib_devx_cleanup_event_table(struct mlx5_ib_dev *dev);
1092 bool mlx5_ib_devx_is_flow_dest(void *obj, int *dest_id, int *dest_type);
1093 bool mlx5_ib_devx_is_flow_counter(void *obj, u32 offset, u32 *counter_id);
1094 #else
1095 static inline int
1096 mlx5_ib_devx_create(struct mlx5_ib_dev *dev,
1097 bool is_user) { return -EOPNOTSUPP; }
1098 static inline void mlx5_ib_devx_destroy(struct mlx5_ib_dev *dev, u16 uid) {}
1099 static inline void mlx5_ib_devx_init_event_table(struct mlx5_ib_dev *dev) {}
1100 static inline void mlx5_ib_devx_cleanup_event_table(struct mlx5_ib_dev *dev) {}
1101 static inline bool mlx5_ib_devx_is_flow_dest(void *obj, int *dest_id,
1102 int *dest_type)
1103 {
1104 return false;
1105 }
1106 #endif
1107
1108 static inline void init_query_mad(struct ib_smp *mad)
1109 {
1110 mad->base_version = 1;
1111 mad->mgmt_class = IB_MGMT_CLASS_SUBN_LID_ROUTED;
1112 mad->class_version = 1;
1113 mad->method = IB_MGMT_METHOD_GET;
1114 }
1115
1116 static inline u8 convert_access(int acc)
1117 {
1118 return (acc & IB_ACCESS_REMOTE_ATOMIC ? MLX5_PERM_ATOMIC : 0) |
1119 (acc & IB_ACCESS_REMOTE_WRITE ? MLX5_PERM_REMOTE_WRITE : 0) |
1120 (acc & IB_ACCESS_REMOTE_READ ? MLX5_PERM_REMOTE_READ : 0) |
1121 (acc & IB_ACCESS_LOCAL_WRITE ? MLX5_PERM_LOCAL_WRITE : 0) |
1122 MLX5_PERM_LOCAL_READ;
1123 }
1124
1125 static inline int is_qp1(enum ib_qp_type qp_type)
1126 {
1127 return qp_type == MLX5_IB_QPT_HW_GSI;
1128 }
1129
1130 #define MLX5_MAX_UMR_SHIFT 16
1131 #define MLX5_MAX_UMR_PAGES (1 << MLX5_MAX_UMR_SHIFT)
1132
1133 static inline u32 check_cq_create_flags(u32 flags)
1134 {
1135 /*
1136 * It returns non-zero value for unsupported CQ
1137 * create flags, otherwise it returns zero.
1138 */
1139 return (flags & ~(IB_CQ_FLAGS_IGNORE_OVERRUN |
1140 IB_CQ_FLAGS_TIMESTAMP_COMPLETION));
1141 }
1142
1143 static inline int verify_assign_uidx(u8 cqe_version, u32 cmd_uidx,
1144 u32 *user_index)
1145 {
1146 if (cqe_version) {
1147 if ((cmd_uidx == MLX5_IB_DEFAULT_UIDX) ||
1148 (cmd_uidx & ~MLX5_USER_ASSIGNED_UIDX_MASK))
1149 return -EINVAL;
1150 *user_index = cmd_uidx;
1151 } else {
1152 *user_index = MLX5_IB_DEFAULT_UIDX;
1153 }
1154
1155 return 0;
1156 }
1157
1158 static inline int get_qp_user_index(struct mlx5_ib_ucontext *ucontext,
1159 struct mlx5_ib_create_qp *ucmd,
1160 int inlen,
1161 u32 *user_index)
1162 {
1163 u8 cqe_version = ucontext->cqe_version;
1164
1165 if (field_avail(struct mlx5_ib_create_qp, uidx, inlen) &&
1166 !cqe_version && (ucmd->uidx == MLX5_IB_DEFAULT_UIDX))
1167 return 0;
1168
1169 if (!!(field_avail(struct mlx5_ib_create_qp, uidx, inlen) !=
1170 !!cqe_version))
1171 return -EINVAL;
1172
1173 return verify_assign_uidx(cqe_version, ucmd->uidx, user_index);
1174 }
1175
1176 static inline int get_srq_user_index(struct mlx5_ib_ucontext *ucontext,
1177 struct mlx5_ib_create_srq *ucmd,
1178 int inlen,
1179 u32 *user_index)
1180 {
1181 u8 cqe_version = ucontext->cqe_version;
1182
1183 if (field_avail(struct mlx5_ib_create_srq, uidx, inlen) &&
1184 !cqe_version && (ucmd->uidx == MLX5_IB_DEFAULT_UIDX))
1185 return 0;
1186
1187 if (!!(field_avail(struct mlx5_ib_create_srq, uidx, inlen) !=
1188 !!cqe_version))
1189 return -EINVAL;
1190
1191 return verify_assign_uidx(cqe_version, ucmd->uidx, user_index);
1192 }
1193
1194 void mlx5_ib_cleanup_congestion(struct mlx5_ib_dev *);
1195 int mlx5_ib_init_congestion(struct mlx5_ib_dev *);
1196
1197 static inline int get_uars_per_sys_page(struct mlx5_ib_dev *dev, bool lib_support)
1198 {
1199 return lib_support && MLX5_CAP_GEN(dev->mdev, uar_4k) ?
1200 MLX5_UARS_IN_PAGE : 1;
1201 }
1202
1203 static inline int get_num_static_uars(struct mlx5_ib_dev *dev,
1204 struct mlx5_bfreg_info *bfregi)
1205 {
1206 return get_uars_per_sys_page(dev, bfregi->lib_uar_4k) * bfregi->num_static_sys_pages;
1207 }
1208
1209 int bfregn_to_uar_index(struct mlx5_ib_dev *dev,
1210 struct mlx5_bfreg_info *bfregi, u32 bfregn,
1211 bool dyn_bfreg);
1212
1213 #endif /* MLX5_IB_H */
Cache object: d9d0c57bfabbe646cdd03a96987605aa
|