FreeBSD/Linux Kernel Cross Reference
sys/dev/ena/ena.h
1 /*-
2 * SPDX-License-Identifier: BSD-2-Clause
3 *
4 * Copyright (c) 2015-2020 Amazon.com, Inc. or its affiliates.
5 * All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 *
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 *
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 *
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 *
30 * $FreeBSD$
31 *
32 */
33
34 #ifndef ENA_H
35 #define ENA_H
36
37 #include "opt_rss.h"
38
39 #include "ena-com/ena_com.h"
40 #include "ena-com/ena_eth_com.h"
41
42 #define DRV_MODULE_VER_MAJOR 2
43 #define DRV_MODULE_VER_MINOR 4
44 #define DRV_MODULE_VER_SUBMINOR 1
45
46 #define DRV_MODULE_NAME "ena"
47
48 #ifndef DRV_MODULE_VERSION
49 #define DRV_MODULE_VERSION \
50 __XSTRING(DRV_MODULE_VER_MAJOR) "." \
51 __XSTRING(DRV_MODULE_VER_MINOR) "." \
52 __XSTRING(DRV_MODULE_VER_SUBMINOR)
53 #endif
54 #define DEVICE_NAME "Elastic Network Adapter (ENA)"
55 #define DEVICE_DESC "ENA adapter"
56
57 /* Calculate DMA mask - width for ena cannot exceed 48, so it is safe */
58 #define ENA_DMA_BIT_MASK(x) ((1ULL << (x)) - 1ULL)
59
60 /* 1 for AENQ + ADMIN */
61 #define ENA_ADMIN_MSIX_VEC 1
62 #define ENA_MAX_MSIX_VEC(io_queues) (ENA_ADMIN_MSIX_VEC + (io_queues))
63
64 #define ENA_REG_BAR 0
65 #define ENA_MEM_BAR 2
66
67 #define ENA_BUS_DMA_SEGS 32
68
69 #define ENA_DEFAULT_BUF_RING_SIZE 4096
70
71 #define ENA_DEFAULT_RING_SIZE 1024
72 #define ENA_MIN_RING_SIZE 256
73
74 /*
75 * Refill Rx queue when number of required descriptors is above
76 * QUEUE_SIZE / ENA_RX_REFILL_THRESH_DIVIDER or ENA_RX_REFILL_THRESH_PACKET
77 */
78 #define ENA_RX_REFILL_THRESH_DIVIDER 8
79 #define ENA_RX_REFILL_THRESH_PACKET 256
80
81 #define ENA_IRQNAME_SIZE 40
82
83 #define ENA_PKT_MAX_BUFS 19
84
85 #define ENA_RX_RSS_TABLE_LOG_SIZE 7
86 #define ENA_RX_RSS_TABLE_SIZE (1 << ENA_RX_RSS_TABLE_LOG_SIZE)
87
88 #define ENA_HASH_KEY_SIZE 40
89
90 #define ENA_MAX_FRAME_LEN 10000
91 #define ENA_MIN_FRAME_LEN 60
92
93 #define ENA_TX_RESUME_THRESH (ENA_PKT_MAX_BUFS + 2)
94
95 #define DB_THRESHOLD 64
96
97 #define TX_COMMIT 32
98 /*
99 * TX budget for cleaning. It should be half of the RX budget to reduce amount
100 * of TCP retransmissions.
101 */
102 #define TX_BUDGET 128
103 /* RX cleanup budget. -1 stands for infinity. */
104 #define RX_BUDGET 256
105 /*
106 * How many times we can repeat cleanup in the io irq handling routine if the
107 * RX or TX budget was depleted.
108 */
109 #define CLEAN_BUDGET 8
110
111 #define RX_IRQ_INTERVAL 20
112 #define TX_IRQ_INTERVAL 50
113
114 #define ENA_MIN_MTU 128
115
116 #define ENA_TSO_MAXSIZE 65536
117
118 #define ENA_MMIO_DISABLE_REG_READ BIT(0)
119
120 #define ENA_TX_RING_IDX_NEXT(idx, ring_size) (((idx) + 1) & ((ring_size) - 1))
121
122 #define ENA_RX_RING_IDX_NEXT(idx, ring_size) (((idx) + 1) & ((ring_size) - 1))
123
124 #define ENA_IO_TXQ_IDX(q) (2 * (q))
125 #define ENA_IO_RXQ_IDX(q) (2 * (q) + 1)
126 #define ENA_IO_TXQ_IDX_TO_COMBINED_IDX(q) ((q) / 2)
127 #define ENA_IO_RXQ_IDX_TO_COMBINED_IDX(q) (((q) - 1) / 2)
128
129 #define ENA_MGMNT_IRQ_IDX 0
130 #define ENA_IO_IRQ_FIRST_IDX 1
131 #define ENA_IO_IRQ_IDX(q) (ENA_IO_IRQ_FIRST_IDX + (q))
132
133 #define ENA_MAX_NO_INTERRUPT_ITERATIONS 3
134
135 /*
136 * ENA device should send keep alive msg every 1 sec.
137 * We wait for 6 sec just to be on the safe side.
138 */
139 #define DEFAULT_KEEP_ALIVE_TO (SBT_1S * 6)
140
141 /* Time in jiffies before concluding the transmitter is hung. */
142 #define DEFAULT_TX_CMP_TO (SBT_1S * 5)
143
144 /* Number of queues to check for missing queues per timer tick */
145 #define DEFAULT_TX_MONITORED_QUEUES (4)
146
147 /* Max number of timeouted packets before device reset */
148 #define DEFAULT_TX_CMP_THRESHOLD (128)
149
150 /*
151 * Supported PCI vendor and devices IDs
152 */
153 #define PCI_VENDOR_ID_AMAZON 0x1d0f
154
155 #define PCI_DEV_ID_ENA_PF 0x0ec2
156 #define PCI_DEV_ID_ENA_PF_RSERV0 0x1ec2
157 #define PCI_DEV_ID_ENA_VF 0xec20
158 #define PCI_DEV_ID_ENA_VF_RSERV0 0xec21
159
160 /*
161 * Flags indicating current ENA driver state
162 */
163 enum ena_flags_t {
164 ENA_FLAG_DEVICE_RUNNING,
165 ENA_FLAG_DEV_UP,
166 ENA_FLAG_LINK_UP,
167 ENA_FLAG_MSIX_ENABLED,
168 ENA_FLAG_TRIGGER_RESET,
169 ENA_FLAG_ONGOING_RESET,
170 ENA_FLAG_DEV_UP_BEFORE_RESET,
171 ENA_FLAG_RSS_ACTIVE,
172 ENA_FLAGS_NUMBER = ENA_FLAG_RSS_ACTIVE
173 };
174
175 BITSET_DEFINE(_ena_state, ENA_FLAGS_NUMBER);
176 typedef struct _ena_state ena_state_t;
177
178 #define ENA_FLAG_ZERO(adapter) \
179 BIT_ZERO(ENA_FLAGS_NUMBER, &(adapter)->flags)
180 #define ENA_FLAG_ISSET(bit, adapter) \
181 BIT_ISSET(ENA_FLAGS_NUMBER, (bit), &(adapter)->flags)
182 #define ENA_FLAG_SET_ATOMIC(bit, adapter) \
183 BIT_SET_ATOMIC(ENA_FLAGS_NUMBER, (bit), &(adapter)->flags)
184 #define ENA_FLAG_CLEAR_ATOMIC(bit, adapter) \
185 BIT_CLR_ATOMIC(ENA_FLAGS_NUMBER, (bit), &(adapter)->flags)
186
187 struct msix_entry {
188 int entry;
189 int vector;
190 };
191
192 typedef struct _ena_vendor_info_t {
193 uint16_t vendor_id;
194 uint16_t device_id;
195 unsigned int index;
196 } ena_vendor_info_t;
197
198 struct ena_irq {
199 /* Interrupt resources */
200 struct resource *res;
201 driver_filter_t *handler;
202 void *data;
203 void *cookie;
204 unsigned int vector;
205 bool requested;
206 #ifdef RSS
207 int cpu;
208 #endif
209 char name[ENA_IRQNAME_SIZE];
210 };
211
212 struct ena_que {
213 struct ena_adapter *adapter;
214 struct ena_ring *tx_ring;
215 struct ena_ring *rx_ring;
216
217 struct task cleanup_task;
218 struct taskqueue *cleanup_tq;
219
220 uint32_t id;
221 #ifdef RSS
222 int cpu;
223 cpuset_t cpu_mask;
224 #endif
225 struct sysctl_oid *oid;
226 };
227
228 struct ena_calc_queue_size_ctx {
229 struct ena_com_dev_get_features_ctx *get_feat_ctx;
230 struct ena_com_dev *ena_dev;
231 device_t pdev;
232 uint32_t tx_queue_size;
233 uint32_t rx_queue_size;
234 uint32_t max_tx_queue_size;
235 uint32_t max_rx_queue_size;
236 uint16_t max_tx_sgl_size;
237 uint16_t max_rx_sgl_size;
238 };
239
240 #ifdef DEV_NETMAP
241 struct ena_netmap_tx_info {
242 uint32_t socket_buf_idx[ENA_PKT_MAX_BUFS];
243 bus_dmamap_t map_seg[ENA_PKT_MAX_BUFS];
244 unsigned int sockets_used;
245 };
246 #endif
247
248 struct ena_tx_buffer {
249 struct mbuf *mbuf;
250 /* # of ena desc for this specific mbuf
251 * (includes data desc and metadata desc) */
252 unsigned int tx_descs;
253 /* # of buffers used by this mbuf */
254 unsigned int num_of_bufs;
255
256 bus_dmamap_t dmamap;
257
258 /* Used to detect missing tx packets */
259 struct bintime timestamp;
260 bool print_once;
261
262 #ifdef DEV_NETMAP
263 struct ena_netmap_tx_info nm_info;
264 #endif /* DEV_NETMAP */
265
266 struct ena_com_buf bufs[ENA_PKT_MAX_BUFS];
267 } __aligned(CACHE_LINE_SIZE);
268
269 struct ena_rx_buffer {
270 struct mbuf *mbuf;
271 bus_dmamap_t map;
272 struct ena_com_buf ena_buf;
273 #ifdef DEV_NETMAP
274 uint32_t netmap_buf_idx;
275 #endif /* DEV_NETMAP */
276 } __aligned(CACHE_LINE_SIZE);
277
278 struct ena_stats_tx {
279 counter_u64_t cnt;
280 counter_u64_t bytes;
281 counter_u64_t prepare_ctx_err;
282 counter_u64_t dma_mapping_err;
283 counter_u64_t doorbells;
284 counter_u64_t missing_tx_comp;
285 counter_u64_t bad_req_id;
286 counter_u64_t collapse;
287 counter_u64_t collapse_err;
288 counter_u64_t queue_wakeup;
289 counter_u64_t queue_stop;
290 counter_u64_t llq_buffer_copy;
291 counter_u64_t unmask_interrupt_num;
292 };
293
294 struct ena_stats_rx {
295 counter_u64_t cnt;
296 counter_u64_t bytes;
297 counter_u64_t refil_partial;
298 counter_u64_t csum_bad;
299 counter_u64_t mjum_alloc_fail;
300 counter_u64_t mbuf_alloc_fail;
301 counter_u64_t dma_mapping_err;
302 counter_u64_t bad_desc_num;
303 counter_u64_t bad_req_id;
304 counter_u64_t empty_rx_ring;
305 counter_u64_t csum_good;
306 };
307
308 struct ena_ring {
309 /* Holds the empty requests for TX/RX out of order completions */
310 union {
311 uint16_t *free_tx_ids;
312 uint16_t *free_rx_ids;
313 };
314 struct ena_com_dev *ena_dev;
315 struct ena_adapter *adapter;
316 struct ena_com_io_cq *ena_com_io_cq;
317 struct ena_com_io_sq *ena_com_io_sq;
318
319 uint16_t qid;
320
321 /* Determines if device will use LLQ or normal mode for TX */
322 enum ena_admin_placement_policy_type tx_mem_queue_type;
323 union {
324 /* The maximum length the driver can push to the device (For LLQ) */
325 uint8_t tx_max_header_size;
326 /* The maximum (and default) mbuf size for the Rx descriptor. */
327 uint16_t rx_mbuf_sz;
328
329 };
330
331 bool first_interrupt;
332 uint16_t no_interrupt_event_cnt;
333
334 struct ena_com_rx_buf_info ena_bufs[ENA_PKT_MAX_BUFS];
335
336 struct ena_que *que;
337 struct lro_ctrl lro;
338
339 uint16_t next_to_use;
340 uint16_t next_to_clean;
341
342 union {
343 struct ena_tx_buffer *tx_buffer_info; /* contex of tx packet */
344 struct ena_rx_buffer *rx_buffer_info; /* contex of rx packet */
345 };
346 int ring_size; /* number of tx/rx_buffer_info's entries */
347
348 struct buf_ring *br; /* only for TX */
349 uint32_t buf_ring_size;
350
351 struct mtx ring_mtx;
352 char mtx_name[16];
353
354 struct {
355 struct task enqueue_task;
356 struct taskqueue *enqueue_tq;
357 };
358
359 union {
360 struct ena_stats_tx tx_stats;
361 struct ena_stats_rx rx_stats;
362 };
363
364 union {
365 int empty_rx_queue;
366 /* For Tx ring to indicate if it's running or not */
367 bool running;
368 };
369
370 /* How many packets are sent in one Tx loop, used for doorbells */
371 uint32_t acum_pkts;
372
373 /* Used for LLQ */
374 uint8_t *push_buf_intermediate_buf;
375
376 #ifdef DEV_NETMAP
377 bool initialized;
378 #endif /* DEV_NETMAP */
379 } __aligned(CACHE_LINE_SIZE);
380
381 struct ena_stats_dev {
382 counter_u64_t wd_expired;
383 counter_u64_t interface_up;
384 counter_u64_t interface_down;
385 counter_u64_t admin_q_pause;
386 };
387
388 struct ena_hw_stats {
389 counter_u64_t rx_packets;
390 counter_u64_t tx_packets;
391
392 counter_u64_t rx_bytes;
393 counter_u64_t tx_bytes;
394
395 counter_u64_t rx_drops;
396 counter_u64_t tx_drops;
397 };
398
399 /* Board specific private data structure */
400 struct ena_adapter {
401 struct ena_com_dev *ena_dev;
402
403 /* OS defined structs */
404 if_t ifp;
405 device_t pdev;
406 struct ifmedia media;
407
408 /* OS resources */
409 struct resource *memory;
410 struct resource *registers;
411 struct resource *msix;
412 int msix_rid;
413
414 /* MSI-X */
415 struct msix_entry *msix_entries;
416 int msix_vecs;
417
418 /* DMA tags used throughout the driver adapter for Tx and Rx */
419 bus_dma_tag_t tx_buf_tag;
420 bus_dma_tag_t rx_buf_tag;
421 int dma_width;
422
423 uint32_t max_mtu;
424
425 uint32_t num_io_queues;
426 uint32_t max_num_io_queues;
427
428 uint32_t requested_tx_ring_size;
429 uint32_t requested_rx_ring_size;
430
431 uint32_t max_tx_ring_size;
432 uint32_t max_rx_ring_size;
433
434 uint16_t max_tx_sgl_size;
435 uint16_t max_rx_sgl_size;
436
437 uint32_t tx_offload_cap;
438
439 uint32_t buf_ring_size;
440
441 /* RSS*/
442 struct ena_indir *rss_indir;
443
444 uint8_t mac_addr[ETHER_ADDR_LEN];
445 /* mdio and phy*/
446
447 ena_state_t flags;
448
449 /* Queue will represent one TX and one RX ring */
450 struct ena_que que[ENA_MAX_NUM_IO_QUEUES]
451 __aligned(CACHE_LINE_SIZE);
452
453 /* TX */
454 struct ena_ring tx_ring[ENA_MAX_NUM_IO_QUEUES]
455 __aligned(CACHE_LINE_SIZE);
456
457 /* RX */
458 struct ena_ring rx_ring[ENA_MAX_NUM_IO_QUEUES]
459 __aligned(CACHE_LINE_SIZE);
460
461 struct ena_irq irq_tbl[ENA_MAX_MSIX_VEC(ENA_MAX_NUM_IO_QUEUES)];
462
463 /* Timer service */
464 struct callout timer_service;
465 sbintime_t keep_alive_timestamp;
466 uint32_t next_monitored_tx_qid;
467 struct task reset_task;
468 struct taskqueue *reset_tq;
469 int wd_active;
470 sbintime_t keep_alive_timeout;
471 sbintime_t missing_tx_timeout;
472 uint32_t missing_tx_max_queues;
473 uint32_t missing_tx_threshold;
474 bool disable_meta_caching;
475
476 uint16_t eni_metrics_sample_interval;
477 uint16_t eni_metrics_sample_interval_cnt;
478
479 /* Statistics */
480 struct ena_stats_dev dev_stats;
481 struct ena_hw_stats hw_stats;
482 struct ena_admin_eni_stats eni_metrics;
483
484 enum ena_regs_reset_reason_types reset_reason;
485 };
486
487 #define ENA_RING_MTX_LOCK(_ring) mtx_lock(&(_ring)->ring_mtx)
488 #define ENA_RING_MTX_TRYLOCK(_ring) mtx_trylock(&(_ring)->ring_mtx)
489 #define ENA_RING_MTX_UNLOCK(_ring) mtx_unlock(&(_ring)->ring_mtx)
490 #define ENA_RING_MTX_ASSERT(_ring) \
491 mtx_assert(&(_ring)->ring_mtx, MA_OWNED)
492
493 #define ENA_LOCK_INIT() \
494 sx_init(&ena_global_lock, "ENA global lock")
495 #define ENA_LOCK_DESTROY() sx_destroy(&ena_global_lock)
496 #define ENA_LOCK_LOCK() sx_xlock(&ena_global_lock)
497 #define ENA_LOCK_UNLOCK() sx_unlock(&ena_global_lock)
498 #define ENA_LOCK_ASSERT() sx_assert(&ena_global_lock, SA_XLOCKED)
499
500 #define clamp_t(type, _x, min, max) min_t(type, max_t(type, _x, min), max)
501 #define clamp_val(val, lo, hi) clamp_t(__typeof(val), val, lo, hi)
502
503 extern struct sx ena_global_lock;
504
505 static inline int ena_mbuf_count(struct mbuf *mbuf)
506 {
507 int count = 1;
508
509 while ((mbuf = mbuf->m_next) != NULL)
510 ++count;
511
512 return count;
513 }
514
515 int ena_up(struct ena_adapter *adapter);
516 void ena_down(struct ena_adapter *adapter);
517 int ena_restore_device(struct ena_adapter *adapter);
518 void ena_destroy_device(struct ena_adapter *adapter, bool graceful);
519 int ena_refill_rx_bufs(struct ena_ring *rx_ring, uint32_t num);
520 int ena_update_buf_ring_size(struct ena_adapter *adapter,
521 uint32_t new_buf_ring_size);
522 int ena_update_queue_size(struct ena_adapter *adapter, uint32_t new_tx_size,
523 uint32_t new_rx_size);
524 int ena_update_io_queue_nb(struct ena_adapter *adapter, uint32_t new_num);
525
526 static inline void
527 ena_trigger_reset(struct ena_adapter *adapter,
528 enum ena_regs_reset_reason_types reset_reason)
529 {
530 if (likely(!ENA_FLAG_ISSET(ENA_FLAG_TRIGGER_RESET, adapter))) {
531 adapter->reset_reason = reset_reason;
532 ENA_FLAG_SET_ATOMIC(ENA_FLAG_TRIGGER_RESET, adapter);
533 }
534 }
535
536 #endif /* !(ENA_H) */
Cache object: 88d30ab22a5223de2f5a3ebe583b72a4
|