FreeBSD/Linux Kernel Cross Reference
sys/dev/sfxge/sfxge.c
1 /*-
2 * Copyright (c) 2010-2016 Solarflare Communications Inc.
3 * All rights reserved.
4 *
5 * This software was developed in part by Philip Paeps under contract for
6 * Solarflare Communications, Inc.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions are met:
10 *
11 * 1. Redistributions of source code must retain the above copyright notice,
12 * this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright notice,
14 * this list of conditions and the following disclaimer in the documentation
15 * and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
19 * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
20 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
21 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
22 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
23 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
24 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
25 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
26 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
27 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 *
29 * The views and conclusions contained in the software and documentation are
30 * those of the authors and should not be interpreted as representing official
31 * policies, either expressed or implied, of the FreeBSD Project.
32 */
33
34 #include <sys/cdefs.h>
35 __FBSDID("$FreeBSD: releng/11.2/sys/dev/sfxge/sfxge.c 332288 2018-04-08 16:54:07Z brooks $");
36
37 #include "opt_rss.h"
38
39 #include <sys/param.h>
40 #include <sys/kernel.h>
41 #include <sys/bus.h>
42 #include <sys/rman.h>
43 #include <sys/lock.h>
44 #include <sys/module.h>
45 #include <sys/mutex.h>
46 #include <sys/smp.h>
47 #include <sys/socket.h>
48 #include <sys/taskqueue.h>
49 #include <sys/sockio.h>
50 #include <sys/sysctl.h>
51 #include <sys/priv.h>
52 #include <sys/syslog.h>
53
54 #include <dev/pci/pcireg.h>
55 #include <dev/pci/pcivar.h>
56
57 #include <net/ethernet.h>
58 #include <net/if.h>
59 #include <net/if_var.h>
60 #include <net/if_media.h>
61 #include <net/if_types.h>
62
63 #ifdef RSS
64 #include <net/rss_config.h>
65 #endif
66
67 #include "common/efx.h"
68
69 #include "sfxge.h"
70 #include "sfxge_rx.h"
71 #include "sfxge_ioc.h"
72 #include "sfxge_version.h"
73
/* Interface capabilities advertised through if_capabilities. */
#define	SFXGE_CAP							\
	(IFCAP_VLAN_MTU | IFCAP_VLAN_HWCSUM |				\
	 IFCAP_RXCSUM | IFCAP_TXCSUM |					\
	 IFCAP_RXCSUM_IPV6 | IFCAP_TXCSUM_IPV6 |			\
	 IFCAP_TSO4 | IFCAP_TSO6 |					\
	 IFCAP_JUMBO_MTU |						\
	 IFCAP_VLAN_HWTSO | IFCAP_LINKSTATE | IFCAP_HWSTATS)

/* Capabilities enabled by default (if_capenable): all of SFXGE_CAP. */
#define	SFXGE_CAP_ENABLE	SFXGE_CAP

/* Capabilities whose state SIOCSIFCAP refuses to change (EINVAL). */
#define	SFXGE_CAP_FIXED							\
	(IFCAP_VLAN_MTU |						\
	 IFCAP_JUMBO_MTU | IFCAP_LINKSTATE | IFCAP_HWSTATS)
83
84 MALLOC_DEFINE(M_SFXGE, "sfxge", "Solarflare 10GigE driver");
85
86
87 SYSCTL_NODE(_hw, OID_AUTO, sfxge, CTLFLAG_RD, 0,
88 "SFXGE driver parameters");
89
90 #define SFXGE_PARAM_RX_RING SFXGE_PARAM(rx_ring)
91 static int sfxge_rx_ring_entries = SFXGE_NDESCS;
92 TUNABLE_INT(SFXGE_PARAM_RX_RING, &sfxge_rx_ring_entries);
93 SYSCTL_INT(_hw_sfxge, OID_AUTO, rx_ring, CTLFLAG_RDTUN,
94 &sfxge_rx_ring_entries, 0,
95 "Maximum number of descriptors in a receive ring");
96
97 #define SFXGE_PARAM_TX_RING SFXGE_PARAM(tx_ring)
98 static int sfxge_tx_ring_entries = SFXGE_NDESCS;
99 TUNABLE_INT(SFXGE_PARAM_TX_RING, &sfxge_tx_ring_entries);
100 SYSCTL_INT(_hw_sfxge, OID_AUTO, tx_ring, CTLFLAG_RDTUN,
101 &sfxge_tx_ring_entries, 0,
102 "Maximum number of descriptors in a transmit ring");
103
104 #define SFXGE_PARAM_RESTART_ATTEMPTS SFXGE_PARAM(restart_attempts)
105 static int sfxge_restart_attempts = 3;
106 TUNABLE_INT(SFXGE_PARAM_RESTART_ATTEMPTS, &sfxge_restart_attempts);
107 SYSCTL_INT(_hw_sfxge, OID_AUTO, restart_attempts, CTLFLAG_RDTUN,
108 &sfxge_restart_attempts, 0,
109 "Maximum number of attempts to bring interface up after reset");
110
111 #if EFSYS_OPT_MCDI_LOGGING
112 #define SFXGE_PARAM_MCDI_LOGGING SFXGE_PARAM(mcdi_logging)
113 static int sfxge_mcdi_logging = 0;
114 TUNABLE_INT(SFXGE_PARAM_MCDI_LOGGING, &sfxge_mcdi_logging);
115 #endif
116
117 static void
118 sfxge_reset(void *arg, int npending);
119
120 static int
121 sfxge_estimate_rsrc_limits(struct sfxge_softc *sc)
122 {
123 efx_drv_limits_t limits;
124 int rc;
125 unsigned int evq_max;
126 uint32_t evq_allocated;
127 uint32_t rxq_allocated;
128 uint32_t txq_allocated;
129
130 /*
131 * Limit the number of event queues to:
132 * - number of CPUs
133 * - hardwire maximum RSS channels
134 * - administratively specified maximum RSS channels
135 */
136 #ifdef RSS
137 /*
138 * Avoid extra limitations so that the number of queues
139 * may be configured at administrator's will
140 */
141 evq_max = MIN(MAX(rss_getnumbuckets(), 1), EFX_MAXRSS);
142 #else
143 evq_max = MIN(mp_ncpus, EFX_MAXRSS);
144 #endif
145 if (sc->max_rss_channels > 0)
146 evq_max = MIN(evq_max, sc->max_rss_channels);
147
148 memset(&limits, 0, sizeof(limits));
149
150 limits.edl_min_evq_count = 1;
151 limits.edl_max_evq_count = evq_max;
152 limits.edl_min_txq_count = SFXGE_TXQ_NTYPES;
153 limits.edl_max_txq_count = evq_max + SFXGE_TXQ_NTYPES - 1;
154 limits.edl_min_rxq_count = 1;
155 limits.edl_max_rxq_count = evq_max;
156
157 efx_nic_set_drv_limits(sc->enp, &limits);
158
159 if ((rc = efx_nic_init(sc->enp)) != 0)
160 return (rc);
161
162 rc = efx_nic_get_vi_pool(sc->enp, &evq_allocated, &rxq_allocated,
163 &txq_allocated);
164 if (rc != 0) {
165 efx_nic_fini(sc->enp);
166 return (rc);
167 }
168
169 KASSERT(txq_allocated >= SFXGE_TXQ_NTYPES,
170 ("txq_allocated < SFXGE_TXQ_NTYPES"));
171
172 sc->evq_max = MIN(evq_allocated, evq_max);
173 sc->evq_max = MIN(rxq_allocated, sc->evq_max);
174 sc->evq_max = MIN(txq_allocated - (SFXGE_TXQ_NTYPES - 1),
175 sc->evq_max);
176
177 KASSERT(sc->evq_max <= evq_max,
178 ("allocated more than maximum requested"));
179
180 #ifdef RSS
181 if (sc->evq_max < rss_getnumbuckets())
182 device_printf(sc->dev, "The number of allocated queues (%u) "
183 "is less than the number of RSS buckets (%u); "
184 "performance degradation might be observed",
185 sc->evq_max, rss_getnumbuckets());
186 #endif
187
188 /*
189 * NIC is kept initialized in the case of success to be able to
190 * initialize port to find out media types.
191 */
192 return (0);
193 }
194
195 static int
196 sfxge_set_drv_limits(struct sfxge_softc *sc)
197 {
198 efx_drv_limits_t limits;
199
200 memset(&limits, 0, sizeof(limits));
201
202 /* Limits are strict since take into account initial estimation */
203 limits.edl_min_evq_count = limits.edl_max_evq_count =
204 sc->intr.n_alloc;
205 limits.edl_min_txq_count = limits.edl_max_txq_count =
206 sc->intr.n_alloc + SFXGE_TXQ_NTYPES - 1;
207 limits.edl_min_rxq_count = limits.edl_max_rxq_count =
208 sc->intr.n_alloc;
209
210 return (efx_nic_set_drv_limits(sc->enp, &limits));
211 }
212
213 static int
214 sfxge_start(struct sfxge_softc *sc)
215 {
216 int rc;
217
218 SFXGE_ADAPTER_LOCK_ASSERT_OWNED(sc);
219
220 if (sc->init_state == SFXGE_STARTED)
221 return (0);
222
223 if (sc->init_state != SFXGE_REGISTERED) {
224 rc = EINVAL;
225 goto fail;
226 }
227
228 /* Set required resource limits */
229 if ((rc = sfxge_set_drv_limits(sc)) != 0)
230 goto fail;
231
232 if ((rc = efx_nic_init(sc->enp)) != 0)
233 goto fail;
234
235 /* Start processing interrupts. */
236 if ((rc = sfxge_intr_start(sc)) != 0)
237 goto fail2;
238
239 /* Start processing events. */
240 if ((rc = sfxge_ev_start(sc)) != 0)
241 goto fail3;
242
243 /* Fire up the port. */
244 if ((rc = sfxge_port_start(sc)) != 0)
245 goto fail4;
246
247 /* Start the receiver side. */
248 if ((rc = sfxge_rx_start(sc)) != 0)
249 goto fail5;
250
251 /* Start the transmitter side. */
252 if ((rc = sfxge_tx_start(sc)) != 0)
253 goto fail6;
254
255 sc->init_state = SFXGE_STARTED;
256
257 /* Tell the stack we're running. */
258 sc->ifnet->if_drv_flags |= IFF_DRV_RUNNING;
259 sc->ifnet->if_drv_flags &= ~IFF_DRV_OACTIVE;
260
261 return (0);
262
263 fail6:
264 sfxge_rx_stop(sc);
265
266 fail5:
267 sfxge_port_stop(sc);
268
269 fail4:
270 sfxge_ev_stop(sc);
271
272 fail3:
273 sfxge_intr_stop(sc);
274
275 fail2:
276 efx_nic_fini(sc->enp);
277
278 fail:
279 device_printf(sc->dev, "sfxge_start: %d\n", rc);
280
281 return (rc);
282 }
283
/*
 * if_init callback: start the adapter under the adapter lock.
 * The result of sfxge_start() is deliberately discarded.
 */
static void
sfxge_if_init(void *arg)
{
	struct sfxge_softc *sc = (struct sfxge_softc *)arg;

	SFXGE_ADAPTER_LOCK(sc);
	(void)sfxge_start(sc);
	SFXGE_ADAPTER_UNLOCK(sc);
}
295
296 static void
297 sfxge_stop(struct sfxge_softc *sc)
298 {
299 SFXGE_ADAPTER_LOCK_ASSERT_OWNED(sc);
300
301 if (sc->init_state != SFXGE_STARTED)
302 return;
303
304 sc->init_state = SFXGE_REGISTERED;
305
306 /* Stop the transmitter. */
307 sfxge_tx_stop(sc);
308
309 /* Stop the receiver. */
310 sfxge_rx_stop(sc);
311
312 /* Stop the port. */
313 sfxge_port_stop(sc);
314
315 /* Stop processing events. */
316 sfxge_ev_stop(sc);
317
318 /* Stop processing interrupts. */
319 sfxge_intr_stop(sc);
320
321 efx_nic_fini(sc->enp);
322
323 sc->ifnet->if_drv_flags &= ~IFF_DRV_RUNNING;
324 }
325
326
327 static int
328 sfxge_vpd_ioctl(struct sfxge_softc *sc, sfxge_ioc_t *ioc)
329 {
330 efx_vpd_value_t value;
331 int rc = 0;
332
333 switch (ioc->u.vpd.op) {
334 case SFXGE_VPD_OP_GET_KEYWORD:
335 value.evv_tag = ioc->u.vpd.tag;
336 value.evv_keyword = ioc->u.vpd.keyword;
337 rc = efx_vpd_get(sc->enp, sc->vpd_data, sc->vpd_size, &value);
338 if (rc != 0)
339 break;
340 ioc->u.vpd.len = MIN(ioc->u.vpd.len, value.evv_length);
341 if (ioc->u.vpd.payload != 0) {
342 rc = copyout(value.evv_value, ioc->u.vpd.payload,
343 ioc->u.vpd.len);
344 }
345 break;
346 case SFXGE_VPD_OP_SET_KEYWORD:
347 if (ioc->u.vpd.len > sizeof(value.evv_value))
348 return (EINVAL);
349 value.evv_tag = ioc->u.vpd.tag;
350 value.evv_keyword = ioc->u.vpd.keyword;
351 value.evv_length = ioc->u.vpd.len;
352 rc = copyin(ioc->u.vpd.payload, value.evv_value, value.evv_length);
353 if (rc != 0)
354 break;
355 rc = efx_vpd_set(sc->enp, sc->vpd_data, sc->vpd_size, &value);
356 if (rc != 0)
357 break;
358 rc = efx_vpd_verify(sc->enp, sc->vpd_data, sc->vpd_size);
359 if (rc != 0)
360 break;
361 rc = efx_vpd_write(sc->enp, sc->vpd_data, sc->vpd_size);
362 break;
363 default:
364 rc = EOPNOTSUPP;
365 break;
366 }
367
368 return (rc);
369 }
370
371 static int
372 sfxge_private_ioctl(struct sfxge_softc *sc, sfxge_ioc_t *ioc)
373 {
374 switch (ioc->op) {
375 case SFXGE_MCDI_IOC:
376 return (sfxge_mcdi_ioctl(sc, ioc));
377 case SFXGE_NVRAM_IOC:
378 return (sfxge_nvram_ioctl(sc, ioc));
379 case SFXGE_VPD_IOC:
380 return (sfxge_vpd_ioctl(sc, ioc));
381 default:
382 return (EOPNOTSUPP);
383 }
384 }
385
386
387 static int
388 sfxge_if_ioctl(struct ifnet *ifp, unsigned long command, caddr_t data)
389 {
390 struct sfxge_softc *sc;
391 struct ifreq *ifr;
392 sfxge_ioc_t ioc;
393 int error;
394
395 ifr = (struct ifreq *)data;
396 sc = ifp->if_softc;
397 error = 0;
398
399 switch (command) {
400 case SIOCSIFFLAGS:
401 SFXGE_ADAPTER_LOCK(sc);
402 if (ifp->if_flags & IFF_UP) {
403 if (ifp->if_drv_flags & IFF_DRV_RUNNING) {
404 if ((ifp->if_flags ^ sc->if_flags) &
405 (IFF_PROMISC | IFF_ALLMULTI)) {
406 sfxge_mac_filter_set(sc);
407 }
408 } else
409 sfxge_start(sc);
410 } else
411 if (ifp->if_drv_flags & IFF_DRV_RUNNING)
412 sfxge_stop(sc);
413 sc->if_flags = ifp->if_flags;
414 SFXGE_ADAPTER_UNLOCK(sc);
415 break;
416 case SIOCSIFMTU:
417 if (ifr->ifr_mtu == ifp->if_mtu) {
418 /* Nothing to do */
419 error = 0;
420 } else if (ifr->ifr_mtu > SFXGE_MAX_MTU) {
421 error = EINVAL;
422 } else if (!(ifp->if_drv_flags & IFF_DRV_RUNNING)) {
423 ifp->if_mtu = ifr->ifr_mtu;
424 error = 0;
425 } else {
426 /* Restart required */
427 SFXGE_ADAPTER_LOCK(sc);
428 sfxge_stop(sc);
429 ifp->if_mtu = ifr->ifr_mtu;
430 error = sfxge_start(sc);
431 SFXGE_ADAPTER_UNLOCK(sc);
432 if (error != 0) {
433 ifp->if_flags &= ~IFF_UP;
434 ifp->if_drv_flags &= ~IFF_DRV_RUNNING;
435 if_down(ifp);
436 }
437 }
438 break;
439 case SIOCADDMULTI:
440 case SIOCDELMULTI:
441 if (ifp->if_drv_flags & IFF_DRV_RUNNING)
442 sfxge_mac_filter_set(sc);
443 break;
444 case SIOCSIFCAP:
445 {
446 int reqcap = ifr->ifr_reqcap;
447 int capchg_mask;
448
449 SFXGE_ADAPTER_LOCK(sc);
450
451 /* Capabilities to be changed in accordance with request */
452 capchg_mask = ifp->if_capenable ^ reqcap;
453
454 /*
455 * The networking core already rejects attempts to
456 * enable capabilities we don't have. We still have
457 * to reject attempts to disable capabilities that we
458 * can't (yet) disable.
459 */
460 KASSERT((reqcap & ~ifp->if_capabilities) == 0,
461 ("Unsupported capabilities 0x%x requested 0x%x vs "
462 "supported 0x%x",
463 reqcap & ~ifp->if_capabilities,
464 reqcap , ifp->if_capabilities));
465 if (capchg_mask & SFXGE_CAP_FIXED) {
466 error = EINVAL;
467 SFXGE_ADAPTER_UNLOCK(sc);
468 break;
469 }
470
471 /* Check request before any changes */
472 if ((capchg_mask & IFCAP_TSO4) &&
473 (reqcap & (IFCAP_TSO4 | IFCAP_TXCSUM)) == IFCAP_TSO4) {
474 error = EAGAIN;
475 SFXGE_ADAPTER_UNLOCK(sc);
476 if_printf(ifp, "enable txcsum before tso4\n");
477 break;
478 }
479 if ((capchg_mask & IFCAP_TSO6) &&
480 (reqcap & (IFCAP_TSO6 | IFCAP_TXCSUM_IPV6)) == IFCAP_TSO6) {
481 error = EAGAIN;
482 SFXGE_ADAPTER_UNLOCK(sc);
483 if_printf(ifp, "enable txcsum6 before tso6\n");
484 break;
485 }
486
487 if (reqcap & IFCAP_TXCSUM) {
488 ifp->if_hwassist |= (CSUM_IP | CSUM_TCP | CSUM_UDP);
489 } else {
490 ifp->if_hwassist &= ~(CSUM_IP | CSUM_TCP | CSUM_UDP);
491 if (reqcap & IFCAP_TSO4) {
492 reqcap &= ~IFCAP_TSO4;
493 if_printf(ifp,
494 "tso4 disabled due to -txcsum\n");
495 }
496 }
497 if (reqcap & IFCAP_TXCSUM_IPV6) {
498 ifp->if_hwassist |= (CSUM_TCP_IPV6 | CSUM_UDP_IPV6);
499 } else {
500 ifp->if_hwassist &= ~(CSUM_TCP_IPV6 | CSUM_UDP_IPV6);
501 if (reqcap & IFCAP_TSO6) {
502 reqcap &= ~IFCAP_TSO6;
503 if_printf(ifp,
504 "tso6 disabled due to -txcsum6\n");
505 }
506 }
507
508 /*
509 * The kernel takes both IFCAP_TSOx and CSUM_TSO into
510 * account before using TSO. So, we do not touch
511 * checksum flags when IFCAP_TSOx is modified.
512 * Note that CSUM_TSO is (CSUM_IP_TSO|CSUM_IP6_TSO),
513 * but both bits are set in IPv4 and IPv6 mbufs.
514 */
515
516 ifp->if_capenable = reqcap;
517
518 SFXGE_ADAPTER_UNLOCK(sc);
519 break;
520 }
521 case SIOCSIFMEDIA:
522 case SIOCGIFMEDIA:
523 error = ifmedia_ioctl(ifp, ifr, &sc->media, command);
524 break;
525 #ifdef SIOCGI2C
526 case SIOCGI2C:
527 {
528 struct ifi2creq i2c;
529
530 error = copyin(ifr_data_get_ptr(ifr), &i2c, sizeof(i2c));
531 if (error != 0)
532 break;
533
534 if (i2c.len > sizeof(i2c.data)) {
535 error = EINVAL;
536 break;
537 }
538
539 SFXGE_ADAPTER_LOCK(sc);
540 error = efx_phy_module_get_info(sc->enp, i2c.dev_addr,
541 i2c.offset, i2c.len,
542 &i2c.data[0]);
543 SFXGE_ADAPTER_UNLOCK(sc);
544 if (error == 0)
545 error = copyout(&i2c, ifr_data_get_ptr(ifr),
546 sizeof(i2c));
547 break;
548 }
549 #endif
550 case SIOCGPRIVATE_0:
551 error = priv_check(curthread, PRIV_DRIVER);
552 if (error != 0)
553 break;
554 error = copyin(ifr_data_get_ptr(ifr), &ioc, sizeof(ioc));
555 if (error != 0)
556 return (error);
557 error = sfxge_private_ioctl(sc, &ioc);
558 if (error == 0) {
559 error = copyout(&ioc, ifr_data_get_ptr(ifr),
560 sizeof(ioc));
561 }
562 break;
563 default:
564 error = ether_ioctl(ifp, command, data);
565 }
566
567 return (error);
568 }
569
570 static void
571 sfxge_ifnet_fini(struct ifnet *ifp)
572 {
573 struct sfxge_softc *sc = ifp->if_softc;
574
575 SFXGE_ADAPTER_LOCK(sc);
576 sfxge_stop(sc);
577 SFXGE_ADAPTER_UNLOCK(sc);
578
579 ifmedia_removeall(&sc->media);
580 ether_ifdetach(ifp);
581 if_free(ifp);
582 }
583
584 static int
585 sfxge_ifnet_init(struct ifnet *ifp, struct sfxge_softc *sc)
586 {
587 const efx_nic_cfg_t *encp = efx_nic_cfg_get(sc->enp);
588 device_t dev;
589 int rc;
590
591 dev = sc->dev;
592 sc->ifnet = ifp;
593
594 if_initname(ifp, device_get_name(dev), device_get_unit(dev));
595 ifp->if_init = sfxge_if_init;
596 ifp->if_softc = sc;
597 ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST;
598 ifp->if_ioctl = sfxge_if_ioctl;
599
600 ifp->if_capabilities = SFXGE_CAP;
601 ifp->if_capenable = SFXGE_CAP_ENABLE;
602 ifp->if_hw_tsomax = SFXGE_TSO_MAX_SIZE;
603 ifp->if_hw_tsomaxsegcount = SFXGE_TX_MAPPING_MAX_SEG;
604 ifp->if_hw_tsomaxsegsize = PAGE_SIZE;
605
606 #ifdef SFXGE_LRO
607 ifp->if_capabilities |= IFCAP_LRO;
608 ifp->if_capenable |= IFCAP_LRO;
609 #endif
610
611 if (encp->enc_hw_tx_insert_vlan_enabled) {
612 ifp->if_capabilities |= IFCAP_VLAN_HWTAGGING;
613 ifp->if_capenable |= IFCAP_VLAN_HWTAGGING;
614 }
615 ifp->if_hwassist = CSUM_TCP | CSUM_UDP | CSUM_IP | CSUM_TSO |
616 CSUM_TCP_IPV6 | CSUM_UDP_IPV6;
617
618 ether_ifattach(ifp, encp->enc_mac_addr);
619
620 ifp->if_transmit = sfxge_if_transmit;
621 ifp->if_qflush = sfxge_if_qflush;
622
623 ifp->if_get_counter = sfxge_get_counter;
624
625 DBGPRINT(sc->dev, "ifmedia_init");
626 if ((rc = sfxge_port_ifmedia_init(sc)) != 0)
627 goto fail;
628
629 return (0);
630
631 fail:
632 ether_ifdetach(sc->ifnet);
633 return (rc);
634 }
635
636 void
637 sfxge_sram_buf_tbl_alloc(struct sfxge_softc *sc, size_t n, uint32_t *idp)
638 {
639 KASSERT(sc->buffer_table_next + n <=
640 efx_nic_cfg_get(sc->enp)->enc_buftbl_limit,
641 ("buffer table full"));
642
643 *idp = sc->buffer_table_next;
644 sc->buffer_table_next += n;
645 }
646
647 static int
648 sfxge_bar_init(struct sfxge_softc *sc)
649 {
650 efsys_bar_t *esbp = &sc->bar;
651
652 esbp->esb_rid = PCIR_BAR(EFX_MEM_BAR);
653 if ((esbp->esb_res = bus_alloc_resource_any(sc->dev, SYS_RES_MEMORY,
654 &esbp->esb_rid, RF_ACTIVE)) == NULL) {
655 device_printf(sc->dev, "Cannot allocate BAR region %d\n",
656 EFX_MEM_BAR);
657 return (ENXIO);
658 }
659 esbp->esb_tag = rman_get_bustag(esbp->esb_res);
660 esbp->esb_handle = rman_get_bushandle(esbp->esb_res);
661
662 SFXGE_BAR_LOCK_INIT(esbp, device_get_nameunit(sc->dev));
663
664 return (0);
665 }
666
667 static void
668 sfxge_bar_fini(struct sfxge_softc *sc)
669 {
670 efsys_bar_t *esbp = &sc->bar;
671
672 bus_release_resource(sc->dev, SYS_RES_MEMORY, esbp->esb_rid,
673 esbp->esb_res);
674 SFXGE_BAR_LOCK_DESTROY(esbp);
675 }
676
677 static int
678 sfxge_create(struct sfxge_softc *sc)
679 {
680 device_t dev;
681 efx_nic_t *enp;
682 int error;
683 char rss_param_name[sizeof(SFXGE_PARAM(%d.max_rss_channels))];
684 #if EFSYS_OPT_MCDI_LOGGING
685 char mcdi_log_param_name[sizeof(SFXGE_PARAM(%d.mcdi_logging))];
686 #endif
687
688 dev = sc->dev;
689
690 SFXGE_ADAPTER_LOCK_INIT(sc, device_get_nameunit(sc->dev));
691
692 sc->max_rss_channels = 0;
693 snprintf(rss_param_name, sizeof(rss_param_name),
694 SFXGE_PARAM(%d.max_rss_channels),
695 (int)device_get_unit(dev));
696 TUNABLE_INT_FETCH(rss_param_name, &sc->max_rss_channels);
697 #if EFSYS_OPT_MCDI_LOGGING
698 sc->mcdi_logging = sfxge_mcdi_logging;
699 snprintf(mcdi_log_param_name, sizeof(mcdi_log_param_name),
700 SFXGE_PARAM(%d.mcdi_logging),
701 (int)device_get_unit(dev));
702 TUNABLE_INT_FETCH(mcdi_log_param_name, &sc->mcdi_logging);
703 #endif
704
705 sc->stats_node = SYSCTL_ADD_NODE(
706 device_get_sysctl_ctx(dev),
707 SYSCTL_CHILDREN(device_get_sysctl_tree(dev)),
708 OID_AUTO, "stats", CTLFLAG_RD, NULL, "Statistics");
709 if (sc->stats_node == NULL) {
710 error = ENOMEM;
711 goto fail;
712 }
713
714 TASK_INIT(&sc->task_reset, 0, sfxge_reset, sc);
715
716 (void) pci_enable_busmaster(dev);
717
718 /* Initialize DMA mappings. */
719 DBGPRINT(sc->dev, "dma_init...");
720 if ((error = sfxge_dma_init(sc)) != 0)
721 goto fail;
722
723 /* Map the device registers. */
724 DBGPRINT(sc->dev, "bar_init...");
725 if ((error = sfxge_bar_init(sc)) != 0)
726 goto fail;
727
728 error = efx_family(pci_get_vendor(dev), pci_get_device(dev),
729 &sc->family);
730 KASSERT(error == 0, ("Family should be filtered by sfxge_probe()"));
731
732 DBGPRINT(sc->dev, "nic_create...");
733
734 /* Create the common code nic object. */
735 SFXGE_EFSYS_LOCK_INIT(&sc->enp_lock,
736 device_get_nameunit(sc->dev), "nic");
737 if ((error = efx_nic_create(sc->family, (efsys_identifier_t *)sc,
738 &sc->bar, &sc->enp_lock, &enp)) != 0)
739 goto fail3;
740 sc->enp = enp;
741
742 /* Initialize MCDI to talk to the microcontroller. */
743 DBGPRINT(sc->dev, "mcdi_init...");
744 if ((error = sfxge_mcdi_init(sc)) != 0)
745 goto fail4;
746
747 /* Probe the NIC and build the configuration data area. */
748 DBGPRINT(sc->dev, "nic_probe...");
749 if ((error = efx_nic_probe(enp)) != 0)
750 goto fail5;
751
752 if (!ISP2(sfxge_rx_ring_entries) ||
753 (sfxge_rx_ring_entries < EFX_RXQ_MINNDESCS) ||
754 (sfxge_rx_ring_entries > EFX_RXQ_MAXNDESCS)) {
755 log(LOG_ERR, "%s=%d must be power of 2 from %u to %u",
756 SFXGE_PARAM_RX_RING, sfxge_rx_ring_entries,
757 EFX_RXQ_MINNDESCS, EFX_RXQ_MAXNDESCS);
758 error = EINVAL;
759 goto fail_rx_ring_entries;
760 }
761 sc->rxq_entries = sfxge_rx_ring_entries;
762
763 if (!ISP2(sfxge_tx_ring_entries) ||
764 (sfxge_tx_ring_entries < EFX_TXQ_MINNDESCS) ||
765 (sfxge_tx_ring_entries > EFX_TXQ_MAXNDESCS(efx_nic_cfg_get(enp)))) {
766 log(LOG_ERR, "%s=%d must be power of 2 from %u to %u",
767 SFXGE_PARAM_TX_RING, sfxge_tx_ring_entries,
768 EFX_TXQ_MINNDESCS, EFX_TXQ_MAXNDESCS(efx_nic_cfg_get(enp)));
769 error = EINVAL;
770 goto fail_tx_ring_entries;
771 }
772 sc->txq_entries = sfxge_tx_ring_entries;
773
774 SYSCTL_ADD_STRING(device_get_sysctl_ctx(dev),
775 SYSCTL_CHILDREN(device_get_sysctl_tree(dev)),
776 OID_AUTO, "version", CTLFLAG_RD,
777 SFXGE_VERSION_STRING, 0,
778 "Driver version");
779
780 SYSCTL_ADD_UINT(device_get_sysctl_ctx(dev),
781 SYSCTL_CHILDREN(device_get_sysctl_tree(dev)),
782 OID_AUTO, "phy_type", CTLFLAG_RD,
783 NULL, efx_nic_cfg_get(enp)->enc_phy_type,
784 "PHY type");
785
786 /* Initialize the NVRAM. */
787 DBGPRINT(sc->dev, "nvram_init...");
788 if ((error = efx_nvram_init(enp)) != 0)
789 goto fail6;
790
791 /* Initialize the VPD. */
792 DBGPRINT(sc->dev, "vpd_init...");
793 if ((error = efx_vpd_init(enp)) != 0)
794 goto fail7;
795
796 efx_mcdi_new_epoch(enp);
797
798 /* Reset the NIC. */
799 DBGPRINT(sc->dev, "nic_reset...");
800 if ((error = efx_nic_reset(enp)) != 0)
801 goto fail8;
802
803 /* Initialize buffer table allocation. */
804 sc->buffer_table_next = 0;
805
806 /*
807 * Guarantee minimum and estimate maximum number of event queues
808 * to take it into account when MSI-X interrupts are allocated.
809 * It initializes NIC and keeps it initialized on success.
810 */
811 if ((error = sfxge_estimate_rsrc_limits(sc)) != 0)
812 goto fail8;
813
814 /* Set up interrupts. */
815 DBGPRINT(sc->dev, "intr_init...");
816 if ((error = sfxge_intr_init(sc)) != 0)
817 goto fail9;
818
819 /* Initialize event processing state. */
820 DBGPRINT(sc->dev, "ev_init...");
821 if ((error = sfxge_ev_init(sc)) != 0)
822 goto fail11;
823
824 /* Initialize port state. */
825 DBGPRINT(sc->dev, "port_init...");
826 if ((error = sfxge_port_init(sc)) != 0)
827 goto fail12;
828
829 /* Initialize receive state. */
830 DBGPRINT(sc->dev, "rx_init...");
831 if ((error = sfxge_rx_init(sc)) != 0)
832 goto fail13;
833
834 /* Initialize transmit state. */
835 DBGPRINT(sc->dev, "tx_init...");
836 if ((error = sfxge_tx_init(sc)) != 0)
837 goto fail14;
838
839 sc->init_state = SFXGE_INITIALIZED;
840
841 DBGPRINT(sc->dev, "success");
842 return (0);
843
844 fail14:
845 sfxge_rx_fini(sc);
846
847 fail13:
848 sfxge_port_fini(sc);
849
850 fail12:
851 sfxge_ev_fini(sc);
852
853 fail11:
854 sfxge_intr_fini(sc);
855
856 fail9:
857 efx_nic_fini(sc->enp);
858
859 fail8:
860 efx_vpd_fini(enp);
861
862 fail7:
863 efx_nvram_fini(enp);
864
865 fail6:
866 fail_tx_ring_entries:
867 fail_rx_ring_entries:
868 efx_nic_unprobe(enp);
869
870 fail5:
871 sfxge_mcdi_fini(sc);
872
873 fail4:
874 sc->enp = NULL;
875 efx_nic_destroy(enp);
876 SFXGE_EFSYS_LOCK_DESTROY(&sc->enp_lock);
877
878 fail3:
879 sfxge_bar_fini(sc);
880 (void) pci_disable_busmaster(sc->dev);
881
882 fail:
883 DBGPRINT(sc->dev, "failed %d", error);
884 sc->dev = NULL;
885 SFXGE_ADAPTER_LOCK_DESTROY(sc);
886 return (error);
887 }
888
889 static void
890 sfxge_destroy(struct sfxge_softc *sc)
891 {
892 efx_nic_t *enp;
893
894 /* Clean up transmit state. */
895 sfxge_tx_fini(sc);
896
897 /* Clean up receive state. */
898 sfxge_rx_fini(sc);
899
900 /* Clean up port state. */
901 sfxge_port_fini(sc);
902
903 /* Clean up event processing state. */
904 sfxge_ev_fini(sc);
905
906 /* Clean up interrupts. */
907 sfxge_intr_fini(sc);
908
909 /* Tear down common code subsystems. */
910 efx_nic_reset(sc->enp);
911 efx_vpd_fini(sc->enp);
912 efx_nvram_fini(sc->enp);
913 efx_nic_unprobe(sc->enp);
914
915 /* Tear down MCDI. */
916 sfxge_mcdi_fini(sc);
917
918 /* Destroy common code context. */
919 enp = sc->enp;
920 sc->enp = NULL;
921 efx_nic_destroy(enp);
922
923 /* Free DMA memory. */
924 sfxge_dma_fini(sc);
925
926 /* Free mapped BARs. */
927 sfxge_bar_fini(sc);
928
929 (void) pci_disable_busmaster(sc->dev);
930
931 taskqueue_drain(taskqueue_thread, &sc->task_reset);
932
933 /* Destroy the softc lock. */
934 SFXGE_ADAPTER_LOCK_DESTROY(sc);
935 }
936
937 static int
938 sfxge_vpd_handler(SYSCTL_HANDLER_ARGS)
939 {
940 struct sfxge_softc *sc = arg1;
941 efx_vpd_value_t value;
942 int rc;
943
944 value.evv_tag = arg2 >> 16;
945 value.evv_keyword = arg2 & 0xffff;
946 if ((rc = efx_vpd_get(sc->enp, sc->vpd_data, sc->vpd_size, &value))
947 != 0)
948 return (rc);
949
950 return (SYSCTL_OUT(req, value.evv_value, value.evv_length));
951 }
952
953 static void
954 sfxge_vpd_try_add(struct sfxge_softc *sc, struct sysctl_oid_list *list,
955 efx_vpd_tag_t tag, const char *keyword)
956 {
957 struct sysctl_ctx_list *ctx = device_get_sysctl_ctx(sc->dev);
958 efx_vpd_value_t value;
959
960 /* Check whether VPD tag/keyword is present */
961 value.evv_tag = tag;
962 value.evv_keyword = EFX_VPD_KEYWORD(keyword[0], keyword[1]);
963 if (efx_vpd_get(sc->enp, sc->vpd_data, sc->vpd_size, &value) != 0)
964 return;
965
966 SYSCTL_ADD_PROC(
967 ctx, list, OID_AUTO, keyword, CTLTYPE_STRING|CTLFLAG_RD,
968 sc, tag << 16 | EFX_VPD_KEYWORD(keyword[0], keyword[1]),
969 sfxge_vpd_handler, "A", "");
970 }
971
972 static int
973 sfxge_vpd_init(struct sfxge_softc *sc)
974 {
975 struct sysctl_ctx_list *ctx = device_get_sysctl_ctx(sc->dev);
976 struct sysctl_oid *vpd_node;
977 struct sysctl_oid_list *vpd_list;
978 char keyword[3];
979 efx_vpd_value_t value;
980 int rc;
981
982 if ((rc = efx_vpd_size(sc->enp, &sc->vpd_size)) != 0) {
983 /*
984 * Unpriviledged functions deny VPD access.
985 * Simply skip VPD in this case.
986 */
987 if (rc == EACCES)
988 goto done;
989 goto fail;
990 }
991 sc->vpd_data = malloc(sc->vpd_size, M_SFXGE, M_WAITOK);
992 if ((rc = efx_vpd_read(sc->enp, sc->vpd_data, sc->vpd_size)) != 0)
993 goto fail2;
994
995 /* Copy ID (product name) into device description, and log it. */
996 value.evv_tag = EFX_VPD_ID;
997 if (efx_vpd_get(sc->enp, sc->vpd_data, sc->vpd_size, &value) == 0) {
998 value.evv_value[value.evv_length] = 0;
999 device_set_desc_copy(sc->dev, value.evv_value);
1000 device_printf(sc->dev, "%s\n", value.evv_value);
1001 }
1002
1003 vpd_node = SYSCTL_ADD_NODE(
1004 ctx, SYSCTL_CHILDREN(device_get_sysctl_tree(sc->dev)),
1005 OID_AUTO, "vpd", CTLFLAG_RD, NULL, "Vital Product Data");
1006 vpd_list = SYSCTL_CHILDREN(vpd_node);
1007
1008 /* Add sysctls for all expected and any vendor-defined keywords. */
1009 sfxge_vpd_try_add(sc, vpd_list, EFX_VPD_RO, "PN");
1010 sfxge_vpd_try_add(sc, vpd_list, EFX_VPD_RO, "EC");
1011 sfxge_vpd_try_add(sc, vpd_list, EFX_VPD_RO, "SN");
1012 keyword[0] = 'V';
1013 keyword[2] = 0;
1014 for (keyword[1] = ''; keyword[1] <= '9'; keyword[1]++)
1015 sfxge_vpd_try_add(sc, vpd_list, EFX_VPD_RO, keyword);
1016 for (keyword[1] = 'A'; keyword[1] <= 'Z'; keyword[1]++)
1017 sfxge_vpd_try_add(sc, vpd_list, EFX_VPD_RO, keyword);
1018
1019 done:
1020 return (0);
1021
1022 fail2:
1023 free(sc->vpd_data, M_SFXGE);
1024 fail:
1025 return (rc);
1026 }
1027
1028 static void
1029 sfxge_vpd_fini(struct sfxge_softc *sc)
1030 {
1031 free(sc->vpd_data, M_SFXGE);
1032 }
1033
1034 static void
1035 sfxge_reset(void *arg, int npending)
1036 {
1037 struct sfxge_softc *sc;
1038 int rc;
1039 unsigned attempt;
1040
1041 (void)npending;
1042
1043 sc = (struct sfxge_softc *)arg;
1044
1045 SFXGE_ADAPTER_LOCK(sc);
1046
1047 if (sc->init_state != SFXGE_STARTED)
1048 goto done;
1049
1050 sfxge_stop(sc);
1051 efx_nic_reset(sc->enp);
1052 for (attempt = 0; attempt < sfxge_restart_attempts; ++attempt) {
1053 if ((rc = sfxge_start(sc)) == 0)
1054 goto done;
1055
1056 device_printf(sc->dev, "start on reset failed (%d)\n", rc);
1057 DELAY(100000);
1058 }
1059
1060 device_printf(sc->dev, "reset failed; interface is now stopped\n");
1061
1062 done:
1063 SFXGE_ADAPTER_UNLOCK(sc);
1064 }
1065
1066 void
1067 sfxge_schedule_reset(struct sfxge_softc *sc)
1068 {
1069 taskqueue_enqueue(taskqueue_thread, &sc->task_reset);
1070 }
1071
1072 static int
1073 sfxge_attach(device_t dev)
1074 {
1075 struct sfxge_softc *sc;
1076 struct ifnet *ifp;
1077 int error;
1078
1079 sc = device_get_softc(dev);
1080 sc->dev = dev;
1081
1082 /* Allocate ifnet. */
1083 ifp = if_alloc(IFT_ETHER);
1084 if (ifp == NULL) {
1085 device_printf(dev, "Couldn't allocate ifnet\n");
1086 error = ENOMEM;
1087 goto fail;
1088 }
1089 sc->ifnet = ifp;
1090
1091 /* Initialize hardware. */
1092 DBGPRINT(sc->dev, "create nic");
1093 if ((error = sfxge_create(sc)) != 0)
1094 goto fail2;
1095
1096 /* Create the ifnet for the port. */
1097 DBGPRINT(sc->dev, "init ifnet");
1098 if ((error = sfxge_ifnet_init(ifp, sc)) != 0)
1099 goto fail3;
1100
1101 DBGPRINT(sc->dev, "init vpd");
1102 if ((error = sfxge_vpd_init(sc)) != 0)
1103 goto fail4;
1104
1105 /*
1106 * NIC is initialized inside sfxge_create() and kept inialized
1107 * to be able to initialize port to discover media types in
1108 * sfxge_ifnet_init().
1109 */
1110 efx_nic_fini(sc->enp);
1111
1112 sc->init_state = SFXGE_REGISTERED;
1113
1114 DBGPRINT(sc->dev, "success");
1115 return (0);
1116
1117 fail4:
1118 sfxge_ifnet_fini(ifp);
1119 fail3:
1120 efx_nic_fini(sc->enp);
1121 sfxge_destroy(sc);
1122
1123 fail2:
1124 if_free(sc->ifnet);
1125
1126 fail:
1127 DBGPRINT(sc->dev, "failed %d", error);
1128 return (error);
1129 }
1130
1131 static int
1132 sfxge_detach(device_t dev)
1133 {
1134 struct sfxge_softc *sc;
1135
1136 sc = device_get_softc(dev);
1137
1138 sfxge_vpd_fini(sc);
1139
1140 /* Destroy the ifnet. */
1141 sfxge_ifnet_fini(sc->ifnet);
1142
1143 /* Tear down hardware. */
1144 sfxge_destroy(sc);
1145
1146 return (0);
1147 }
1148
1149 static int
1150 sfxge_probe(device_t dev)
1151 {
1152 uint16_t pci_vendor_id;
1153 uint16_t pci_device_id;
1154 efx_family_t family;
1155 int rc;
1156
1157 pci_vendor_id = pci_get_vendor(dev);
1158 pci_device_id = pci_get_device(dev);
1159
1160 DBGPRINT(dev, "PCI ID %04x:%04x", pci_vendor_id, pci_device_id);
1161 rc = efx_family(pci_vendor_id, pci_device_id, &family);
1162 if (rc != 0) {
1163 DBGPRINT(dev, "efx_family fail %d", rc);
1164 return (ENXIO);
1165 }
1166
1167 if (family == EFX_FAMILY_SIENA) {
1168 device_set_desc(dev, "Solarflare SFC9000 family");
1169 return (0);
1170 }
1171
1172 if (family == EFX_FAMILY_HUNTINGTON) {
1173 device_set_desc(dev, "Solarflare SFC9100 family");
1174 return (0);
1175 }
1176
1177 if (family == EFX_FAMILY_MEDFORD) {
1178 device_set_desc(dev, "Solarflare SFC9200 family");
1179 return (0);
1180 }
1181
1182 DBGPRINT(dev, "impossible controller family %d", family);
1183 return (ENXIO);
1184 }
1185
1186 static device_method_t sfxge_methods[] = {
1187 DEVMETHOD(device_probe, sfxge_probe),
1188 DEVMETHOD(device_attach, sfxge_attach),
1189 DEVMETHOD(device_detach, sfxge_detach),
1190
1191 DEVMETHOD_END
1192 };
1193
1194 static devclass_t sfxge_devclass;
1195
1196 static driver_t sfxge_driver = {
1197 "sfxge",
1198 sfxge_methods,
1199 sizeof(struct sfxge_softc)
1200 };
1201
1202 DRIVER_MODULE(sfxge, pci, sfxge_driver, sfxge_devclass, 0, 0);
Cache object: 8c0e6a54a3910022c11cafbf1fe9e884
|