2 * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
4 * Copyright (c) 2011 Chelsio Communications, Inc.
6 * Written by: Navdeep Parhar <np@FreeBSD.org>
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 #ifndef __T4_ADAPTER_H__
34 #define __T4_ADAPTER_H__
36 #include <sys/kernel.h>
38 #include <sys/counter.h>
40 #include <sys/types.h>
42 #include <sys/malloc.h>
43 #include <sys/rwlock.h>
48 #include <dev/pci/pcivar.h>
49 #include <dev/pci/pcireg.h>
50 #include <machine/bus.h>
51 #include <sys/socket.h>
52 #include <sys/sysctl.h>
53 #include <net/ethernet.h>
55 #include <net/if_var.h>
56 #include <net/if_media.h>
58 #include <netinet/in.h>
59 #include <netinet/tcp_lro.h>
63 #include "common/t4_msg.h"
64 #include "firmware/t4fw_interface.h"
66 #define KTR_CXGBE KTR_SPARE3
67 MALLOC_DECLARE(M_CXGBE);
68 #define CXGBE_UNIMPLEMENTED(s) \
69 panic("%s (%s, line %d) not implemented yet.", s, __FILE__, __LINE__)
71 #if defined(__i386__) || defined(__amd64__)
75 __asm volatile("prefetcht0 %0" :: "m" (*(unsigned long *)x));
78 #define prefetch(x) __builtin_prefetch(x)
81 #ifndef SYSCTL_ADD_UQUAD
82 #define SYSCTL_ADD_UQUAD SYSCTL_ADD_QUAD
83 #define sysctl_handle_64 sysctl_handle_quad
84 #define CTLTYPE_U64 CTLTYPE_QUAD
87 SYSCTL_DECL(_hw_cxgbe);
90 typedef struct adapter adapter_t;
94 * All ingress queues use this entry size. Note that the firmware event
95 * queue and any iq expecting CPL_RX_PKT in the descriptor needs this to
100 /* Default queue sizes for all kinds of ingress queues */
104 /* All egress queues use this entry size */
107 /* Default queue sizes for all kinds of egress queues */
108 CTRL_EQ_QSIZE = 1024,
111 #if MJUMPAGESIZE != MCLBYTES
112 SW_ZONE_SIZES = 4, /* cluster, jumbop, jumbo9k, jumbo16k */
114 SW_ZONE_SIZES = 3, /* cluster, jumbo9k, jumbo16k */
116 CL_METADATA_SIZE = CACHE_LINE_SIZE,
118 SGE_MAX_WR_NDESC = SGE_MAX_WR_LEN / EQ_ESIZE, /* max WR size in desc */
120 TX_SGL_SEGS_TSO = 38,
122 TX_SGL_SEGS_VM_TSO = 37,
123 TX_SGL_SEGS_EO_TSO = 30, /* XXX: lower for IPv6. */
124 TX_SGL_SEGS_VXLAN_TSO = 37,
125 TX_WR_FLITS = SGE_MAX_WR_LEN / 8
129 /* adapter intr_type */
130 INTR_INTX = (1 << 0),
136 XGMAC_MTU = (1 << 0),
137 XGMAC_PROMISC = (1 << 1),
138 XGMAC_ALLMULTI = (1 << 2),
139 XGMAC_VLANEX = (1 << 3),
140 XGMAC_UCADDR = (1 << 4),
141 XGMAC_MCADDRS = (1 << 5),
147 /* flags understood by begin_synchronized_op */
148 HOLD_LOCK = (1 << 0),
152 /* flags understood by end_synchronized_op */
153 LOCK_HELD = HOLD_LOCK,
158 FULL_INIT_DONE = (1 << 0),
160 CHK_MBOX_ACCESS = (1 << 2),
161 MASTER_PF = (1 << 3),
162 ADAP_SYSCTL_CTX = (1 << 4),
164 BUF_PACKING_OK = (1 << 6),
166 KERN_TLS_OK = (1 << 8),
168 CXGBE_BUSY = (1 << 9),
171 HAS_TRACEQ = (1 << 3),
172 FIXED_IFMEDIA = (1 << 4), /* ifmedia list doesn't change. */
176 VI_INIT_DONE = (1 << 1),
177 VI_SYSCTL_CTX = (1 << 2),
178 TX_USES_VM_WR = (1 << 3),
180 /* adapter debug_flags */
181 DF_DUMP_MBOX = (1 << 0), /* Log all mbox cmd/rpl. */
182 DF_LOAD_FW_ANYTIME = (1 << 1), /* Allow LOAD_FW after init */
183 DF_DISABLE_TCB_CACHE = (1 << 2), /* Disable TCB cache (T6+) */
184 DF_DISABLE_CFG_RETRY = (1 << 3), /* Disable fallback config */
185 DF_VERBOSE_SLOWINTR = (1 << 4), /* Chatty slow intr handler */
188 #define IS_DOOMED(vi) ((vi)->flags & DOOMED)
189 #define SET_DOOMED(vi) do {(vi)->flags |= DOOMED;} while (0)
190 #define IS_BUSY(sc) ((sc)->flags & CXGBE_BUSY)
191 #define SET_BUSY(sc) do {(sc)->flags |= CXGBE_BUSY;} while (0)
192 #define CLR_BUSY(sc) do {(sc)->flags &= ~CXGBE_BUSY;} while (0)
196 struct port_info *pi;
197 struct adapter *adapter;
200 struct pfil_head *pfil;
205 uint16_t *rss, *nm_rss;
206 uint16_t viid; /* opaque VI identifier */
210 int16_t xact_addr_filt;/* index of exact MAC address filter */
211 uint16_t rss_size; /* size of VI's RSS table slice */
212 uint16_t rss_base; /* start of VI's RSS table slice */
218 /* These need to be int as they are used in sysctl */
219 int ntxq; /* # of tx queues */
220 int first_txq; /* index of first tx queue */
221 int rsrv_noflowq; /* Reserve queue 0 for non-flowid packets */
222 int nrxq; /* # of rx queues */
223 int first_rxq; /* index of first rx queue */
224 int nofldtxq; /* # of offload tx queues */
225 int first_ofld_txq; /* index of first offload tx queue */
226 int nofldrxq; /* # of offload rx queues */
227 int first_ofld_rxq; /* index of first offload rx queue */
239 struct timeval last_refreshed;
240 struct fw_vi_stats_vf stats;
243 struct sysctl_ctx_list ctx; /* from ifconfig up to driver detach */
245 uint8_t hw_addr[ETHER_ADDR_LEN]; /* factory MAC address, won't change */
248 struct tx_ch_rl_params {
249 enum fw_sched_params_rate ratemode; /* %port (REL) or kbps (ABS) */
254 CLRL_USER = (1 << 0), /* allocated manually. */
255 CLRL_SYNC = (1 << 1), /* sync hw update in progress. */
256 CLRL_ASYNC = (1 << 2), /* async hw update requested. */
257 CLRL_ERR = (1 << 3), /* last hw setup ended in error. */
260 struct tx_cl_rl_params {
263 enum fw_sched_params_rate ratemode; /* %port REL or ABS value */
264 enum fw_sched_params_unit rateunit; /* kbps or pps (when ABS) */
265 enum fw_sched_params_mode mode; /* aggr or per-flow */
271 /* Tx scheduler parameters for a channel/port */
272 struct tx_sched_params {
273 /* Channel Rate Limiter */
274 struct tx_ch_rl_params ch_rl;
279 /* Class Rate Limiter (including the default pktsize and burstsize). */
282 struct tx_cl_rl_params cl_rl[];
287 struct adapter *adapter;
293 bool vxlan_tcam_entry;
295 struct tx_sched_params *sched_params;
301 uint8_t lport; /* associated offload logical port */
307 uint8_t mps_bg_map; /* rx MPS buffer group bitmap */
308 uint8_t rx_e_chan_map; /* rx TP e-channel bitmap */
310 struct link_config link_cfg;
311 struct ifmedia media;
313 struct timeval last_refreshed;
314 struct port_stats stats;
315 u_int tnl_cong_drops;
316 u_int tx_parse_error;
317 u_long tx_toe_tls_records;
318 u_long tx_toe_tls_octets;
319 u_long rx_toe_tls_records;
320 u_long rx_toe_tls_octets;
325 #define IS_MAIN_VI(vi) ((vi) == &((vi)->pi->vi[0]))
327 struct cluster_metadata {
335 uint16_t nmbuf; /* # of driver originated mbufs with ref on cluster */
336 int16_t moff; /* offset of metadata from cl */
345 struct mbuf *m; /* m_nextpkt linked chain of frames */
346 uint8_t desc_used; /* # of hardware descriptors used by the WR */
350 #define IQ_PAD (IQ_ESIZE - sizeof(struct rsp_ctrl) - sizeof(struct rss_header))
352 struct rss_header rss;
357 CTASSERT(sizeof(struct iq_desc) == IQ_ESIZE);
361 IQ_ALLOCATED = (1 << 0), /* firmware resources allocated */
362 IQ_HAS_FL = (1 << 1), /* iq associated with a freelist */
363 IQ_RX_TIMESTAMP = (1 << 2), /* provide the SGE rx timestamp */
364 IQ_LRO_ENABLED = (1 << 3), /* iq is an eth rxq with LRO enabled */
365 IQ_ADJ_CREDIT = (1 << 4), /* hw is off by 1 credit for this iq */
372 /* netmap related flags */
379 CPL_COOKIE_RESERVED = 0,
384 CPL_COOKIE_HASHFILTER,
388 NUM_CPL_COOKIES = 8 /* Limited by M_COOKIE. Do not increase. */
393 typedef int (*cpl_handler_t)(struct sge_iq *, const struct rss_header *,
395 typedef int (*an_handler_t)(struct sge_iq *, const struct rsp_ctrl *);
396 typedef int (*fw_msg_handler_t)(struct adapter *, const __be64 *);
399 * Ingress Queue: T4 is producer, driver is consumer.
404 struct adapter *adapter;
405 struct iq_desc *desc; /* KVA of descriptor ring */
406 int8_t intr_pktc_idx; /* packet count threshold index */
407 uint8_t gen; /* generation bit */
408 uint8_t intr_params; /* interrupt holdoff parameters */
409 uint8_t intr_next; /* XXX: holdoff for next interrupt */
410 uint16_t qsize; /* size (# of entries) of the queue */
411 uint16_t sidx; /* index of the entry with the status page */
412 uint16_t cidx; /* consumer index */
413 uint16_t cntxt_id; /* SGE context id for the iq */
414 uint16_t abs_id; /* absolute SGE id for the iq */
416 STAILQ_ENTRY(sge_iq) link;
418 bus_dma_tag_t desc_tag;
419 bus_dmamap_t desc_map;
420 bus_addr_t ba; /* bus address of descriptor ring */
429 EQ_TYPEMASK = 0x3, /* 2 lsbits hold the type (see above) */
430 EQ_ALLOCATED = (1 << 2), /* firmware resources allocated */
431 EQ_ENABLED = (1 << 3), /* open for business */
432 EQ_QFLUSH = (1 << 4), /* if_qflush in progress */
435 /* Listed in order of preference. Update t4_sysctls too if you change these */
436 enum {DOORBELL_UDB, DOORBELL_WCWR, DOORBELL_UDBWC, DOORBELL_KDB};
439 * Egress Queue: driver is producer, T4 is consumer.
441 * Note: A free list is an egress queue (driver produces the buffers and T4
442 * consumes them) but it's special enough to have its own struct (see sge_fl).
445 unsigned int flags; /* MUST be first */
446 unsigned int cntxt_id; /* SGE context id for the eq */
447 unsigned int abs_id; /* absolute SGE id for the eq */
450 struct tx_desc *desc; /* KVA of descriptor ring */
452 volatile uint32_t *udb; /* KVA of doorbell (lies within BAR2) */
453 u_int udb_qid; /* relative qid within the doorbell page */
454 uint16_t sidx; /* index of the entry with the status page */
455 uint16_t cidx; /* consumer idx (desc idx) */
456 uint16_t pidx; /* producer idx (desc idx) */
457 uint16_t equeqidx; /* EQUEQ last requested at this pidx */
458 uint16_t dbidx; /* pidx of the most recent doorbell */
459 uint16_t iqid; /* iq that gets egr_update for the eq */
460 uint8_t tx_chan; /* tx channel used by the eq */
461 volatile u_int equiq; /* EQUIQ outstanding */
463 bus_dma_tag_t desc_tag;
464 bus_dmamap_t desc_map;
465 bus_addr_t ba; /* bus address of descriptor ring */
470 uma_zone_t zone; /* zone that this cluster comes from */
471 uint16_t size1; /* same as size of cluster: 2K/4K/9K/16K.
472 * hwsize[hwidx1] = size1. No spare. */
473 uint16_t size2; /* hwsize[hwidx2] = size2.
474 * spare in cluster = size1 - size2. */
475 int8_t hwidx1; /* SGE bufsize idx for size1 */
476 int8_t hwidx2; /* SGE bufsize idx for size2 */
477 uint8_t type; /* EXT_xxx type of the cluster */
483 MEMWIN0_APERTURE = 2048,
484 MEMWIN0_BASE = 0x1b800,
486 MEMWIN1_APERTURE = 32768,
487 MEMWIN1_BASE = 0x28000,
489 MEMWIN2_APERTURE_T4 = 65536,
490 MEMWIN2_BASE_T4 = 0x30000,
492 MEMWIN2_APERTURE_T5 = 128 * 1024,
493 MEMWIN2_BASE_T5 = 0x60000,
497 struct rwlock mw_lock __aligned(CACHE_LINE_SIZE);
498 uint32_t mw_base; /* constant after setup_memwin */
499 uint32_t mw_aperture; /* ditto */
500 uint32_t mw_curpos; /* protected by mw_lock */
504 FL_STARVING = (1 << 0), /* on the adapter's list of starving fl's */
505 FL_DOOMED = (1 << 1), /* about to be destroyed */
506 FL_BUF_PACKING = (1 << 2), /* buffer packing enabled */
507 FL_BUF_RESUME = (1 << 3), /* resume from the middle of the frame */
510 #define FL_RUNNING_LOW(fl) \
511 (IDXDIFF(fl->dbidx * 8, fl->cidx, fl->sidx * 8) <= fl->lowat)
512 #define FL_NOT_RUNNING_LOW(fl) \
513 (IDXDIFF(fl->dbidx * 8, fl->cidx, fl->sidx * 8) >= 2 * fl->lowat)
517 __be64 *desc; /* KVA of descriptor ring, ptr to addresses */
518 struct fl_sdesc *sdesc; /* KVA of software descriptor ring */
519 uint16_t zidx; /* refill zone idx */
521 uint16_t lowat; /* # of buffers <= this means fl needs help */
523 uint16_t buf_boundary;
525 /* The 16b idx all deal with hw descriptors */
526 uint16_t dbidx; /* hw pidx after last doorbell */
527 uint16_t sidx; /* index of status page */
528 volatile uint16_t hw_cidx;
530 /* The 32b idx are all buffer idx, not hardware descriptor idx */
531 uint32_t cidx; /* consumer index */
532 uint32_t pidx; /* producer index */
535 u_int rx_offset; /* offset in fl buf (when buffer packing) */
536 volatile uint32_t *udb;
538 uint64_t cl_allocated; /* # of clusters allocated */
539 uint64_t cl_recycled; /* # of clusters recycled */
540 uint64_t cl_fast_recycled; /* # of clusters recycled (fast) */
542 /* These 3 are valid when FL_BUF_RESUME is set, stale otherwise. */
547 uint16_t qsize; /* # of hw descriptors (status page included) */
548 uint16_t cntxt_id; /* SGE context id for the freelist */
549 TAILQ_ENTRY(sge_fl) link; /* All starving freelists */
550 bus_dma_tag_t desc_tag;
551 bus_dmamap_t desc_map;
553 bus_addr_t ba; /* bus address of descriptor ring */
559 uint8_t wr_type; /* type 0 or type 1 */
560 uint8_t npkt; /* # of packets in this work request */
561 uint8_t len16; /* # of 16B pieces used by this work request */
562 uint8_t score; /* 1-10. coalescing attempted if score > 3 */
563 uint8_t max_npkt; /* maximum number of packets allowed */
564 uint16_t plen; /* total payload (sum of all packets) */
566 /* straight from fw_eth_tx_pkts_vm_wr. */
575 /* txq: SGE egress queue + what's needed for Ethernet NIC */
577 struct sge_eq eq; /* MUST be first */
579 struct ifnet *ifp; /* the interface this txq belongs to */
580 struct mp_ring *r; /* tx software ring */
581 struct tx_sdesc *sdesc; /* KVA of software descriptor ring */
583 __be32 cpl_ctrl0; /* for convenience */
584 int tc_idx; /* traffic class */
587 struct task tx_reclaim_task;
588 /* stats for common events first */
590 uint64_t txcsum; /* # of times hardware assisted with checksum */
591 uint64_t tso_wrs; /* # of TSO work requests */
592 uint64_t vlan_insertion;/* # of times VLAN tag was inserted */
593 uint64_t imm_wrs; /* # of work requests with immediate data */
594 uint64_t sgl_wrs; /* # of work requests with direct SGL */
595 uint64_t txpkt_wrs; /* # of txpkt work requests (not coalesced) */
596 uint64_t txpkts0_wrs; /* # of type0 coalesced tx work requests */
597 uint64_t txpkts1_wrs; /* # of type1 coalesced tx work requests */
598 uint64_t txpkts0_pkts; /* # of frames in type0 coalesced tx WRs */
599 uint64_t txpkts1_pkts; /* # of frames in type1 coalesced tx WRs */
600 uint64_t raw_wrs; /* # of raw work requests (alloc_wr_mbuf) */
601 uint64_t vxlan_tso_wrs; /* # of VXLAN TSO work requests */
602 uint64_t vxlan_txcsum;
604 uint64_t kern_tls_records;
605 uint64_t kern_tls_short;
606 uint64_t kern_tls_partial;
607 uint64_t kern_tls_full;
608 uint64_t kern_tls_octets;
609 uint64_t kern_tls_waste;
610 uint64_t kern_tls_options;
611 uint64_t kern_tls_header;
612 uint64_t kern_tls_fin;
613 uint64_t kern_tls_fin_short;
614 uint64_t kern_tls_cbc;
615 uint64_t kern_tls_gcm;
617 /* stats for not-that-common events */
619 /* Optional scratch space for constructing work requests. */
620 uint8_t ss[SGE_MAX_WR_LEN] __aligned(16);
621 } __aligned(CACHE_LINE_SIZE);
623 /* rxq: SGE ingress queue + SGE free list + miscellaneous items */
625 struct sge_iq iq; /* MUST be first */
626 struct sge_fl fl; /* MUST follow iq */
628 struct ifnet *ifp; /* the interface this rxq belongs to */
629 struct lro_ctrl lro; /* LRO state */
631 /* stats for common events first */
633 uint64_t rxcsum; /* # of times hardware assisted with checksum */
634 uint64_t vlan_extraction;/* # of times VLAN tag was extracted */
635 uint64_t vxlan_rxcsum;
637 /* stats for not-that-common events */
639 } __aligned(CACHE_LINE_SIZE);
641 static inline struct sge_rxq *
642 iq_to_rxq(struct sge_iq *iq)
645 return (__containerof(iq, struct sge_rxq, iq));
649 /* ofld_rxq: SGE ingress queue + SGE free list + miscellaneous items */
650 struct sge_ofld_rxq {
651 struct sge_iq iq; /* MUST be first */
652 struct sge_fl fl; /* MUST follow iq */
653 } __aligned(CACHE_LINE_SIZE);
655 static inline struct sge_ofld_rxq *
656 iq_to_ofld_rxq(struct sge_iq *iq)
659 return (__containerof(iq, struct sge_ofld_rxq, iq));
663 STAILQ_ENTRY(wrqe) link;
666 char wr[] __aligned(16);
670 TAILQ_ENTRY(wrq_cookie) link;
676 * wrq: SGE egress queue that is given prebuilt work requests. Both the control
677 * and offload tx queues are of this type.
680 struct sge_eq eq; /* MUST be first */
682 struct adapter *adapter;
683 struct task wrq_tx_task;
685 /* Tx desc reserved but WR not "committed" yet. */
686 TAILQ_HEAD(wrq_incomplete_wrs , wrq_cookie) incomplete_wrs;
688 /* List of WRs ready to go out as soon as descriptors are available. */
689 STAILQ_HEAD(, wrqe) wr_list;
693 /* stats for common events first */
695 uint64_t tx_wrs_direct; /* # of WRs written directly to desc ring. */
696 uint64_t tx_wrs_ss; /* # of WRs copied from scratch space. */
697 uint64_t tx_wrs_copied; /* # of WRs queued and copied to desc ring. */
699 /* stats for not-that-common events */
702 * Scratch space for work requests that wrap around after reaching the
703 * status page, and some information about the last WR that used it.
707 uint8_t ss[SGE_MAX_WR_LEN];
709 } __aligned(CACHE_LINE_SIZE);
711 #define INVALID_NM_RXQ_CNTXT_ID ((uint16_t)(-1))
713 /* Items used by the driver rx ithread are in this cacheline. */
714 volatile int nm_state __aligned(CACHE_LINE_SIZE); /* NM_OFF, NM_ON, or NM_BUSY */
715 u_int nid; /* netmap ring # for this queue */
718 struct iq_desc *iq_desc;
720 uint16_t iq_cntxt_id;
726 /* Items used by netmap rxsync are in this cacheline. */
727 __be64 *fl_desc __aligned(CACHE_LINE_SIZE);
728 uint16_t fl_cntxt_id;
730 uint32_t fl_sidx2; /* copy of fl_sidx */
733 u_int fl_db_threshold; /* in descriptors */
737 * fl_cidx is used by both the ithread and rxsync, the rest are not used
738 * in the rx fast path.
740 uint32_t fl_cidx __aligned(CACHE_LINE_SIZE);
742 bus_dma_tag_t iq_desc_tag;
743 bus_dmamap_t iq_desc_map;
747 bus_dma_tag_t fl_desc_tag;
748 bus_dmamap_t fl_desc_map;
752 #define INVALID_NM_TXQ_CNTXT_ID ((u_int)(-1))
754 struct tx_desc *desc;
758 uint16_t equiqidx; /* EQUIQ last requested at this pidx */
759 uint16_t equeqidx; /* EQUEQ last requested at this pidx */
760 uint16_t dbidx; /* pidx of the most recent doorbell */
762 volatile uint32_t *udb;
765 __be32 cpl_ctrl0; /* for convenience */
766 __be32 op_pkd; /* ditto */
767 u_int nid; /* netmap ring # for this queue */
769 /* infrequently used items after this */
771 bus_dma_tag_t desc_tag;
772 bus_dmamap_t desc_map;
775 } __aligned(CACHE_LINE_SIZE);
778 int nrxq; /* total # of Ethernet rx queues */
779 int ntxq; /* total # of Ethernet tx queues */
780 int nofldrxq; /* total # of TOE rx queues */
781 int nofldtxq; /* total # of TOE tx queues */
782 int nnmrxq; /* total # of netmap rx queues */
783 int nnmtxq; /* total # of netmap tx queues */
784 int niq; /* total # of ingress queues */
785 int neq; /* total # of egress queues */
787 struct sge_iq fwq; /* Firmware event queue */
788 struct sge_wrq *ctrlq; /* Control queues */
789 struct sge_txq *txq; /* NIC tx queues */
790 struct sge_rxq *rxq; /* NIC rx queues */
791 struct sge_wrq *ofld_txq; /* TOE tx queues */
792 struct sge_ofld_rxq *ofld_rxq; /* TOE rx queues */
793 struct sge_nm_txq *nm_txq; /* netmap tx queues */
794 struct sge_nm_rxq *nm_rxq; /* netmap rx queues */
796 uint16_t iq_start; /* first cntxt_id */
797 uint16_t iq_base; /* first abs_id */
798 int eq_start; /* first cntxt_id */
799 int eq_base; /* first abs_id */
800 struct sge_iq **iqmap; /* iq->cntxt_id to iq mapping */
801 struct sge_eq **eqmap; /* eq->cntxt_id to eq mapping */
804 struct rx_buf_info rx_buf_info[SW_ZONE_SIZES];
808 const char *nexus_name;
809 const char *ifnet_name;
810 const char *vi_ifnet_name;
811 const char *pf03_drv_name;
812 const char *vf_nexus_name;
813 const char *vf_ifnet_name;
819 SLIST_ENTRY(adapter) link;
822 const struct devnames *names;
824 /* PCIe register resources */
826 struct resource *regs_res;
828 struct resource *msix_res;
829 bus_space_handle_t bh;
833 struct resource *udbs_res;
834 volatile uint8_t *udbs_base;
838 unsigned int vpd_busy;
839 unsigned int vpd_flag;
841 /* Interrupt information */
845 struct resource *res;
849 struct sge_nm_rxq *nm_rxq;
850 } __aligned(CACHE_LINE_SIZE) *irq;
852 int sge_kdoorbell_reg;
854 bus_dma_tag_t dmat; /* Parent DMA tag */
861 u_int vxlan_refcount;
865 struct taskqueue *tq[MAX_NCHAN]; /* General purpose taskqueues */
866 struct task async_event_task;
867 struct port_info *port[MAX_NPORTS];
868 uint8_t chan_map[MAX_NCHAN]; /* channel -> port */
870 struct mtx clip_table_lock;
871 TAILQ_HEAD(, clip_entry) clip_table;
874 void *tom_softc; /* (struct tom_data *) */
875 struct tom_tunables tt;
876 struct t4_offload_policy *policy;
877 struct rwlock policy_lock;
879 void *iwarp_softc; /* (struct c4iw_dev *) */
880 struct iw_tunables iwt;
881 void *iscsi_ulp_softc; /* (struct cxgbei_data *) */
882 void *ccr_softc; /* (struct ccr_softc *) */
883 struct l2t_data *l2t; /* L2 table */
884 struct smt_data *smt; /* Source MAC Table */
885 struct tid_info tids;
887 struct tls_tunables tlst;
890 int offload_map; /* ports with IFCAP_TOE enabled */
891 int active_ulds; /* ULDs activated on this adapter */
895 char ifp_lockname[16];
897 struct ifnet *ifp; /* tracer ifp */
898 struct ifmedia media;
899 int traceq; /* iq used by all tracers, -1 if none */
900 int tracer_valid; /* bitmap of valid tracers */
901 int tracer_enabled; /* bitmap of enabled tracers */
909 struct adapter_params params;
910 const struct chip_params *chip_params;
911 struct t4_virt_res vres;
923 struct sysctl_ctx_list ctx; /* from adapter_full_init to full_uninit */
928 /* Starving free lists */
929 struct mtx sfl_lock; /* same cache-line as sc_lock? but that's ok */
930 TAILQ_HEAD(, sge_fl) sfl;
931 struct callout sfl_callout;
933 struct mtx reg_lock; /* for indirect register access */
935 struct memwin memwin[NUM_MEMWIN]; /* memory windows */
941 const void *last_op_thr;
947 struct callout ktls_tick;
950 #define ADAPTER_LOCK(sc) mtx_lock(&(sc)->sc_lock)
951 #define ADAPTER_UNLOCK(sc) mtx_unlock(&(sc)->sc_lock)
952 #define ADAPTER_LOCK_ASSERT_OWNED(sc) mtx_assert(&(sc)->sc_lock, MA_OWNED)
953 #define ADAPTER_LOCK_ASSERT_NOTOWNED(sc) mtx_assert(&(sc)->sc_lock, MA_NOTOWNED)
955 #define ASSERT_SYNCHRONIZED_OP(sc) \
956 KASSERT(IS_BUSY(sc) && \
957 (mtx_owned(&(sc)->sc_lock) || sc->last_op_thr == curthread), \
958 ("%s: operation not synchronized.", __func__))
960 #define PORT_LOCK(pi) mtx_lock(&(pi)->pi_lock)
961 #define PORT_UNLOCK(pi) mtx_unlock(&(pi)->pi_lock)
962 #define PORT_LOCK_ASSERT_OWNED(pi) mtx_assert(&(pi)->pi_lock, MA_OWNED)
963 #define PORT_LOCK_ASSERT_NOTOWNED(pi) mtx_assert(&(pi)->pi_lock, MA_NOTOWNED)
965 #define FL_LOCK(fl) mtx_lock(&(fl)->fl_lock)
966 #define FL_TRYLOCK(fl) mtx_trylock(&(fl)->fl_lock)
967 #define FL_UNLOCK(fl) mtx_unlock(&(fl)->fl_lock)
968 #define FL_LOCK_ASSERT_OWNED(fl) mtx_assert(&(fl)->fl_lock, MA_OWNED)
969 #define FL_LOCK_ASSERT_NOTOWNED(fl) mtx_assert(&(fl)->fl_lock, MA_NOTOWNED)
971 #define RXQ_FL_LOCK(rxq) FL_LOCK(&(rxq)->fl)
972 #define RXQ_FL_UNLOCK(rxq) FL_UNLOCK(&(rxq)->fl)
973 #define RXQ_FL_LOCK_ASSERT_OWNED(rxq) FL_LOCK_ASSERT_OWNED(&(rxq)->fl)
974 #define RXQ_FL_LOCK_ASSERT_NOTOWNED(rxq) FL_LOCK_ASSERT_NOTOWNED(&(rxq)->fl)
976 #define EQ_LOCK(eq) mtx_lock(&(eq)->eq_lock)
977 #define EQ_TRYLOCK(eq) mtx_trylock(&(eq)->eq_lock)
978 #define EQ_UNLOCK(eq) mtx_unlock(&(eq)->eq_lock)
979 #define EQ_LOCK_ASSERT_OWNED(eq) mtx_assert(&(eq)->eq_lock, MA_OWNED)
980 #define EQ_LOCK_ASSERT_NOTOWNED(eq) mtx_assert(&(eq)->eq_lock, MA_NOTOWNED)
982 #define TXQ_LOCK(txq) EQ_LOCK(&(txq)->eq)
983 #define TXQ_TRYLOCK(txq) EQ_TRYLOCK(&(txq)->eq)
984 #define TXQ_UNLOCK(txq) EQ_UNLOCK(&(txq)->eq)
985 #define TXQ_LOCK_ASSERT_OWNED(txq) EQ_LOCK_ASSERT_OWNED(&(txq)->eq)
986 #define TXQ_LOCK_ASSERT_NOTOWNED(txq) EQ_LOCK_ASSERT_NOTOWNED(&(txq)->eq)
988 #define for_each_txq(vi, iter, q) \
989 for (q = &vi->adapter->sge.txq[vi->first_txq], iter = 0; \
990 iter < vi->ntxq; ++iter, ++q)
991 #define for_each_rxq(vi, iter, q) \
992 for (q = &vi->adapter->sge.rxq[vi->first_rxq], iter = 0; \
993 iter < vi->nrxq; ++iter, ++q)
994 #define for_each_ofld_txq(vi, iter, q) \
995 for (q = &vi->adapter->sge.ofld_txq[vi->first_ofld_txq], iter = 0; \
996 iter < vi->nofldtxq; ++iter, ++q)
997 #define for_each_ofld_rxq(vi, iter, q) \
998 for (q = &vi->adapter->sge.ofld_rxq[vi->first_ofld_rxq], iter = 0; \
999 iter < vi->nofldrxq; ++iter, ++q)
1000 #define for_each_nm_txq(vi, iter, q) \
1001 for (q = &vi->adapter->sge.nm_txq[vi->first_nm_txq], iter = 0; \
1002 iter < vi->nnmtxq; ++iter, ++q)
1003 #define for_each_nm_rxq(vi, iter, q) \
1004 for (q = &vi->adapter->sge.nm_rxq[vi->first_nm_rxq], iter = 0; \
1005 iter < vi->nnmrxq; ++iter, ++q)
1006 #define for_each_vi(_pi, _iter, _vi) \
1007 for ((_vi) = (_pi)->vi, (_iter) = 0; (_iter) < (_pi)->nvi; \
1010 #define IDXINCR(idx, incr, wrap) do { \
1011 idx = wrap - idx > incr ? idx + incr : incr - (wrap - idx); \
1013 #define IDXDIFF(head, tail, wrap) \
1014 ((head) >= (tail) ? (head) - (tail) : (wrap) - (tail) + (head))
1016 /* One for errors, one for firmware events */
1017 #define T4_EXTRA_INTR 2
1019 /* One for firmware events */
1020 #define T4VF_EXTRA_INTR 1
1023 forwarding_intr_to_fwq(struct adapter *sc)
1026 return (sc->intr_count == 1);
1029 static inline uint32_t
1030 t4_read_reg(struct adapter *sc, uint32_t reg)
1033 return bus_space_read_4(sc->bt, sc->bh, reg);
1037 t4_write_reg(struct adapter *sc, uint32_t reg, uint32_t val)
1040 bus_space_write_4(sc->bt, sc->bh, reg, val);
1043 static inline uint64_t
1044 t4_read_reg64(struct adapter *sc, uint32_t reg)
1048 return bus_space_read_8(sc->bt, sc->bh, reg);
1050 return (uint64_t)bus_space_read_4(sc->bt, sc->bh, reg) +
1051 ((uint64_t)bus_space_read_4(sc->bt, sc->bh, reg + 4) << 32);
1057 t4_write_reg64(struct adapter *sc, uint32_t reg, uint64_t val)
1061 bus_space_write_8(sc->bt, sc->bh, reg, val);
1063 bus_space_write_4(sc->bt, sc->bh, reg, val);
1064 bus_space_write_4(sc->bt, sc->bh, reg + 4, val>> 32);
1069 t4_os_pci_read_cfg1(struct adapter *sc, int reg, uint8_t *val)
1072 *val = pci_read_config(sc->dev, reg, 1);
1076 t4_os_pci_write_cfg1(struct adapter *sc, int reg, uint8_t val)
1079 pci_write_config(sc->dev, reg, val, 1);
1083 t4_os_pci_read_cfg2(struct adapter *sc, int reg, uint16_t *val)
1086 *val = pci_read_config(sc->dev, reg, 2);
1090 t4_os_pci_write_cfg2(struct adapter *sc, int reg, uint16_t val)
1093 pci_write_config(sc->dev, reg, val, 2);
1097 t4_os_pci_read_cfg4(struct adapter *sc, int reg, uint32_t *val)
1100 *val = pci_read_config(sc->dev, reg, 4);
1104 t4_os_pci_write_cfg4(struct adapter *sc, int reg, uint32_t val)
1107 pci_write_config(sc->dev, reg, val, 4);
1110 static inline struct port_info *
1111 adap2pinfo(struct adapter *sc, int idx)
1114 return (sc->port[idx]);
1118 t4_os_set_hw_addr(struct port_info *pi, uint8_t hw_addr[])
1121 bcopy(hw_addr, pi->vi[0].hw_addr, ETHER_ADDR_LEN);
1125 tx_resume_threshold(struct sge_eq *eq)
1128 /* not quite the same as qsize / 4, but this will do. */
1129 return (eq->sidx / 4);
1133 t4_use_ldst(struct adapter *sc)
1137 return (sc->flags & FW_OK || !sc->use_bd);
1144 CH_DUMP_MBOX(struct adapter *sc, int mbox, const int reg,
1145 const char *msg, const __be64 *const p, const bool err)
1148 if (!(sc->debug_flags & DF_DUMP_MBOX) && !err)
1151 log(err ? LOG_ERR : LOG_DEBUG,
1152 "%s: mbox %u %s %016llx %016llx %016llx %016llx "
1153 "%016llx %016llx %016llx %016llx\n",
1154 device_get_nameunit(sc->dev), mbox, msg,
1155 (long long)be64_to_cpu(p[0]), (long long)be64_to_cpu(p[1]),
1156 (long long)be64_to_cpu(p[2]), (long long)be64_to_cpu(p[3]),
1157 (long long)be64_to_cpu(p[4]), (long long)be64_to_cpu(p[5]),
1158 (long long)be64_to_cpu(p[6]), (long long)be64_to_cpu(p[7]));
1160 log(err ? LOG_ERR : LOG_DEBUG,
1161 "%s: mbox %u %s %016llx %016llx %016llx %016llx "
1162 "%016llx %016llx %016llx %016llx\n",
1163 device_get_nameunit(sc->dev), mbox, msg,
1164 (long long)t4_read_reg64(sc, reg),
1165 (long long)t4_read_reg64(sc, reg + 8),
1166 (long long)t4_read_reg64(sc, reg + 16),
1167 (long long)t4_read_reg64(sc, reg + 24),
1168 (long long)t4_read_reg64(sc, reg + 32),
1169 (long long)t4_read_reg64(sc, reg + 40),
1170 (long long)t4_read_reg64(sc, reg + 48),
1171 (long long)t4_read_reg64(sc, reg + 56));
1178 extern int t4_intr_types;
1179 extern int t4_tmr_idx;
1180 extern int t4_pktc_idx;
1181 extern unsigned int t4_qsize_rxq;
1182 extern unsigned int t4_qsize_txq;
1183 extern device_method_t cxgbe_methods[];
1185 int t4_os_find_pci_capability(struct adapter *, int);
1186 int t4_os_pci_save_state(struct adapter *);
1187 int t4_os_pci_restore_state(struct adapter *);
1188 void t4_os_portmod_changed(struct port_info *);
1189 void t4_os_link_changed(struct port_info *);
1190 void t4_iterate(void (*)(struct adapter *, void *), void *);
1191 void t4_init_devnames(struct adapter *);
1192 void t4_add_adapter(struct adapter *);
1193 int t4_detach_common(device_t);
1194 int t4_map_bars_0_and_4(struct adapter *);
1195 int t4_map_bar_2(struct adapter *);
1196 int t4_setup_intr_handlers(struct adapter *);
1197 void t4_sysctls(struct adapter *);
1198 int begin_synchronized_op(struct adapter *, struct vi_info *, int, char *);
1199 void doom_vi(struct adapter *, struct vi_info *);
1200 void end_synchronized_op(struct adapter *, int);
1201 int update_mac_settings(struct ifnet *, int);
1202 int adapter_full_init(struct adapter *);
1203 int adapter_full_uninit(struct adapter *);
1204 uint64_t cxgbe_get_counter(struct ifnet *, ift_counter);
1205 void cxgbe_snd_tag_init(struct cxgbe_snd_tag *, struct ifnet *, int);
1206 int vi_full_init(struct vi_info *);
1207 int vi_full_uninit(struct vi_info *);
1208 void vi_sysctls(struct vi_info *);
1209 void vi_tick(void *);
1210 int rw_via_memwin(struct adapter *, int, uint32_t, uint32_t *, int, int);
1211 int alloc_atid(struct adapter *, void *);
1212 void *lookup_atid(struct adapter *, int);
1213 void free_atid(struct adapter *, int);
1214 void release_tid(struct adapter *, int, struct sge_wrq *);
1215 int cxgbe_media_change(struct ifnet *);
1216 void cxgbe_media_status(struct ifnet *, struct ifmediareq *);
1217 bool t4_os_dump_cimla(struct adapter *, int, bool);
1218 void t4_os_dump_devlog(struct adapter *);
1222 int cxgbe_tls_tag_alloc(struct ifnet *, union if_snd_tag_alloc_params *,
1223 struct m_snd_tag **);
1224 void cxgbe_tls_tag_free(struct m_snd_tag *);
1225 void t6_ktls_modload(void);
1226 void t6_ktls_modunload(void);
1227 int t6_ktls_try(struct ifnet *, struct socket *, struct ktls_session *);
1228 int t6_ktls_parse_pkt(struct mbuf *, int *, int *);
1229 int t6_ktls_write_wr(struct sge_txq *, void *, struct mbuf *, u_int, u_int);
1236 void t4_aes_getdeckey(void *, const void *, unsigned int);
1237 void t4_copy_partial_hash(int, union authctx *, void *);
1238 void t4_init_gmac_hash(const char *, int, char *);
1239 void t4_init_hmac_digest(struct auth_hash *, u_int, const char *, int, char *);
1244 void cxgbe_nm_attach(struct vi_info *);
1245 void cxgbe_nm_detach(struct vi_info *);
1246 void service_nm_rxq(struct sge_nm_rxq *);
1250 void t4_sge_modload(void);
1251 void t4_sge_modunload(void);
1252 uint64_t t4_sge_extfree_refs(void);
1253 void t4_tweak_chip_settings(struct adapter *);
1254 int t4_read_chip_settings(struct adapter *);
1255 int t4_create_dma_tag(struct adapter *);
1256 void t4_sge_sysctls(struct adapter *, struct sysctl_ctx_list *,
1257 struct sysctl_oid_list *);
1258 int t4_destroy_dma_tag(struct adapter *);
1259 int t4_setup_adapter_queues(struct adapter *);
1260 int t4_teardown_adapter_queues(struct adapter *);
1261 int t4_setup_vi_queues(struct vi_info *);
1262 int t4_teardown_vi_queues(struct vi_info *);
1263 void t4_intr_all(void *);
1264 void t4_intr(void *);
1266 void t4_nm_intr(void *);
1267 void t4_vi_intr(void *);
1269 void t4_intr_err(void *);
1270 void t4_intr_evt(void *);
1271 void t4_wrq_tx_locked(struct adapter *, struct sge_wrq *, struct wrqe *);
1272 void t4_update_fl_bufsize(struct ifnet *);
1273 struct mbuf *alloc_wr_mbuf(int, int);
1274 int parse_pkt(struct mbuf **, bool);
1275 void *start_wrq_wr(struct sge_wrq *, int, struct wrq_cookie *);
1276 void commit_wrq_wr(struct sge_wrq *, void *, struct wrq_cookie *);
1277 int tnl_cong(struct port_info *, int);
1278 void t4_register_an_handler(an_handler_t);
1279 void t4_register_fw_msg_handler(int, fw_msg_handler_t);
1280 void t4_register_cpl_handler(int, cpl_handler_t);
1281 void t4_register_shared_cpl_handler(int, cpl_handler_t, int);
1283 int ethofld_transmit(struct ifnet *, struct mbuf *);
1284 void send_etid_flush_wr(struct cxgbe_rate_tag *);
1289 void t4_tracer_modload(void);
1290 void t4_tracer_modunload(void);
1291 void t4_tracer_port_detach(struct adapter *);
1292 int t4_get_tracer(struct adapter *, struct t4_tracer *);
1293 int t4_set_tracer(struct adapter *, struct t4_tracer *);
1294 int t4_trace_pkt(struct sge_iq *, const struct rss_header *, struct mbuf *);
1295 int t5_trace_pkt(struct sge_iq *, const struct rss_header *, struct mbuf *);
1298 int t4_set_sched_class(struct adapter *, struct t4_sched_params *);
1299 int t4_set_sched_queue(struct adapter *, struct t4_sched_queue *);
1300 int t4_init_tx_sched(struct adapter *);
1301 int t4_free_tx_sched(struct adapter *);
1302 void t4_update_tx_sched(struct adapter *);
1303 int t4_reserve_cl_rl_kbps(struct adapter *, int, u_int, int *);
1304 void t4_release_cl_rl(struct adapter *, int, int);
1305 int sysctl_tc(SYSCTL_HANDLER_ARGS);
1306 int sysctl_tc_params(SYSCTL_HANDLER_ARGS);
1308 void t4_init_etid_table(struct adapter *);
1309 void t4_free_etid_table(struct adapter *);
1310 struct cxgbe_rate_tag *lookup_etid(struct adapter *, int);
1311 int cxgbe_rate_tag_alloc(struct ifnet *, union if_snd_tag_alloc_params *,
1312 struct m_snd_tag **);
1313 int cxgbe_rate_tag_modify(struct m_snd_tag *, union if_snd_tag_modify_params *);
1314 int cxgbe_rate_tag_query(struct m_snd_tag *, union if_snd_tag_query_params *);
1315 void cxgbe_rate_tag_free(struct m_snd_tag *);
1316 void cxgbe_rate_tag_free_locked(struct cxgbe_rate_tag *);
1317 void cxgbe_ratelimit_query(struct ifnet *, struct if_ratelimit_query_results *);
1321 int get_filter_mode(struct adapter *, uint32_t *);
1322 int set_filter_mode(struct adapter *, uint32_t);
1323 int get_filter(struct adapter *, struct t4_filter *);
1324 int set_filter(struct adapter *, struct t4_filter *);
1325 int del_filter(struct adapter *, struct t4_filter *);
1326 int t4_filter_rpl(struct sge_iq *, const struct rss_header *, struct mbuf *);
1327 int t4_hashfilter_ao_rpl(struct sge_iq *, const struct rss_header *, struct mbuf *);
1328 int t4_hashfilter_tcb_rpl(struct sge_iq *, const struct rss_header *, struct mbuf *);
1329 int t4_del_hashfilter_rpl(struct sge_iq *, const struct rss_header *, struct mbuf *);
1330 void free_hftid_hash(struct tid_info *);
1332 static inline struct wrqe *
1333 alloc_wrqe(int wr_len, struct sge_wrq *wrq)
1335 int len = offsetof(struct wrqe, wr) + wr_len;
1338 wr = malloc(len, M_CXGBE, M_NOWAIT);
1339 if (__predict_false(wr == NULL))
1341 wr->wr_len = wr_len;
1346 static inline void *
1347 wrtod(struct wrqe *wr)
1349 return (&wr->wr[0]);
1353 free_wrqe(struct wrqe *wr)
1359 t4_wrq_tx(struct adapter *sc, struct wrqe *wr)
1361 struct sge_wrq *wrq = wr->wrq;
1364 t4_wrq_tx_locked(sc, wrq, wr);
1369 read_via_memwin(struct adapter *sc, int idx, uint32_t addr, uint32_t *val,
1373 return (rw_via_memwin(sc, idx, addr, val, len, 0));
1377 write_via_memwin(struct adapter *sc, int idx, uint32_t addr,
1378 const uint32_t *val, int len)
1381 return (rw_via_memwin(sc, idx, addr, (void *)(uintptr_t)val, len, 1));
1384 /* Number of len16 -> number of descriptors */
1386 tx_len16_to_desc(int len16)
1389 return (howmany(len16, EQ_ESIZE / 16));