2 * Copyright (c) 2015-2019 Mellanox Technologies. All rights reserved.
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions
7 * 1. Redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer.
9 * 2. Redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution.
13 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS `AS IS' AND
14 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
16 * ARE DISCLAIMED. IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
17 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
18 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
19 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
20 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
21 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
22 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 #include <net/sff8472.h>
/*
 * mlx5e_create_stats: publish an array of 64-bit counters as sysctl leaves.
 *
 * A read-only node named by buffer (description: Statistics) is added under
 * parent. One read-only UQUAD leaf per counter is then added beneath it.
 * desc holds num string pairs: desc[2 * x] is the leaf name and
 * desc[2 * x + 1] its description. Leaf x is backed by the storage at arg + x.
 *
 * NOTE(review): local declarations and any handling of a NULL node are not
 * visible in this excerpt - confirm against the complete function.
 */
32 mlx5e_create_stats(struct sysctl_ctx_list *ctx,
33 struct sysctl_oid_list *parent, const char *buffer,
34 const char **desc, unsigned num, u64 * arg)
36 struct sysctl_oid *node;
41 node = SYSCTL_ADD_NODE(ctx, parent, OID_AUTO,
42 buffer, CTLFLAG_RD, NULL, "Statistics");
/* One leaf per counter; names and descriptions are interleaved in desc. */
45 for (x = 0; x != num; x++) {
46 SYSCTL_ADD_UQUAD(ctx, SYSCTL_CHILDREN(node), OID_AUTO,
47 desc[2 * x], CTLFLAG_RD, arg + x, desc[2 * x + 1]);
/*
 * mlx5e_ethtool_sync_tx_completion_fact: recompute the upper bound of the TX
 * completion factor and clamp the configured factor to it.
 *
 * The bound is tx_queue_size / (2 * MLX5_SEND_WQE_MAX_WQEBBS) and is written
 * to params_ethtool.tx_completion_fact_max. The configured
 * params_ethtool.tx_completion_fact is then raised to 1 when it is below 1
 * and lowered to the bound when it is above the bound.
 *
 * NOTE(review): the existing comment refers to an overflow guard applied to
 * the bound before it is stored; those statements are not visible in this
 * excerpt - confirm the limits against the complete function.
 */
52 mlx5e_ethtool_sync_tx_completion_fact(struct mlx5e_priv *priv)
55 * Limit the maximum distance between completion events to
56 * half of the currently set TX queue size.
58 * The maximum number of queue entries a single IP packet can
59 * consume is given by MLX5_SEND_WQE_MAX_WQEBBS.
61 * The worst case max value is then given as below:
63 uint64_t max = priv->params_ethtool.tx_queue_size /
64 (2 * MLX5_SEND_WQE_MAX_WQEBBS);
67 * Update the maximum completion factor value in case the
68 * tx_queue_size field changed. Ensure we don't overflow
75 priv->params_ethtool.tx_completion_fact_max = max;
78 * Verify that the current TX completion factor is within the
81 if (priv->params_ethtool.tx_completion_fact < 1)
82 priv->params_ethtool.tx_completion_fact = 1;
83 else if (priv->params_ethtool.tx_completion_fact > max)
84 priv->params_ethtool.tx_completion_fact = max;
/*
 * mlx5e_getmaxrate: read the per traffic class rate limits from the port and
 * cache them in params_ethtool.max_bw_value[].
 *
 * mlx5_query_port_tc_rate_limit() fills one value and one unit per traffic
 * class; its return value is negated into err. For every class index from 0
 * to mlx5_max_tc(mdev) inclusive the cached value becomes:
 *   - value * MLX5E_100MB for MLX5_100_MBPS_UNIT,
 *   - value * MLX5E_1GB in the next branch (its case label is not visible
 *     here; presumably the gigabit unit - confirm),
 *   - 0 for MLX5_BW_NO_LIMIT,
 *   - -1 plus a one-time warning in the remaining branch.
 */
88 mlx5e_getmaxrate(struct mlx5e_priv *priv)
90 struct mlx5_core_dev *mdev = priv->mdev;
91 u8 max_bw_unit[IEEE_8021QAZ_MAX_TCS];
92 u8 max_bw_value[IEEE_8021QAZ_MAX_TCS];
97 err = -mlx5_query_port_tc_rate_limit(mdev, max_bw_value, max_bw_unit);
/* The loop bound is inclusive: mlx5_max_tc() is the highest class index. */
101 for (i = 0; i <= mlx5_max_tc(mdev); i++) {
102 switch (max_bw_unit[i]) {
103 case MLX5_100_MBPS_UNIT:
104 priv->params_ethtool.max_bw_value[i] = max_bw_value[i] * MLX5E_100MB;
107 priv->params_ethtool.max_bw_value[i] = max_bw_value[i] * MLX5E_1GB;
109 case MLX5_BW_NO_LIMIT:
110 priv->params_ethtool.max_bw_value[i] = 0;
113 priv->params_ethtool.max_bw_value[i] = -1;
114 WARN_ONCE(true, "non-supported BW unit");
/*
 * mlx5e_get_max_alloc: load the per traffic class bandwidth shares.
 *
 * mlx5_query_port_tc_bw_alloc() reads the shares straight into
 * params_ethtool.max_bw_share; its return value is negated into err.
 * The default path below sets each of the IEEE_8021QAZ_MAX_TCS entries to
 * 100 / IEEE_8021QAZ_MAX_TCS and writes the table back to the port with
 * mlx5_set_port_tc_bw_alloc().
 *
 * NOTE(review): the condition that selects the default path is not visible
 * in this excerpt (presumably a failed query) - confirm.
 */
124 mlx5e_get_max_alloc(struct mlx5e_priv *priv)
126 struct mlx5_core_dev *mdev = priv->mdev;
131 err = -mlx5_query_port_tc_bw_alloc(mdev, priv->params_ethtool.max_bw_share);
133 /* set default value */
134 for (x = 0; x != IEEE_8021QAZ_MAX_TCS; x++) {
135 priv->params_ethtool.max_bw_share[x] =
136 100 / IEEE_8021QAZ_MAX_TCS;
138 err = -mlx5_set_port_tc_bw_alloc(mdev,
139 priv->params_ethtool.max_bw_share);
/*
 * mlx5e_get_dscp: load the DSCP to priority table and the trust state.
 *
 * The capability test checks three bits: the general qcam_reg capability and
 * the QCAM register bits qpts and qpdpm. The statement executed when any of
 * them is zero is not visible in this excerpt.
 * The table is read into params_ethtool.dscp2prio and the trust state into
 * params_ethtool.trust_state; both query results are negated into err.
 */
147 mlx5e_get_dscp(struct mlx5e_priv *priv)
149 struct mlx5_core_dev *mdev = priv->mdev;
152 if (MLX5_CAP_GEN(mdev, qcam_reg) == 0 ||
153 MLX5_CAP_QCAM_REG(mdev, qpts) == 0 ||
154 MLX5_CAP_QCAM_REG(mdev, qpdpm) == 0)
158 err = -mlx5_query_dscp2prio(mdev, priv->params_ethtool.dscp2prio);
162 err = -mlx5_query_trust_state(mdev, &priv->params_ethtool.trust_state);
/*
 * mlx5e_tc_get_parameters: convert per traffic class rates into the
 * value/unit byte pairs passed to the port rate limit calls.
 *
 * new_bw_value: rates to convert, or NULL to convert the cached
 *               params_ethtool.max_bw_value[] instead.
 * max_bw_value: output, one byte per class; cleared for all
 *               IEEE_8021QAZ_MAX_TCS entries first.
 * max_bw_unit:  output, one unit code per class; cleared likewise.
 *
 * For each class index from 0 to mlx5_max_tc() inclusive:
 *   - first branch (condition not visible here): MLX5_BW_NO_LIMIT,
 *   - rate above 255 * MLX5E_1GB: MLX5_BW_NO_LIMIT,
 *   - rate up to 255 * MLX5E_100MB: howmany(rate, MLX5E_100MB) in
 *     MLX5_100_MBPS_UNIT,
 *   - otherwise: howmany(rate, MLX5E_1GB) in MLX5_GBPS_UNIT.
 * The factor 255 matches the one-byte width of the value output.
 */
171 mlx5e_tc_get_parameters(struct mlx5e_priv *priv,
172 u64 *new_bw_value, u8 *max_bw_value, u8 *max_bw_unit)
174 const u64 upper_limit_mbps = 255 * MLX5E_100MB;
175 const u64 upper_limit_gbps = 255 * MLX5E_1GB;
179 memset(max_bw_value, 0, IEEE_8021QAZ_MAX_TCS);
180 memset(max_bw_unit, 0, IEEE_8021QAZ_MAX_TCS);
182 for (i = 0; i <= mlx5_max_tc(priv->mdev); i++) {
183 temp = (new_bw_value != NULL) ?
184 new_bw_value[i] : priv->params_ethtool.max_bw_value[i];
187 max_bw_unit[i] = MLX5_BW_NO_LIMIT;
188 } else if (temp > upper_limit_gbps) {
189 max_bw_unit[i] = MLX5_BW_NO_LIMIT;
190 } else if (temp <= upper_limit_mbps) {
191 max_bw_value[i] = howmany(temp, MLX5E_100MB);
192 max_bw_unit[i] = MLX5_100_MBPS_UNIT;
194 max_bw_value[i] = howmany(temp, MLX5E_1GB);
195 max_bw_unit[i] = MLX5_GBPS_UNIT;
/*
 * mlx5e_tc_maxrate_handler: sysctl handler for the per traffic class maximum
 * rate array (arg1 is the struct mlx5e_priv).
 *
 * Steps visible here:
 *   1. Export the first max_rates cached rates with SYSCTL_OUT.
 *   2. When a new value is supplied, import max_rates 64-bit rates.
 *   3. Test each imported rate for being a multiple of MLX5E_100MB (the
 *      action taken on a non-multiple is not visible in this excerpt).
 *   4. Convert with mlx5e_tc_get_parameters() and program the port with
 *      mlx5_modify_port_tc_rate_limit(); its result is negated into err.
 *   5. Copy the new rates into the params_ethtool.max_bw_value cache.
 *
 * NOTE(review): step 5 copies sizeof(the whole cache array) while step 2
 * fills only max_rates entries of the local new_bw_value array. Unless the
 * local array is initialised on a line not shown here, entries past
 * max_rates would be copied from indeterminate stack contents - confirm.
 */
201 mlx5e_tc_maxrate_handler(SYSCTL_HANDLER_ARGS)
203 struct mlx5e_priv *priv = arg1;
204 struct mlx5_core_dev *mdev = priv->mdev;
205 u8 max_bw_unit[IEEE_8021QAZ_MAX_TCS];
206 u8 max_bw_value[IEEE_8021QAZ_MAX_TCS];
207 u64 new_bw_value[IEEE_8021QAZ_MAX_TCS];
208 u8 max_rates = mlx5_max_tc(mdev) + 1;
213 err = SYSCTL_OUT(req, priv->params_ethtool.max_bw_value,
214 sizeof(priv->params_ethtool.max_bw_value[0]) * max_rates);
215 if (err || !req->newptr)
217 err = SYSCTL_IN(req, new_bw_value,
218 sizeof(new_bw_value[0]) * max_rates);
222 /* range check input value */
223 for (x = 0; x != max_rates; x++) {
224 if (new_bw_value[x] % MLX5E_100MB) {
230 mlx5e_tc_get_parameters(priv, new_bw_value, max_bw_value, max_bw_unit);
232 err = -mlx5_modify_port_tc_rate_limit(mdev, max_bw_value, max_bw_unit);
236 memcpy(priv->params_ethtool.max_bw_value, new_bw_value,
237 sizeof(priv->params_ethtool.max_bw_value));
/*
 * mlx5e_tc_rate_share_handler: sysctl handler for the per traffic class
 * bandwidth share array (arg1 is the struct mlx5e_priv).
 *
 * The first max_rates cached shares are exported; when a new value is
 * supplied, max_rates bytes are imported. Each imported share is tested
 * against the range 1..100 and the shares are summed. The sum is then tested
 * against the window [100 - max_rates + 1, 100]. The actions taken when a
 * test fails are not visible in this excerpt. The table is written to the
 * port with mlx5_set_port_tc_bw_alloc() (result negated into err) and then
 * copied into params_ethtool.max_bw_share.
 *
 * NOTE(review): the final memcpy uses sizeof(the whole cache array) while
 * only max_rates bytes of the local array were imported - confirm that the
 * remaining local entries are initialised on a line not shown here.
 */
244 mlx5e_tc_rate_share_handler(SYSCTL_HANDLER_ARGS)
246 struct mlx5e_priv *priv = arg1;
247 struct mlx5_core_dev *mdev = priv->mdev;
248 u8 max_bw_share[IEEE_8021QAZ_MAX_TCS];
249 u8 max_rates = mlx5_max_tc(mdev) + 1;
255 err = SYSCTL_OUT(req, priv->params_ethtool.max_bw_share, max_rates);
256 if (err || !req->newptr)
258 err = SYSCTL_IN(req, max_bw_share, max_rates);
262 /* range check input value */
263 for (sum = i = 0; i != max_rates; i++) {
264 if (max_bw_share[i] < 1 || max_bw_share[i] > 100) {
268 sum += max_bw_share[i];
271 /* sum of values should be as close to 100 as possible */
272 if (sum < (100 - max_rates + 1) || sum > 100) {
277 err = -mlx5_set_port_tc_bw_alloc(mdev, max_bw_share);
281 memcpy(priv->params_ethtool.max_bw_share, max_bw_share,
282 sizeof(priv->params_ethtool.max_bw_share));
/*
 * mlx5e_get_prio_tc: load the priority to traffic class mapping.
 *
 * The ets general capability is tested first; the statements executed when
 * it is absent are not visible in this excerpt. For each of the
 * MLX5E_MAX_PRIORITY priorities, mlx5_query_port_prio_tc() stores the
 * traffic class into params_ethtool.prio_tc[i]; its result is negated into
 * err.
 */
289 mlx5e_get_prio_tc(struct mlx5e_priv *priv)
291 struct mlx5_core_dev *mdev = priv->mdev;
296 if (!MLX5_CAP_GEN(priv->mdev, ets)) {
301 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) {
302 err = -mlx5_query_port_prio_tc(mdev, i, priv->params_ethtool.prio_tc + i);
/*
 * mlx5e_prio_to_tc_handler: sysctl handler for the priority to traffic class
 * table (arg1 is the struct mlx5e_priv).
 *
 * The cached table of MLX5E_MAX_PRIORITY bytes is exported; when a new value
 * is supplied the same number of bytes is imported into temp. Every entry is
 * first tested against mlx5_max_tc(mdev) (the action for a larger entry is
 * not visible in this excerpt). In a second pass each entry is compared with
 * the cached one, written to the port with mlx5_set_port_prio_tc() and then
 * stored in the cache.
 */
311 mlx5e_prio_to_tc_handler(SYSCTL_HANDLER_ARGS)
313 struct mlx5e_priv *priv = arg1;
314 struct mlx5_core_dev *mdev = priv->mdev;
315 uint8_t temp[MLX5E_MAX_PRIORITY];
320 err = SYSCTL_OUT(req, priv->params_ethtool.prio_tc, MLX5E_MAX_PRIORITY);
321 if (err || !req->newptr)
323 err = SYSCTL_IN(req, temp, MLX5E_MAX_PRIORITY);
/* Validation pass over the whole table before the port is touched. */
327 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) {
328 if (temp[i] > mlx5_max_tc(mdev)) {
/* Apply pass: entries are compared with the cache before being written. */
334 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) {
335 if (temp[i] == priv->params_ethtool.prio_tc[i])
337 err = -mlx5_set_port_prio_tc(mdev, i, temp[i]);
340 /* update cached value */
341 priv->params_ethtool.prio_tc[i] = temp[i];
/*
 * mlx5e_trust_state_handler: sysctl handler for the QoS trust state
 * (arg1 is the struct mlx5e_priv).
 *
 * The cached trust state is passed through sysctl_handle_8(). Processing
 * continues only when there is no error, a new value was supplied and the
 * value differs from the cache. The switch lists MLX5_QPTS_TRUST_PCP,
 * MLX5_QPTS_TRUST_DSCP and MLX5_QPTS_TRUST_BOTH; the last one additionally
 * tests the qpts_trust_both QCAM feature bit. The new state is written with
 * mlx5_set_trust_state() (result negated into err), cached, and the send
 * queue inline mode is refreshed for both the regular and the rate limit
 * send queues.
 *
 * NOTE(review): the handling of unsupported or unknown values is not visible
 * in this excerpt.
 */
349 mlx5e_trust_state_handler(SYSCTL_HANDLER_ARGS)
351 struct mlx5e_priv *priv = arg1;
352 struct mlx5_core_dev *mdev = priv->mdev;
357 result = priv->params_ethtool.trust_state;
358 err = sysctl_handle_8(oidp, &result, 0, req);
359 if (err || !req->newptr ||
360 result == priv->params_ethtool.trust_state)
364 case MLX5_QPTS_TRUST_PCP:
365 case MLX5_QPTS_TRUST_DSCP:
367 case MLX5_QPTS_TRUST_BOTH:
368 if (!MLX5_CAP_QCAM_FEATURE(mdev, qpts_trust_both)) {
378 err = -mlx5_set_trust_state(mdev, result);
382 priv->params_ethtool.trust_state = result;
384 /* update inline mode */
385 mlx5e_refresh_sq_inline(priv);
387 mlx5e_rl_refresh_sq_inline(&priv->rl);
/*
 * mlx5e_dscp_prio_handler: sysctl handler for one window of the DSCP to
 * priority table (arg1 is the struct mlx5e_priv, arg2 the index of the first
 * table entry of the window).
 *
 * The window is sizeof(dscp2prio) / 8 bytes long and starts at prio_index.
 * It is exported from the cache; when a new value is supplied the complete
 * cached table is copied to a local array and the window is overwritten with
 * the imported bytes. Every entry of the local table is tested against the
 * maximum priority 7 (the action for a larger entry is not visible in this
 * excerpt). The table is written with mlx5_set_dscp2prio() (result negated
 * into err) and then copied back into the cache.
 */
395 mlx5e_dscp_prio_handler(SYSCTL_HANDLER_ARGS)
397 struct mlx5e_priv *priv = arg1;
398 int prio_index = arg2;
399 struct mlx5_core_dev *mdev = priv->mdev;
400 uint8_t dscp2prio[MLX5_MAX_SUPPORTED_DSCP];
405 err = SYSCTL_OUT(req, priv->params_ethtool.dscp2prio + prio_index,
406 sizeof(priv->params_ethtool.dscp2prio) / 8);
407 if (err || !req->newptr)
/* Work on a full copy so that the port always receives a complete table. */
410 memcpy(dscp2prio, priv->params_ethtool.dscp2prio, sizeof(dscp2prio));
411 err = SYSCTL_IN(req, dscp2prio + prio_index, sizeof(dscp2prio) / 8);
414 for (x = 0; x != MLX5_MAX_SUPPORTED_DSCP; x++) {
415 if (dscp2prio[x] > 7) {
420 err = -mlx5_set_dscp2prio(mdev, dscp2prio);
424 /* update local array */
425 memcpy(priv->params_ethtool.dscp2prio, dscp2prio,
426 sizeof(priv->params_ethtool.dscp2prio));
/*
 * MLX5_PARAM_OFFSET(n): byte offset of the member params_ethtool.n inside
 * struct mlx5e_priv. mlx5e_ethtool_handler() switches on the offset of
 * arg[arg2] and uses the offsets of the named members as case labels.
 */
432 #define MLX5_PARAM_OFFSET(n) \
433 __offsetof(struct mlx5e_priv, params_ethtool.n)
/*
 * mlx5e_ethtool_handler: common sysctl handler for the 64-bit configuration
 * parameters in params_ethtool (arg1 is the struct mlx5e_priv, arg2 the
 * index into params_ethtool.arg[]).
 *
 * The current value is passed through sysctl_handle_64(). Processing
 * continues only when there is no error, a new value was supplied and the
 * value differs from the stored one. The new value is stored first and then
 * post-processed in a switch keyed by the member offset of arg[arg2]:
 * the parameter is clamped or normalised and mirrored into priv->params,
 * and the hardware state is updated.
 *
 * was_opened records whether MLX5E_STATE_OPENED is set; mode_modify holds
 * the cq_period_mode_modify capability.
 *
 * NOTE(review): many control statements (lock handling, early exits, the
 * conditions in front of most close/open calls, break statements) are not
 * visible in this excerpt. The comments below describe only the visible
 * lines.
 */
436 mlx5e_ethtool_handler(SYSCTL_HANDLER_ARGS)
438 struct mlx5e_priv *priv = arg1;
445 value = priv->params_ethtool.arg[arg2];
447 error = sysctl_handle_64(oidp, &value, 0, req);
448 if (error || req->newptr == NULL ||
449 value == priv->params_ethtool.arg[arg2])
452 /* assign new value */
453 priv->params_ethtool.arg[arg2] = value;
457 /* check if device is gone */
462 was_opened = test_bit(MLX5E_STATE_OPENED, &priv->state);
463 mode_modify = MLX5_CAP_GEN(priv->mdev, cq_period_mode_modify);
465 switch (MLX5_PARAM_OFFSET(arg[arg2])) {
/*
 * Coalescing time and packet count, RX and TX: the value is clamped to the
 * range 0..MLX5E_FLD_MAX of the matching cqc field, mirrored into
 * priv->params and applied with mlx5e_refresh_channel_params().
 */
466 case MLX5_PARAM_OFFSET(rx_coalesce_usecs):
467 /* import RX coal time */
468 if (priv->params_ethtool.rx_coalesce_usecs < 1)
469 priv->params_ethtool.rx_coalesce_usecs = 0;
470 else if (priv->params_ethtool.rx_coalesce_usecs >
471 MLX5E_FLD_MAX(cqc, cq_period)) {
472 priv->params_ethtool.rx_coalesce_usecs =
473 MLX5E_FLD_MAX(cqc, cq_period);
475 priv->params.rx_cq_moderation_usec =
476 priv->params_ethtool.rx_coalesce_usecs;
478 /* check to avoid down and up the network interface */
480 error = mlx5e_refresh_channel_params(priv);
483 case MLX5_PARAM_OFFSET(rx_coalesce_pkts):
484 /* import RX coal pkts */
485 if (priv->params_ethtool.rx_coalesce_pkts < 1)
486 priv->params_ethtool.rx_coalesce_pkts = 0;
487 else if (priv->params_ethtool.rx_coalesce_pkts >
488 MLX5E_FLD_MAX(cqc, cq_max_count)) {
489 priv->params_ethtool.rx_coalesce_pkts =
490 MLX5E_FLD_MAX(cqc, cq_max_count);
492 priv->params.rx_cq_moderation_pkts =
493 priv->params_ethtool.rx_coalesce_pkts;
495 /* check to avoid down and up the network interface */
497 error = mlx5e_refresh_channel_params(priv);
500 case MLX5_PARAM_OFFSET(tx_coalesce_usecs):
501 /* import TX coal time */
502 if (priv->params_ethtool.tx_coalesce_usecs < 1)
503 priv->params_ethtool.tx_coalesce_usecs = 0;
504 else if (priv->params_ethtool.tx_coalesce_usecs >
505 MLX5E_FLD_MAX(cqc, cq_period)) {
506 priv->params_ethtool.tx_coalesce_usecs =
507 MLX5E_FLD_MAX(cqc, cq_period);
509 priv->params.tx_cq_moderation_usec =
510 priv->params_ethtool.tx_coalesce_usecs;
512 /* check to avoid down and up the network interface */
514 error = mlx5e_refresh_channel_params(priv);
517 case MLX5_PARAM_OFFSET(tx_coalesce_pkts):
518 /* import TX coal pkts */
519 if (priv->params_ethtool.tx_coalesce_pkts < 1)
520 priv->params_ethtool.tx_coalesce_pkts = 0;
521 else if (priv->params_ethtool.tx_coalesce_pkts >
522 MLX5E_FLD_MAX(cqc, cq_max_count)) {
523 priv->params_ethtool.tx_coalesce_pkts =
524 MLX5E_FLD_MAX(cqc, cq_max_count);
526 priv->params.tx_cq_moderation_pkts =
527 priv->params_ethtool.tx_coalesce_pkts;
529 /* check to avoid down and up the network interface */
531 error = mlx5e_refresh_channel_params(priv);
/*
 * Queue sizes: the interface is closed, the size is clamped between the
 * minimum log size and the configured maximum, the log size is stored in
 * priv->params and the sysctl value is rewritten as 1 << log size. The TX
 * case also re-validates the completion factor; the RX case also updates
 * min_rx_wqes. The interface is then reopened.
 */
534 case MLX5_PARAM_OFFSET(tx_queue_size):
535 /* network interface must be down */
537 mlx5e_close_locked(priv->ifp);
539 /* import TX queue size */
540 if (priv->params_ethtool.tx_queue_size <
541 (1 << MLX5E_PARAMS_MINIMUM_LOG_SQ_SIZE)) {
542 priv->params_ethtool.tx_queue_size =
543 (1 << MLX5E_PARAMS_MINIMUM_LOG_SQ_SIZE);
544 } else if (priv->params_ethtool.tx_queue_size >
545 priv->params_ethtool.tx_queue_size_max) {
546 priv->params_ethtool.tx_queue_size =
547 priv->params_ethtool.tx_queue_size_max;
549 /* store actual TX queue size */
550 priv->params.log_sq_size =
551 order_base_2(priv->params_ethtool.tx_queue_size);
552 priv->params_ethtool.tx_queue_size =
553 1 << priv->params.log_sq_size;
555 /* verify TX completion factor */
556 mlx5e_ethtool_sync_tx_completion_fact(priv);
558 /* restart network interface, if any */
560 mlx5e_open_locked(priv->ifp);
563 case MLX5_PARAM_OFFSET(rx_queue_size):
564 /* network interface must be down */
566 mlx5e_close_locked(priv->ifp);
568 /* import RX queue size */
569 if (priv->params_ethtool.rx_queue_size <
570 (1 << MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE)) {
571 priv->params_ethtool.rx_queue_size =
572 (1 << MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE);
573 } else if (priv->params_ethtool.rx_queue_size >
574 priv->params_ethtool.rx_queue_size_max) {
575 priv->params_ethtool.rx_queue_size =
576 priv->params_ethtool.rx_queue_size_max;
578 /* store actual RX queue size */
579 priv->params.log_rq_size =
580 order_base_2(priv->params_ethtool.rx_queue_size);
581 priv->params_ethtool.rx_queue_size =
582 1 << priv->params.log_rq_size;
584 /* update least number of RX WQEs */
585 priv->params.min_rx_wqes = min(
586 priv->params_ethtool.rx_queue_size - 1,
587 MLX5E_PARAMS_DEFAULT_MIN_RX_WQES);
589 /* restart network interface, if any */
591 mlx5e_open_locked(priv->ifp);
/* RSS channel count: clamped to the range 1..128. */
594 case MLX5_PARAM_OFFSET(channels_rsss):
595 /* network interface must be down */
597 mlx5e_close_locked(priv->ifp);
599 /* import number of channels */
600 if (priv->params_ethtool.channels_rsss < 1)
601 priv->params_ethtool.channels_rsss = 1;
602 else if (priv->params_ethtool.channels_rsss > 128)
603 priv->params_ethtool.channels_rsss = 128;
605 priv->params.channels_rsss = priv->params_ethtool.channels_rsss;
607 /* restart network interface, if any */
609 mlx5e_open_locked(priv->ifp);
/* Channel count: clamped to the range 1..num_comp_vectors. */
612 case MLX5_PARAM_OFFSET(channels):
613 /* network interface must be down */
615 mlx5e_close_locked(priv->ifp);
617 /* import number of channels */
618 if (priv->params_ethtool.channels < 1)
619 priv->params_ethtool.channels = 1;
620 else if (priv->params_ethtool.channels >
621 (u64) priv->mdev->priv.eq_table.num_comp_vectors) {
622 priv->params_ethtool.channels =
623 (u64) priv->mdev->priv.eq_table.num_comp_vectors;
625 priv->params.num_channels = priv->params_ethtool.channels;
627 /* restart network interface, if any */
629 mlx5e_open_locked(priv->ifp);
/*
 * Coalescing modes: the interface is closed and reopened only when it was
 * open and the mode cannot be modified (mode_modify == 0). The RX mode is
 * capped at 3; the TX mode is normalised to 0 or 1.
 */
632 case MLX5_PARAM_OFFSET(rx_coalesce_mode):
633 /* network interface must be down */
634 if (was_opened != 0 && mode_modify == 0)
635 mlx5e_close_locked(priv->ifp);
637 /* import RX coalesce mode */
638 if (priv->params_ethtool.rx_coalesce_mode > 3)
639 priv->params_ethtool.rx_coalesce_mode = 3;
640 priv->params.rx_cq_moderation_mode =
641 priv->params_ethtool.rx_coalesce_mode;
643 /* restart network interface, if any */
644 if (was_opened != 0) {
645 if (mode_modify == 0)
646 mlx5e_open_locked(priv->ifp);
648 error = mlx5e_refresh_channel_params(priv);
652 case MLX5_PARAM_OFFSET(tx_coalesce_mode):
653 /* network interface must be down */
654 if (was_opened != 0 && mode_modify == 0)
655 mlx5e_close_locked(priv->ifp);
657 /* import TX coalesce mode */
658 if (priv->params_ethtool.tx_coalesce_mode != 0)
659 priv->params_ethtool.tx_coalesce_mode = 1;
660 priv->params.tx_cq_moderation_mode =
661 priv->params_ethtool.tx_coalesce_mode;
663 /* restart network interface, if any */
664 if (was_opened != 0) {
665 if (mode_modify == 0)
666 mlx5e_open_locked(priv->ifp);
668 error = mlx5e_refresh_channel_params(priv);
/*
 * Hardware LRO: accepted only when the lro_cap Ethernet capability is set.
 * hw_lro_en is set to true only on the branch where IFCAP_LRO is enabled on
 * the interface.
 */
672 case MLX5_PARAM_OFFSET(hw_lro):
673 /* network interface must be down */
675 mlx5e_close_locked(priv->ifp);
677 /* import HW LRO mode */
678 if (priv->params_ethtool.hw_lro != 0 &&
679 MLX5_CAP_ETH(priv->mdev, lro_cap)) {
680 priv->params_ethtool.hw_lro = 1;
681 /* check if feature should actually be enabled */
682 if (priv->ifp->if_capenable & IFCAP_LRO) {
683 priv->params.hw_lro_en = true;
685 priv->params.hw_lro_en = false;
687 if_printf(priv->ifp, "To enable HW LRO "
688 "please also enable LRO via ifconfig(8).\n");
691 /* return an error if HW does not support this feature */
692 if (priv->params_ethtool.hw_lro != 0)
694 priv->params.hw_lro_en = false;
695 priv->params_ethtool.hw_lro = 0;
697 /* restart network interface, if any */
699 mlx5e_open_locked(priv->ifp);
/* CQE zipping: enabled only when the cqe_compression capability is set. */
702 case MLX5_PARAM_OFFSET(cqe_zipping):
703 /* network interface must be down */
705 mlx5e_close_locked(priv->ifp);
707 /* import CQE zipping mode */
708 if (priv->params_ethtool.cqe_zipping &&
709 MLX5_CAP_GEN(priv->mdev, cqe_compression)) {
710 priv->params.cqe_zipping_en = true;
711 priv->params_ethtool.cqe_zipping = 1;
713 priv->params.cqe_zipping_en = false;
714 priv->params_ethtool.cqe_zipping = 0;
716 /* restart network interface, if any */
718 mlx5e_open_locked(priv->ifp);
721 case MLX5_PARAM_OFFSET(tx_completion_fact):
722 /* network interface must be down */
724 mlx5e_close_locked(priv->ifp);
726 /* verify parameter */
727 mlx5e_ethtool_sync_tx_completion_fact(priv);
729 /* restart network interface, if any */
731 mlx5e_open_locked(priv->ifp);
/*
 * DMA modify switches: the stored value is normalised to 0 or 1 and the
 * modify helper is called with value != 0. The fallback branch resets the
 * stored value to 0.
 */
734 case MLX5_PARAM_OFFSET(modify_tx_dma):
735 /* check if network interface is opened */
737 priv->params_ethtool.modify_tx_dma =
738 priv->params_ethtool.modify_tx_dma ? 1 : 0;
739 /* modify tx according to value */
740 mlx5e_modify_tx_dma(priv, value != 0);
742 /* if closed force enable tx */
743 priv->params_ethtool.modify_tx_dma = 0;
747 case MLX5_PARAM_OFFSET(modify_rx_dma):
748 /* check if network interface is opened */
750 priv->params_ethtool.modify_rx_dma =
751 priv->params_ethtool.modify_rx_dma ? 1 : 0;
752 /* modify rx according to value */
753 mlx5e_modify_rx_dma(priv, value != 0);
755 /* if closed force enable rx */
756 priv->params_ethtool.modify_rx_dma = 0;
/*
 * Diagnostics switches: each flag is normalised to 0 or 1 and both flags are
 * then passed together to mlx5_core_set_diagnostics_full().
 */
760 case MLX5_PARAM_OFFSET(diag_pci_enable):
761 priv->params_ethtool.diag_pci_enable =
762 priv->params_ethtool.diag_pci_enable ? 1 : 0;
764 error = -mlx5_core_set_diagnostics_full(priv->mdev,
765 priv->params_ethtool.diag_pci_enable,
766 priv->params_ethtool.diag_general_enable);
769 case MLX5_PARAM_OFFSET(diag_general_enable):
770 priv->params_ethtool.diag_general_enable =
771 priv->params_ethtool.diag_general_enable ? 1 : 0;
773 error = -mlx5_core_set_diagnostics_full(priv->mdev,
774 priv->params_ethtool.diag_pci_enable,
775 priv->params_ethtool.diag_general_enable);
/*
 * Local loopback switches: normalised to 0 or 1 and applied only when the
 * disable_local_lb capability is present.
 */
778 case MLX5_PARAM_OFFSET(mc_local_lb):
779 priv->params_ethtool.mc_local_lb =
780 priv->params_ethtool.mc_local_lb ? 1 : 0;
782 if (MLX5_CAP_GEN(priv->mdev, disable_local_lb)) {
783 error = mlx5_nic_vport_modify_local_lb(priv->mdev,
784 MLX5_LOCAL_MC_LB, priv->params_ethtool.mc_local_lb);
790 case MLX5_PARAM_OFFSET(uc_local_lb):
791 priv->params_ethtool.uc_local_lb =
792 priv->params_ethtool.uc_local_lb ? 1 : 0;
794 if (MLX5_CAP_GEN(priv->mdev, disable_local_lb)) {
795 error = mlx5_nic_vport_modify_local_lb(priv->mdev,
796 MLX5_LOCAL_UC_LB, priv->params_ethtool.uc_local_lb);
811 * Read the first three bytes of the eeprom in order to get the needed info
812 * for the whole reading.
813 * Byte 0 - Identifier byte
814 * Byte 1 - Revision byte
815 * Byte 2 - Status byte
/*
 * mlx5e_get_eeprom_info: determine the module number and the EEPROM layout.
 *
 * The module number is stored in eeprom->module_num by
 * mlx5_query_module_num(). MLX5E_EEPROM_INFO_BYTES bytes are then read into
 * data with mlx5_query_eeprom(). The identifier bits of data select
 * eeprom->type and eeprom->len:
 *   - SFF_8024_ID_QSFP: SFF-8436 layout,
 *   - SFF_8024_ID_QSFPPLUS / SFF_8024_ID_QSFP28: SFF-8636 layout when the
 *     identifier is QSFP28 or the revision bits are at least 0x3, otherwise
 *     SFF-8436; page_valid is set to 1 when the page 3 valid bit mask
 *     yields zero,
 *   - SFF_8024_ID_SFP: SFF-8472 layout,
 *   - remaining branch: a message naming the unrecognised identifier.
 *
 * NOTE(review): the message branch indexes sff_8024_id[] with the raw masked
 * identifier. Confirm that the table has an entry for every value the mask
 * can produce; otherwise this is an out-of-bounds read.
 */
818 mlx5e_get_eeprom_info(struct mlx5e_priv *priv, struct mlx5e_eeprom *eeprom)
820 struct mlx5_core_dev *dev = priv->mdev;
825 ret = mlx5_query_module_num(dev, &eeprom->module_num);
827 if_printf(priv->ifp, "%s:%d: Failed query module error=%d\n",
828 __func__, __LINE__, ret);
832 /* Read the first three bytes to get Identifier, Revision and Status */
833 ret = mlx5_query_eeprom(dev, eeprom->i2c_addr, eeprom->page_num,
834 eeprom->device_addr, MLX5E_EEPROM_INFO_BYTES, eeprom->module_num, &data,
837 if_printf(priv->ifp, "%s:%d: Failed query eeprom module error=0x%x\n",
838 __func__, __LINE__, ret);
842 switch (data & MLX5_EEPROM_IDENTIFIER_BYTE_MASK) {
843 case SFF_8024_ID_QSFP:
844 eeprom->type = MLX5E_ETH_MODULE_SFF_8436;
845 eeprom->len = MLX5E_ETH_MODULE_SFF_8436_LEN;
847 case SFF_8024_ID_QSFPPLUS:
848 case SFF_8024_ID_QSFP28:
/* The revision bits are taken from the second byte of data (shift by 8). */
849 if ((data & MLX5_EEPROM_IDENTIFIER_BYTE_MASK) == SFF_8024_ID_QSFP28 ||
850 ((data & MLX5_EEPROM_REVISION_ID_BYTE_MASK) >> 8) >= 0x3) {
851 eeprom->type = MLX5E_ETH_MODULE_SFF_8636;
852 eeprom->len = MLX5E_ETH_MODULE_SFF_8636_LEN;
854 eeprom->type = MLX5E_ETH_MODULE_SFF_8436;
855 eeprom->len = MLX5E_ETH_MODULE_SFF_8436_LEN;
857 if ((data & MLX5_EEPROM_PAGE_3_VALID_BIT_MASK) == 0)
858 eeprom->page_valid = 1;
860 case SFF_8024_ID_SFP:
861 eeprom->type = MLX5E_ETH_MODULE_SFF_8472;
862 eeprom->len = MLX5E_ETH_MODULE_SFF_8472_LEN;
865 if_printf(priv->ifp, "%s:%d: Not recognized cable type = 0x%x(%s)\n",
866 __func__, __LINE__, data & MLX5_EEPROM_IDENTIFIER_BYTE_MASK,
867 sff_8024_id[data & MLX5_EEPROM_IDENTIFIER_BYTE_MASK]);
873 /* Read both low and high pages of the eeprom */
/*
 * mlx5e_get_eeprom: read the EEPROM contents into ee->data.
 *
 * Low page: mlx5_query_eeprom() is called repeatedly while
 * ee->device_addr < ee->len. Each call requests the remaining byte count and
 * ee->device_addr advances by the size_read value it reports.
 * High page (only when ee->page_valid is set): device_addr and page_num are
 * switched to the high page constants and the same loop runs up to
 * MLX5E_EEPROM_PAGE_LENGTH, storing after the low page data.
 *
 * NOTE(review): destination offsets are computed as byte address / 4, which
 * suggests ee->data points to 32-bit words - confirm against the declaration
 * of struct mlx5e_eeprom.
 */
875 mlx5e_get_eeprom(struct mlx5e_priv *priv, struct mlx5e_eeprom *ee)
877 struct mlx5_core_dev *dev = priv->mdev;
884 /* Read low page of the eeprom */
885 while (ee->device_addr < ee->len) {
886 ret = mlx5_query_eeprom(dev, ee->i2c_addr, ee->page_num, ee->device_addr,
887 ee->len - ee->device_addr, ee->module_num,
888 ee->data + (ee->device_addr / 4), &size_read);
890 if_printf(priv->ifp, "%s:%d: Failed reading eeprom, "
891 "error = 0x%02x\n", __func__, __LINE__, ret);
894 ee->device_addr += size_read;
897 /* Read high page of the eeprom */
898 if (ee->page_valid) {
899 ee->device_addr = MLX5E_EEPROM_HIGH_PAGE_OFFSET;
900 ee->page_num = MLX5E_EEPROM_HIGH_PAGE;
902 while (ee->device_addr < MLX5E_EEPROM_PAGE_LENGTH) {
903 ret = mlx5_query_eeprom(dev, ee->i2c_addr, ee->page_num,
904 ee->device_addr, MLX5E_EEPROM_PAGE_LENGTH - ee->device_addr,
905 ee->module_num, ee->data + (ee->len / 4) +
906 ((ee->device_addr - MLX5E_EEPROM_HIGH_PAGE_OFFSET) / 4),
909 if_printf(priv->ifp, "%s:%d: Failed reading eeprom, "
910 "error = 0x%02x\n", __func__, __LINE__, ret);
913 ee->device_addr += size_read;
/*
 * mlx5e_print_eeprom: hex dump the EEPROM buffer with printf().
 *
 * The low page is printed in rows of line_length (16) bytes, each row
 * prefixed with the byte offset, until byte_to_write reaches eeprom->len.
 * When eeprom->page_valid is set, a second table titled Upper Page 0x03 is
 * printed. Its row labels run from MLX5E_EEPROM_HIGH_PAGE_OFFSET up to
 * MLX5E_EEPROM_PAGE_LENGTH, while the bytes are still read through the
 * byte_to_write index.
 *
 * NOTE(review): the statements that advance byte_to_write and row are not
 * visible in this excerpt.
 */
920 mlx5e_print_eeprom(struct mlx5e_eeprom *eeprom)
924 int byte_to_write = 0;
925 int line_length = 16;
927 printf("\nOffset\t\tValues\n");
928 printf("------\t\t------");
929 while (byte_to_write < eeprom->len) {
930 printf("\n0x%04X\t\t", byte_to_write);
931 for (index_in_row = 0; index_in_row < line_length; index_in_row++) {
932 printf("%02X ", ((u8 *)eeprom->data)[byte_to_write]);
937 if (eeprom->page_valid) {
938 row = MLX5E_EEPROM_HIGH_PAGE_OFFSET;
939 printf("\n\nUpper Page 0x03\n");
940 printf("\nOffset\t\tValues\n");
941 printf("------\t\t------");
942 while (row < MLX5E_EEPROM_PAGE_LENGTH) {
943 printf("\n0x%04X\t\t", row);
944 for (index_in_row = 0; index_in_row < line_length; index_in_row++) {
945 printf("%02X ", ((u8 *)eeprom->data)[byte_to_write]);
954 * Read cable EEPROM module information by first inspecting the first
955 * three bytes to get the initial information for a whole reading.
956 * Information will be printed to dmesg.
/*
 * mlx5e_read_eeprom: sysctl handler that dumps the cable EEPROM
 * (arg1 is the struct mlx5e_priv).
 *
 * An integer is passed through sysctl_handle_int(); nothing further happens
 * on error or when no new value was supplied. The request structure is set
 * up for the low I2C address, device address 0 and the low page, with
 * page_valid cleared. mlx5e_get_eeprom_info() then fills in the layout. A
 * zeroed buffer of eeprom.len + MLX5E_EEPROM_PAGE_LENGTH bytes is allocated
 * with M_WAITOK, filled by mlx5e_get_eeprom(), printed by
 * mlx5e_print_eeprom() and freed.
 *
 * NOTE(review): the test on the written value, the device-gone check and the
 * error exits are not visible in this excerpt. The existing comment
 * indicates that a partial dump is still printed when the read fails.
 */
959 mlx5e_read_eeprom(SYSCTL_HANDLER_ARGS)
961 struct mlx5e_priv *priv = arg1;
962 struct mlx5e_eeprom eeprom;
967 error = sysctl_handle_int(oidp, &result, 0, req);
968 if (error || !req->newptr)
971 /* Check if device is gone */
978 eeprom.i2c_addr = MLX5E_I2C_ADDR_LOW;
979 eeprom.device_addr = 0;
980 eeprom.page_num = MLX5E_EEPROM_LOW_PAGE;
981 eeprom.page_valid = 0;
983 /* Read three first bytes to get important info */
984 error = mlx5e_get_eeprom_info(priv, &eeprom);
986 if_printf(priv->ifp, "%s:%d: Failed reading eeprom's "
987 "initial information\n", __func__, __LINE__);
992 * Allocate needed length buffer and additional space for
995 eeprom.data = malloc(eeprom.len + MLX5E_EEPROM_PAGE_LENGTH,
996 M_MLX5EN, M_WAITOK | M_ZERO);
998 /* Read the whole eeprom information */
999 error = mlx5e_get_eeprom(priv, &eeprom);
1001 if_printf(priv->ifp, "%s:%d: Failed reading eeprom\n",
1002 __func__, __LINE__);
1005 * Continue printing partial information in case of
1009 mlx5e_print_eeprom(&eeprom);
1010 free(eeprom.data, M_MLX5EN);
/*
 * String tables generated by expanding MLX5E_STATS_DESC over the parameter
 * and debug port statistics lists. Consumers in this file index them in
 * pairs: entry 2 * x is used as a sysctl name and entry 2 * x + 1 as its
 * description.
 */
1017 static const char *mlx5e_params_desc[] = {
1018 MLX5E_PARAMS(MLX5E_STATS_DESC)
1021 static const char *mlx5e_port_stats_debug_desc[] = {
1022 MLX5E_PORT_STATS_DEBUG(MLX5E_STATS_DESC)
/*
 * mlx5e_ethtool_debug_channel_info: sysctl handler that renders a text
 * report of interrupt vectors and queue numbers.
 *
 * The old buffer is wired and an sbuf bound to the request is created with
 * SBUF_INCLUDENUL cleared. The report lists the pages, command and async
 * interrupt vectors, then one line per channel (receive queue number, its
 * completion queue number and the interrupt vector) and one line per channel
 * and traffic class (send queue number, its completion queue number and the
 * interrupt vector). Queue and completion queue numbers are printed as -1
 * when MLX5E_STATE_OPENED is not set; the channel pointers are NULL in that
 * case and are dereferenced only under the opened test.
 *
 * NOTE(review): the assignment of priv, the lock handling and the action
 * taken when mlx5_vector2eqn() fails are not visible in this excerpt.
 */
1026 mlx5e_ethtool_debug_channel_info(SYSCTL_HANDLER_ARGS)
1028 struct mlx5e_priv *priv;
1030 struct mlx5e_channel *c;
1031 struct mlx5e_sq *sq;
1032 struct mlx5e_rq *rq;
1037 error = sysctl_wire_old_buffer(req, 0);
1040 if (sbuf_new_for_sysctl(&sb, NULL, 1024, req) == NULL)
1042 sbuf_clear_flags(&sb, SBUF_INCLUDENUL);
1045 opened = test_bit(MLX5E_STATE_OPENED, &priv->state);
1047 sbuf_printf(&sb, "pages irq %d\n",
1048 priv->mdev->priv.msix_arr[MLX5_EQ_VEC_PAGES].vector);
1049 sbuf_printf(&sb, "command irq %d\n",
1050 priv->mdev->priv.msix_arr[MLX5_EQ_VEC_CMD].vector);
1051 sbuf_printf(&sb, "async irq %d\n",
1052 priv->mdev->priv.msix_arr[MLX5_EQ_VEC_ASYNC].vector);
1054 for (i = 0; i != priv->params.num_channels; i++) {
1055 int eqn_not_used = -1;
1056 int irqn = MLX5_EQ_VEC_COMP_BASE;
/* Only irqn is used below; the event queue number output is ignored. */
1058 if (mlx5_vector2eqn(priv->mdev, i, &eqn_not_used, &irqn) != 0)
1061 c = opened ? &priv->channel[i] : NULL;
1062 rq = opened ? &c->rq : NULL;
1063 sbuf_printf(&sb, "channel %d rq %d cq %d irq %d\n", i,
1064 opened ? rq->rqn : -1,
1065 opened ? rq->cq.mcq.cqn : -1,
1066 priv->mdev->priv.msix_arr[irqn].vector);
1068 for (tc = 0; tc != priv->num_tc; tc++) {
1069 sq = opened ? &c->sq[tc] : NULL;
1070 sbuf_printf(&sb, "channel %d tc %d sq %d cq %d irq %d\n",
1072 opened ? sq->sqn : -1,
1073 opened ? sq->cq.mcq.cqn : -1,
1074 priv->mdev->priv.msix_arr[irqn].vector);
1078 error = sbuf_finish(&sb);
/*
 * mlx5e_ethtool_debug_stats: sysctl handler that toggles the extended debug
 * statistics subtree (arg1 is the struct mlx5e_priv).
 *
 * priv->gone is tested first. The current priv->sysctl_debug value is passed
 * through sysctl_handle_int(); the written value is normalised to 0 or 1 and
 * compared with the stored flag. When the new flag is non-zero, the
 * debug_stats counters are created with mlx5e_create_stats() under
 * priv->sysctl_ifnet and a read-only string node served by
 * mlx5e_ethtool_debug_channel_info() is added to the same context. The
 * other branch releases that sysctl context with sysctl_ctx_free().
 *
 * NOTE(review): the early exits and the name argument of the SYSCTL_ADD_PROC
 * call are not visible in this excerpt.
 */
1084 mlx5e_ethtool_debug_stats(SYSCTL_HANDLER_ARGS)
1086 struct mlx5e_priv *priv = arg1;
1091 if (priv->gone != 0) {
1095 sys_debug = priv->sysctl_debug;
1096 error = sysctl_handle_int(oidp, &sys_debug, 0, req);
1097 if (error != 0 || !req->newptr)
1099 sys_debug = sys_debug ? 1 : 0;
1100 if (sys_debug == priv->sysctl_debug)
/* The assignment inside the condition stores the new flag and tests it. */
1103 if ((priv->sysctl_debug = sys_debug)) {
1104 mlx5e_create_stats(&priv->stats.port_stats_debug.ctx,
1105 SYSCTL_CHILDREN(priv->sysctl_ifnet), "debug_stats",
1106 mlx5e_port_stats_debug_desc, MLX5E_PORT_STATS_DEBUG_NUM,
1107 priv->stats.port_stats_debug.arg);
1108 SYSCTL_ADD_PROC(&priv->stats.port_stats_debug.ctx,
1109 SYSCTL_CHILDREN(priv->sysctl_ifnet), OID_AUTO,
1111 CTLFLAG_RD | CTLFLAG_MPSAFE | CTLTYPE_STRING, priv, 0,
1112 mlx5e_ethtool_debug_channel_info, "S", "");
1114 sysctl_ctx_free(&priv->stats.port_stats_debug.ctx);
/*
 * mlx5e_create_diagnostics: create the diagnostics sysctl subtree.
 *
 * A read-only diagnostics node is added under priv->sysctl_ifnet in
 * priv->sysctl_ctx. Both the PCI and the general diagnostics tables are then
 * walked. Each entry is checked with mlx5_core_supports_diagnostics(), and a
 * read-only UQUAD leaf named entry.desc is added, backed by slot x of
 * priv->params_pci.array or priv->params_general.array respectively.
 *
 * NOTE(review): the statements that follow a failed support check and a NULL
 * node are not visible in this excerpt (presumably skip and return -
 * confirm).
 */
1122 mlx5e_create_diagnostics(struct mlx5e_priv *priv)
1124 struct mlx5_core_diagnostics_entry entry;
1125 struct sysctl_ctx_list *ctx;
1126 struct sysctl_oid *node;
1129 /* sysctl context we are using */
1130 ctx = &priv->sysctl_ctx;
1132 /* create root node */
1133 node = SYSCTL_ADD_NODE(ctx,
1134 SYSCTL_CHILDREN(priv->sysctl_ifnet), OID_AUTO,
1135 "diagnostics", CTLFLAG_RD, NULL, "Diagnostics");
1139 /* create PCI diagnostics */
1140 for (x = 0; x != MLX5_CORE_PCI_DIAGNOSTICS_NUM; x++) {
1141 entry = mlx5_core_pci_diagnostics_table[x];
1142 if (mlx5_core_supports_diagnostics(priv->mdev, entry.counter_id) == 0)
1144 SYSCTL_ADD_UQUAD(ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1145 entry.desc, CTLFLAG_RD, priv->params_pci.array + x,
1146 "PCI diagnostics counter");
1149 /* create general diagnostics */
1150 for (x = 0; x != MLX5_CORE_GENERAL_DIAGNOSTICS_NUM; x++) {
1151 entry = mlx5_core_general_diagnostics_table[x];
1152 if (mlx5_core_supports_diagnostics(priv->mdev, entry.counter_id) == 0)
1154 SYSCTL_ADD_UQUAD(ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1155 entry.desc, CTLFLAG_RD, priv->params_general.array + x,
1156 "General diagnostics counter");
1161 mlx5e_create_ethtool(struct mlx5e_priv *priv)
1163 struct sysctl_oid *node, *qos_node;
1164 const char *pnameunit;
1168 /* set some defaults */
1169 priv->params_ethtool.tx_queue_size_max = 1 << MLX5E_PARAMS_MAXIMUM_LOG_SQ_SIZE;
1170 priv->params_ethtool.rx_queue_size_max = 1 << MLX5E_PARAMS_MAXIMUM_LOG_RQ_SIZE;
1171 priv->params_ethtool.tx_queue_size = 1 << priv->params.log_sq_size;
1172 priv->params_ethtool.rx_queue_size = 1 << priv->params.log_rq_size;
1173 priv->params_ethtool.channels = priv->params.num_channels;
1174 priv->params_ethtool.channels_rsss = priv->params.channels_rsss;
1175 priv->params_ethtool.coalesce_pkts_max = MLX5E_FLD_MAX(cqc, cq_max_count);
1176 priv->params_ethtool.coalesce_usecs_max = MLX5E_FLD_MAX(cqc, cq_period);
1177 priv->params_ethtool.rx_coalesce_mode = priv->params.rx_cq_moderation_mode;
1178 priv->params_ethtool.rx_coalesce_usecs = priv->params.rx_cq_moderation_usec;
1179 priv->params_ethtool.rx_coalesce_pkts = priv->params.rx_cq_moderation_pkts;
1180 priv->params_ethtool.tx_coalesce_mode = priv->params.tx_cq_moderation_mode;
1181 priv->params_ethtool.tx_coalesce_usecs = priv->params.tx_cq_moderation_usec;
1182 priv->params_ethtool.tx_coalesce_pkts = priv->params.tx_cq_moderation_pkts;
1183 priv->params_ethtool.hw_lro = priv->params.hw_lro_en;
1184 priv->params_ethtool.cqe_zipping = priv->params.cqe_zipping_en;
1185 mlx5e_ethtool_sync_tx_completion_fact(priv);
1187 /* get default values for local loopback, if any */
1188 if (MLX5_CAP_GEN(priv->mdev, disable_local_lb)) {
1192 err = mlx5_nic_vport_query_local_lb(priv->mdev, MLX5_LOCAL_MC_LB, &val);
1194 priv->params_ethtool.mc_local_lb = val;
1196 err = mlx5_nic_vport_query_local_lb(priv->mdev, MLX5_LOCAL_UC_LB, &val);
1198 priv->params_ethtool.uc_local_lb = val;
1201 /* create root node */
1202 node = SYSCTL_ADD_NODE(&priv->sysctl_ctx,
1203 SYSCTL_CHILDREN(priv->sysctl_ifnet), OID_AUTO,
1204 "conf", CTLFLAG_RW, NULL, "Configuration");
1207 for (x = 0; x != MLX5E_PARAMS_NUM; x++) {
1208 /* check for read-only parameter */
1209 if (strstr(mlx5e_params_desc[2 * x], "_max") != NULL ||
1210 strstr(mlx5e_params_desc[2 * x], "_mtu") != NULL) {
1211 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1212 mlx5e_params_desc[2 * x], CTLTYPE_U64 | CTLFLAG_RD |
1213 CTLFLAG_MPSAFE, priv, x, &mlx5e_ethtool_handler, "QU",
1214 mlx5e_params_desc[2 * x + 1]);
1216 #if (__FreeBSD_version < 1100000)
1220 * NOTE: In FreeBSD-11 and newer the
1221 * CTLFLAG_RWTUN flag will take care of
1222 * loading default sysctl value from the
1223 * kernel environment, if any:
1225 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1226 mlx5e_params_desc[2 * x], CTLTYPE_U64 | CTLFLAG_RWTUN |
1227 CTLFLAG_MPSAFE, priv, x, &mlx5e_ethtool_handler, "QU",
1228 mlx5e_params_desc[2 * x + 1]);
1230 #if (__FreeBSD_version < 1100000)
1231 /* compute path for sysctl */
1232 snprintf(path, sizeof(path), "dev.mce.%d.conf.%s",
1233 device_get_unit(priv->mdev->pdev->dev.bsddev),
1234 mlx5e_params_desc[2 * x]);
1236 /* try to fetch tunable, if any */
1237 if (TUNABLE_QUAD_FETCH(path, &priv->params_ethtool.arg[x]))
1238 mlx5e_ethtool_handler(NULL, priv, x, NULL);
1243 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1244 "debug_stats", CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, priv,
1245 0, &mlx5e_ethtool_debug_stats, "I", "Extended debug statistics");
1247 pnameunit = device_get_nameunit(priv->mdev->pdev->dev.bsddev);
1249 SYSCTL_ADD_STRING(&priv->sysctl_ctx, SYSCTL_CHILDREN(node),
1250 OID_AUTO, "device_name", CTLFLAG_RD,
1251 __DECONST(void *, pnameunit), 0,
1254 /* EEPROM support */
1255 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(node), OID_AUTO, "eeprom_info",
1256 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, priv, 0,
1257 mlx5e_read_eeprom, "I", "EEPROM information");
1259 /* Diagnostics support */
1260 mlx5e_create_diagnostics(priv);
1262 /* create qos node */
1263 qos_node = SYSCTL_ADD_NODE(&priv->sysctl_ctx,
1264 SYSCTL_CHILDREN(node), OID_AUTO,
1265 "qos", CTLFLAG_RW, NULL, "Quality Of Service configuration");
1266 if (qos_node == NULL)
1269 /* Priority rate limit support */
1270 if (mlx5e_getmaxrate(priv) == 0) {
1271 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1272 OID_AUTO, "tc_max_rate", CTLTYPE_U64 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1273 priv, 0, mlx5e_tc_maxrate_handler, "QU",
1274 "Max rate for priority, specified in kilobits, where kilo=1000, "
1275 "max_rate must be divisible by 100000");
1278 /* Bandwidth limiting by ratio */
1279 if (mlx5e_get_max_alloc(priv) == 0) {
1280 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1281 OID_AUTO, "tc_rate_share", CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1282 priv, 0, mlx5e_tc_rate_share_handler, "QU",
1283 "Specify bandwidth ratio from 1 to 100 "
1284 "for the available traffic classes");
1287 /* Priority to traffic class mapping */
1288 if (mlx5e_get_prio_tc(priv) == 0) {
1289 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1290 OID_AUTO, "prio_0_7_tc", CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1291 priv, 0, mlx5e_prio_to_tc_handler, "CU",
1292 "Set traffic class 0 to 7 for priority 0 to 7 inclusivly");
1296 if (mlx5e_get_dscp(priv) == 0) {
1297 for (i = 0; i != MLX5_MAX_SUPPORTED_DSCP; i += 8) {
1299 snprintf(name, sizeof(name), "dscp_%d_%d_prio", i, i + 7);
1300 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1301 OID_AUTO, name, CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1302 priv, i, mlx5e_dscp_prio_handler, "CU",
1303 "Set DSCP to priority mapping, 0..7");
1305 #define A "Set trust state, 1:PCP 2:DSCP"
1307 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1308 OID_AUTO, "trust_state", CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1309 priv, 0, mlx5e_trust_state_handler, "CU",
1310 MLX5_CAP_QCAM_FEATURE(priv->mdev, qpts_trust_both) ?