2 * Copyright (c) 2015-2019 Mellanox Technologies. All rights reserved.
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions
7 * 1. Redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer.
9 * 2. Redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution.
13 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS `AS IS' AND
14 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
16 * ARE DISCLAIMED. IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
17 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
18 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
19 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
20 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
21 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
22 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 #include "port_buffer.h"
30 #include <net/sff8472.h>
/*
 * mlx5e_create_stats: register a group of read-only 64-bit counters.
 *
 * Adds a read-only sysctl node named by buffer (description: Statistics)
 * under parent, then adds one read-only unsigned 64-bit leaf per counter
 * beneath that node.
 *
 * ctx    - sysctl context handed to every SYSCTL_ADD_* call below
 * parent - list the new node is attached to
 * buffer - name of the new node
 * desc   - name/description pairs: desc[2 * x] is the leaf name and
 *          desc[2 * x + 1] is its description
 * num    - number of counters, so desc is read up to index 2 * num - 1
 * arg    - counter storage; leaf x is backed by arg + x
 *
 * NOTE(review): this listing omits short source lines (return type,
 * braces, the declaration of x, and whatever sits between the node
 * creation and the loop); confirm those against the complete file.
 */
33 mlx5e_create_stats(struct sysctl_ctx_list *ctx,
34 struct sysctl_oid_list *parent, const char *buffer,
35 const char **desc, unsigned num, u64 * arg)
37 struct sysctl_oid *node;
42 node = SYSCTL_ADD_NODE(ctx, parent, OID_AUTO,
43 buffer, CTLFLAG_RD, NULL, "Statistics");
/* One leaf per counter; names and descriptions are interleaved in desc. */
46 for (x = 0; x != num; x++) {
47 SYSCTL_ADD_UQUAD(ctx, SYSCTL_CHILDREN(node), OID_AUTO,
48 desc[2 * x], CTLFLAG_RD, arg + x, desc[2 * x + 1]);
/*
 * mlx5e_ethtool_sync_tx_completion_fact: keep the TX completion factor
 * consistent with the configured TX queue size.
 *
 * Computes max = tx_queue_size / (2 * MLX5_SEND_WQE_MAX_WQEBBS), stores it
 * in params_ethtool.tx_completion_fact_max, and then clamps
 * params_ethtool.tx_completion_fact into the range 1..max.
 *
 * NOTE(review): the source lines between the computation of max and the
 * store into tx_completion_fact_max are absent from this listing. The
 * surviving comment text mentions an overflow guard, so max may be
 * adjusted there; confirm against the complete file.
 */
53 mlx5e_ethtool_sync_tx_completion_fact(struct mlx5e_priv *priv)
56 * Limit the maximum distance between completion events to
57 * half of the currently set TX queue size.
59 * The maximum number of queue entries a single IP packet can
60 * consume is given by MLX5_SEND_WQE_MAX_WQEBBS.
62 * The worst case max value is then given as below:
64 uint64_t max = priv->params_ethtool.tx_queue_size /
65 (2 * MLX5_SEND_WQE_MAX_WQEBBS);
68 * Update the maximum completion factor value in case the
69 * tx_queue_size field changed. Ensure we don't overflow
76 priv->params_ethtool.tx_completion_fact_max = max;
79 * Verify that the current TX completion factor is within the
82 if (priv->params_ethtool.tx_completion_fact < 1)
83 priv->params_ethtool.tx_completion_fact = 1;
84 else if (priv->params_ethtool.tx_completion_fact > max)
85 priv->params_ethtool.tx_completion_fact = max;
/*
 * mlx5e_getmaxrate: load the per traffic class rate limits from the port
 * into the cached params_ethtool.max_bw_value array.
 *
 * The port reports each limit as a (value, unit) pair in two local u8
 * arrays; the switch below converts each pair into a single number by
 * multiplying the value with the constant that matches the unit.
 *
 * NOTE(review): the return statement, the error check after the query
 * and one case label are absent from this listing.
 */
89 mlx5e_getmaxrate(struct mlx5e_priv *priv)
91 struct mlx5_core_dev *mdev = priv->mdev;
92 u8 max_bw_unit[IEEE_8021QAZ_MAX_TCS];
93 u8 max_bw_value[IEEE_8021QAZ_MAX_TCS];
/* The callee result is negated before being stored in err. */
98 err = -mlx5_query_port_tc_rate_limit(mdev, max_bw_value, max_bw_unit);
/* Inclusive upper bound: traffic classes 0 through mlx5_max_tc(mdev). */
102 for (i = 0; i <= mlx5_max_tc(mdev); i++) {
103 switch (max_bw_unit[i]) {
104 case MLX5_100_MBPS_UNIT:
105 priv->params_ethtool.max_bw_value[i] = max_bw_value[i] * MLX5E_100MB;
/*
 * NOTE(review): the case label for the next assignment is not shown;
 * presumably it is the Gbps unit, given the MLX5E_1GB multiplier.
 */
108 priv->params_ethtool.max_bw_value[i] = max_bw_value[i] * MLX5E_1GB;
/* No limit is cached as zero. */
110 case MLX5_BW_NO_LIMIT:
111 priv->params_ethtool.max_bw_value[i] = 0;
/* Any other unit is cached as -1 and reported once via WARN_ONCE. */
114 priv->params_ethtool.max_bw_value[i] = -1;
115 WARN_ONCE(true, "non-supported BW unit");
/*
 * mlx5e_get_max_alloc: load the per traffic class bandwidth shares from
 * the port into params_ethtool.max_bw_share.
 *
 * The visible code also contains a fallback that fills every share with
 * 100 / IEEE_8021QAZ_MAX_TCS and writes that table back to the port.
 *
 * NOTE(review): the condition guarding the fallback and the return
 * statement are absent from this listing; presumably the fallback runs
 * only when the query fails. Confirm against the complete file.
 */
125 mlx5e_get_max_alloc(struct mlx5e_priv *priv)
127 struct mlx5_core_dev *mdev = priv->mdev;
/* The callee result is negated before being stored in err. */
132 err = -mlx5_query_port_tc_bw_alloc(mdev, priv->params_ethtool.max_bw_share);
134 /* set default value */
135 for (x = 0; x != IEEE_8021QAZ_MAX_TCS; x++) {
136 priv->params_ethtool.max_bw_share[x] =
137 100 / IEEE_8021QAZ_MAX_TCS;
/* Push the default table to the port. */
139 err = -mlx5_set_port_tc_bw_alloc(mdev,
140 priv->params_ethtool.max_bw_share);
/*
 * mlx5e_get_dscp: load the DSCP to priority table and the trust state
 * from the port into params_ethtool.dscp2prio and
 * params_ethtool.trust_state.
 *
 * The capability test below fires when any of qcam_reg, qpts or qpdpm is
 * reported as zero.
 *
 * NOTE(review): the statement executed when the capability test fires,
 * the error checks and the return statement are absent from this
 * listing; presumably the function bails out early in that case.
 */
148 mlx5e_get_dscp(struct mlx5e_priv *priv)
150 struct mlx5_core_dev *mdev = priv->mdev;
153 if (MLX5_CAP_GEN(mdev, qcam_reg) == 0 ||
154 MLX5_CAP_QCAM_REG(mdev, qpts) == 0 ||
155 MLX5_CAP_QCAM_REG(mdev, qpdpm) == 0)
/* Both query results are negated before being stored in err. */
159 err = -mlx5_query_dscp2prio(mdev, priv->params_ethtool.dscp2prio);
163 err = -mlx5_query_trust_state(mdev, &priv->params_ethtool.trust_state);
/*
 * mlx5e_tc_get_parameters: convert per traffic class rate limits into the
 * (value, unit) byte pairs written to max_bw_value and max_bw_unit.
 *
 * priv         - supplies the cached limits and the device handle
 * new_bw_value - limits to convert; when NULL the cached
 *                params_ethtool.max_bw_value entries are used instead
 * max_bw_value - output, IEEE_8021QAZ_MAX_TCS bytes, zeroed first
 * max_bw_unit  - output, IEEE_8021QAZ_MAX_TCS bytes, zeroed first
 *
 * The largest encodable value per unit is 255, which is where the two
 * upper limits below come from.
 *
 * NOTE(review): the first condition of the if chain is absent from this
 * listing; presumably it tests for a zero limit.
 */
172 mlx5e_tc_get_parameters(struct mlx5e_priv *priv,
173 u64 *new_bw_value, u8 *max_bw_value, u8 *max_bw_unit)
175 const u64 upper_limit_mbps = 255 * MLX5E_100MB;
176 const u64 upper_limit_gbps = 255 * MLX5E_1GB;
180 memset(max_bw_value, 0, IEEE_8021QAZ_MAX_TCS);
181 memset(max_bw_unit, 0, IEEE_8021QAZ_MAX_TCS);
/* Inclusive upper bound: traffic classes 0 through mlx5_max_tc(). */
183 for (i = 0; i <= mlx5_max_tc(priv->mdev); i++) {
184 temp = (new_bw_value != NULL) ?
185 new_bw_value[i] : priv->params_ethtool.max_bw_value[i];
188 max_bw_unit[i] = MLX5_BW_NO_LIMIT;
/* Limits above 255 times MLX5E_1GB cannot be encoded: treat as no limit. */
189 } else if (temp > upper_limit_gbps) {
190 max_bw_unit[i] = MLX5_BW_NO_LIMIT;
/* Small enough for the 100 Mbps unit; howmany() rounds up. */
191 } else if (temp <= upper_limit_mbps) {
192 max_bw_value[i] = howmany(temp, MLX5E_100MB);
193 max_bw_unit[i] = MLX5_100_MBPS_UNIT;
/* Otherwise fall back to the Gbps unit, again rounding up. */
195 max_bw_value[i] = howmany(temp, MLX5E_1GB);
196 max_bw_unit[i] = MLX5_GBPS_UNIT;
/*
 * mlx5e_tc_maxrate_handler: sysctl handler for the per traffic class
 * maximum rate table.
 *
 * arg1 is the struct mlx5e_priv. The handler first copies the cached
 * limits out to the caller, one u64 per traffic class for
 * mlx5_max_tc(mdev) + 1 classes. On a write it reads the same number of
 * new values, checks each one against MLX5E_100MB granularity, converts
 * them with mlx5e_tc_get_parameters(), programs the port and finally
 * updates the cache.
 *
 * NOTE(review): locking, the early exits after each error check and the
 * return statement are absent from this listing.
 */
202 mlx5e_tc_maxrate_handler(SYSCTL_HANDLER_ARGS)
204 struct mlx5e_priv *priv = arg1;
205 struct mlx5_core_dev *mdev = priv->mdev;
206 u8 max_bw_unit[IEEE_8021QAZ_MAX_TCS];
207 u8 max_bw_value[IEEE_8021QAZ_MAX_TCS];
208 u64 new_bw_value[IEEE_8021QAZ_MAX_TCS];
209 u8 max_rates = mlx5_max_tc(mdev) + 1;
214 err = SYSCTL_OUT(req, priv->params_ethtool.max_bw_value,
215 sizeof(priv->params_ethtool.max_bw_value[0]) * max_rates);
/* A read-only request (no new value) or a copy-out error stops here. */
216 if (err || !req->newptr)
218 err = SYSCTL_IN(req, new_bw_value,
219 sizeof(new_bw_value[0]) * max_rates);
223 /* range check input value */
224 for (x = 0; x != max_rates; x++) {
/* Fires when a value is not a whole multiple of MLX5E_100MB. */
225 if (new_bw_value[x] % MLX5E_100MB) {
231 mlx5e_tc_get_parameters(priv, new_bw_value, max_bw_value, max_bw_unit);
233 err = -mlx5_modify_port_tc_rate_limit(mdev, max_bw_value, max_bw_unit);
/*
 * NOTE(review): this copies the size of the whole cached array, while
 * SYSCTL_IN above filled only max_rates entries of new_bw_value. If
 * max_rates can be smaller than the array length, confirm that the tail
 * of new_bw_value is initialised in lines not shown here.
 */
237 memcpy(priv->params_ethtool.max_bw_value, new_bw_value,
238 sizeof(priv->params_ethtool.max_bw_value));
/*
 * mlx5e_tc_rate_share_handler: sysctl handler for the per traffic class
 * bandwidth share table.
 *
 * arg1 is the struct mlx5e_priv. The handler copies the cached shares
 * out, one byte per traffic class for mlx5_max_tc(mdev) + 1 classes. On
 * a write it reads the same number of bytes, validates them, programs
 * the port and updates the cache.
 *
 * NOTE(review): locking, the statements taken when a check fails and the
 * return statement are absent from this listing.
 */
245 mlx5e_tc_rate_share_handler(SYSCTL_HANDLER_ARGS)
247 struct mlx5e_priv *priv = arg1;
248 struct mlx5_core_dev *mdev = priv->mdev;
249 u8 max_bw_share[IEEE_8021QAZ_MAX_TCS];
250 u8 max_rates = mlx5_max_tc(mdev) + 1;
256 err = SYSCTL_OUT(req, priv->params_ethtool.max_bw_share, max_rates);
257 if (err || !req->newptr)
259 err = SYSCTL_IN(req, max_bw_share, max_rates);
263 /* range check input value */
264 for (sum = i = 0; i != max_rates; i++) {
/* Each individual share must lie in 1..100. */
265 if (max_bw_share[i] < 1 || max_bw_share[i] > 100) {
269 sum += max_bw_share[i];
272 /* sum of values should be as close to 100 as possible */
/* Accepted sums are 100 - max_rates + 1 through 100 inclusive. */
273 if (sum < (100 - max_rates + 1) || sum > 100) {
278 err = -mlx5_set_port_tc_bw_alloc(mdev, max_bw_share);
/*
 * NOTE(review): this copies the size of the whole cached array, while
 * SYSCTL_IN above filled only max_rates bytes of max_bw_share. If
 * max_rates can be smaller than the array length, confirm that the tail
 * of the local array is initialised in lines not shown here.
 */
282 memcpy(priv->params_ethtool.max_bw_share, max_bw_share,
283 sizeof(priv->params_ethtool.max_bw_share));
/*
 * mlx5e_get_prio_tc: load the priority to traffic class mapping from the
 * port into params_ethtool.prio_tc, one query per priority for
 * MLX5E_MAX_PRIORITY priorities.
 *
 * NOTE(review): the statement executed when the ets capability is
 * missing, the per-query error check and the return statement are
 * absent from this listing.
 */
290 mlx5e_get_prio_tc(struct mlx5e_priv *priv)
292 struct mlx5_core_dev *mdev = priv->mdev;
/* Fires when the device does not report the ets capability. */
297 if (!MLX5_CAP_GEN(priv->mdev, ets)) {
302 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) {
/* Result for priority i lands in prio_tc[i]; the status is negated. */
303 err = -mlx5_query_port_prio_tc(mdev, i, priv->params_ethtool.prio_tc + i);
/*
 * mlx5e_prio_to_tc_handler: sysctl handler for the priority to traffic
 * class mapping.
 *
 * arg1 is the struct mlx5e_priv. The handler copies the cached
 * MLX5E_MAX_PRIORITY byte table out. On a write it reads a new table
 * into temp, validates every entry in a first pass, and in a second pass
 * programs only the entries that differ from the cache, updating the
 * cache entry by entry.
 *
 * NOTE(review): locking, the statements taken when a check fails and the
 * return statement are absent from this listing.
 */
312 mlx5e_prio_to_tc_handler(SYSCTL_HANDLER_ARGS)
314 struct mlx5e_priv *priv = arg1;
315 struct mlx5_core_dev *mdev = priv->mdev;
316 uint8_t temp[MLX5E_MAX_PRIORITY];
321 err = SYSCTL_OUT(req, priv->params_ethtool.prio_tc, MLX5E_MAX_PRIORITY);
322 if (err || !req->newptr)
324 err = SYSCTL_IN(req, temp, MLX5E_MAX_PRIORITY);
/* Pass 1: reject any traffic class above mlx5_max_tc(mdev). */
328 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) {
329 if (temp[i] > mlx5_max_tc(mdev)) {
/* Pass 2: apply changes; unchanged entries are detected here. */
335 for (i = 0; i != MLX5E_MAX_PRIORITY; i++) {
336 if (temp[i] == priv->params_ethtool.prio_tc[i])
338 err = -mlx5_set_port_prio_tc(mdev, i, temp[i]);
341 /* update cached value */
342 priv->params_ethtool.prio_tc[i] = temp[i];
/*
 * mlx5e_trust_state_handler: sysctl handler for the QoS trust state.
 *
 * arg1 is the struct mlx5e_priv. The cached trust state is exposed as an
 * 8-bit value through sysctl_handle_8(). On a write with a different
 * value the new state is checked against the known MLX5_QPTS_TRUST_*
 * values, programmed with mlx5_set_trust_state(), cached, and the send
 * queue inline settings are refreshed.
 *
 * NOTE(review): the switch statement header, the statements taken on
 * rejection, locking and the return statement are absent from this
 * listing.
 */
350 mlx5e_trust_state_handler(SYSCTL_HANDLER_ARGS)
352 struct mlx5e_priv *priv = arg1;
353 struct mlx5_core_dev *mdev = priv->mdev;
358 result = priv->params_ethtool.trust_state;
359 err = sysctl_handle_8(oidp, &result, 0, req);
/* Nothing more to do on error, on a pure read, or when unchanged. */
360 if (err || !req->newptr ||
361 result == priv->params_ethtool.trust_state)
365 case MLX5_QPTS_TRUST_PCP:
366 case MLX5_QPTS_TRUST_DSCP:
/* The combined mode is additionally gated on a device feature bit. */
368 case MLX5_QPTS_TRUST_BOTH:
369 if (!MLX5_CAP_QCAM_FEATURE(mdev, qpts_trust_both)) {
379 err = -mlx5_set_trust_state(mdev, result);
383 priv->params_ethtool.trust_state = result;
385 /* update inline mode */
386 mlx5e_refresh_sq_inline(priv);
388 mlx5e_rl_refresh_sq_inline(&priv->rl);
/*
 * mlx5e_dscp_prio_handler: sysctl handler for one slice of the DSCP to
 * priority table.
 *
 * arg1 is the struct mlx5e_priv and arg2 is the index of the first table
 * entry covered by this sysctl. Each request transfers one eighth of the
 * table, starting at that index. On a write the whole table is copied to
 * a local array, the slice is overwritten with the new data, every entry
 * of the full table is validated, the table is programmed with
 * mlx5_set_dscp2prio() and the cache is replaced.
 *
 * NOTE(review): locking, the statements taken when a check fails and the
 * return statement are absent from this listing.
 */
396 mlx5e_dscp_prio_handler(SYSCTL_HANDLER_ARGS)
398 struct mlx5e_priv *priv = arg1;
399 int prio_index = arg2;
400 struct mlx5_core_dev *mdev = priv->mdev;
401 uint8_t dscp2prio[MLX5_MAX_SUPPORTED_DSCP];
/* Copy out the slice that starts at prio_index. */
406 err = SYSCTL_OUT(req, priv->params_ethtool.dscp2prio + prio_index,
407 sizeof(priv->params_ethtool.dscp2prio) / 8);
408 if (err || !req->newptr)
/* Start from the cached table so entries outside the slice are kept. */
411 memcpy(dscp2prio, priv->params_ethtool.dscp2prio, sizeof(dscp2prio));
412 err = SYSCTL_IN(req, dscp2prio + prio_index, sizeof(dscp2prio) / 8);
/* Priorities above 7 are rejected; the check covers the whole table. */
415 for (x = 0; x != MLX5_MAX_SUPPORTED_DSCP; x++) {
416 if (dscp2prio[x] > 7) {
421 err = -mlx5_set_dscp2prio(mdev, dscp2prio);
425 /* update local array */
426 memcpy(priv->params_ethtool.dscp2prio, dscp2prio,
427 sizeof(priv->params_ethtool.dscp2prio));
/*
 * mlx5e_update_buf_lossy: reapply the port buffer configuration for the
 * current receive priority flow control setting.
 *
 * Builds a zeroed pfc descriptor whose pfc_en field is taken from
 * params.rx_priority_flow_control and passes it to
 * mlx5e_port_manual_buffer_config() with the MLX5E_PORT_BUFFER_PFC
 * change flag and the current hw_mtu. Returns the negated result of that
 * call. The caller must hold the priv lock, as asserted below.
 *
 * NOTE(review): the declaration of pfc is absent from this listing.
 */
434 mlx5e_update_buf_lossy(struct mlx5e_priv *priv)
438 PRIV_ASSERT_LOCKED(priv);
439 bzero(&pfc, sizeof(pfc));
440 pfc.pfc_en = priv->params.rx_priority_flow_control;
441 return (-mlx5e_port_manual_buffer_config(priv, MLX5E_PORT_BUFFER_PFC,
442 priv->params_ethtool.hw_mtu, &pfc, NULL, NULL));
/*
 * mlx5e_buf_size_handler: sysctl handler for the port buffer sizes.
 *
 * Queries the current port buffer state, copies the size of each buffer
 * into a u32 array and hands that array to the caller. On a write the
 * same array is refilled from the request and applied with
 * mlx5e_port_manual_buffer_config() using the MLX5E_PORT_BUFFER_SIZE
 * change flag and the current hw_mtu.
 *
 * NOTE(review): the assignment of priv, locking, the early exits after
 * each error check and the return statement are absent from this
 * listing.
 */
446 mlx5e_buf_size_handler(SYSCTL_HANDLER_ARGS)
448 struct mlx5e_priv *priv;
449 u32 buf_size[MLX5E_MAX_BUFFER];
450 struct mlx5e_port_buffer port_buffer;
455 error = -mlx5e_port_query_buffer(priv, &port_buffer);
458 for (i = 0; i < nitems(buf_size); i++)
459 buf_size[i] = port_buffer.buffer[i].size;
460 error = SYSCTL_OUT(req, buf_size, sizeof(buf_size));
461 if (error != 0 || req->newptr == NULL)
463 error = SYSCTL_IN(req, buf_size, sizeof(buf_size));
466 error = -mlx5e_port_manual_buffer_config(priv, MLX5E_PORT_BUFFER_SIZE,
467 priv->params_ethtool.hw_mtu, NULL, buf_size, NULL);
/*
 * mlx5e_buf_prio_handler: sysctl handler for the priority to buffer
 * mapping.
 *
 * Queries the current mapping into a MLX5E_MAX_BUFFER byte array and
 * hands it to the caller. On a write the array is refilled from the
 * request and applied with mlx5e_port_manual_buffer_config() using the
 * MLX5E_PORT_BUFFER_PRIO2BUFFER change flag, after which
 * mlx5e_update_buf_lossy() is called.
 *
 * NOTE(review): the assignments of priv and mdev, locking, the condition
 * under which mlx5e_update_buf_lossy() runs, the early exits and the
 * return statement are absent from this listing.
 */
474 mlx5e_buf_prio_handler(SYSCTL_HANDLER_ARGS)
476 struct mlx5e_priv *priv;
477 struct mlx5_core_dev *mdev;
478 u8 buffer[MLX5E_MAX_BUFFER];
484 error = -mlx5e_port_query_priority2buffer(mdev, buffer);
487 error = SYSCTL_OUT(req, buffer, MLX5E_MAX_BUFFER);
488 if (error != 0 || req->newptr == NULL)
490 error = SYSCTL_IN(req, buffer, MLX5E_MAX_BUFFER);
493 error = -mlx5e_port_manual_buffer_config(priv,
494 MLX5E_PORT_BUFFER_PRIO2BUFFER,
495 priv->params_ethtool.hw_mtu, NULL, NULL, buffer);
/* Unlike the calls above, this result is stored without negation here
 * because mlx5e_update_buf_lossy() already negates its own result. */
497 error = mlx5e_update_buf_lossy(priv);
/*
 * mlx5e_cable_length_handler: sysctl handler for the cable length used
 * by the port buffer configuration.
 *
 * Exposes priv->dcbx.cable_len through sysctl_handle_int(). When a write
 * succeeds and the value differs from the cached one, the port buffers
 * are reconfigured with the MLX5E_PORT_BUFFER_CABLE_LEN change flag and
 * the new length is stored in priv->dcbx.cable_len.
 *
 * NOTE(review): the assignment of priv, locking, the remaining arguments
 * of the reconfiguration call, the condition guarding the cache update
 * and the return statement are absent from this listing.
 */
504 mlx5e_cable_length_handler(SYSCTL_HANDLER_ARGS)
506 struct mlx5e_priv *priv;
512 cable_len = priv->dcbx.cable_len;
513 error = sysctl_handle_int(oidp, &cable_len, 0, req);
514 if (error == 0 && req->newptr != NULL &&
515 cable_len != priv->dcbx.cable_len) {
516 error = -mlx5e_port_manual_buffer_config(priv,
517 MLX5E_PORT_BUFFER_CABLE_LEN, priv->params_ethtool.hw_mtu,
520 priv->dcbx.cable_len = cable_len;
/*
 * MLX5_PARAM_OFFSET(n): byte offset of params_ethtool.n inside
 * struct mlx5e_priv. The ethtool handler switches on this offset, so a
 * parameter can be named either by field (case labels) or by its index
 * in the params_ethtool.arg array (switch expression).
 */
526 #define MLX5_PARAM_OFFSET(n) \
527 __offsetof(struct mlx5e_priv, params_ethtool.n)
/*
 * mlx5e_ethtool_handler: sysctl handler shared by all 64-bit entries of
 * the params_ethtool.arg array.
 *
 * arg1 is the struct mlx5e_priv and arg2 is the index of the parameter
 * in params_ethtool.arg. The current value is exposed through
 * sysctl_handle_64(). When a write changes the value, it is stored
 * unconditionally and then the switch below, keyed by the field offset
 * of the parameter, sanitises the stored value, mirrors it into
 * priv->params and applies it. Several cases close the interface before
 * changing the setting and open it again afterwards.
 *
 * NOTE(review): this listing omits many short lines, including locking,
 * the device-gone test, most of the conditions that test was_opened, the
 * else keywords, break statements and the return statement. A caller in
 * this file passes NULL for oidp and req, so the lines that are not
 * shown presumably guard the sysctl_handle_64() call; confirm against
 * the complete file before relying on any ordering described here.
 */
530 mlx5e_ethtool_handler(SYSCTL_HANDLER_ARGS)
532 struct mlx5e_priv *priv = arg1;
539 value = priv->params_ethtool.arg[arg2];
541 error = sysctl_handle_64(oidp, &value, 0, req);
/* Nothing more to do on error, on a pure read, or when unchanged. */
542 if (error || req->newptr == NULL ||
543 value == priv->params_ethtool.arg[arg2])
546 /* assign new value */
547 priv->params_ethtool.arg[arg2] = value;
551 /* check if device is gone */
/* Remember whether the interface was open and whether the device can
 * change the CQ period mode without a restart. */
556 was_opened = test_bit(MLX5E_STATE_OPENED, &priv->state);
557 mode_modify = MLX5_CAP_GEN(priv->mdev, cq_period_mode_modify);
/* Dispatch on the field offset of the parameter that was written. */
559 switch (MLX5_PARAM_OFFSET(arg[arg2])) {
560 case MLX5_PARAM_OFFSET(rx_coalesce_usecs):
561 /* import RX coal time */
/* Clamp to 0..MLX5E_FLD_MAX(cqc, cq_period). */
562 if (priv->params_ethtool.rx_coalesce_usecs < 1)
563 priv->params_ethtool.rx_coalesce_usecs = 0;
564 else if (priv->params_ethtool.rx_coalesce_usecs >
565 MLX5E_FLD_MAX(cqc, cq_period)) {
566 priv->params_ethtool.rx_coalesce_usecs =
567 MLX5E_FLD_MAX(cqc, cq_period);
569 priv->params.rx_cq_moderation_usec =
570 priv->params_ethtool.rx_coalesce_usecs;
572 /* check to avoid down and up the network interface */
574 error = mlx5e_refresh_channel_params(priv);
577 case MLX5_PARAM_OFFSET(rx_coalesce_pkts):
578 /* import RX coal pkts */
/* Clamp to 0..MLX5E_FLD_MAX(cqc, cq_max_count). */
579 if (priv->params_ethtool.rx_coalesce_pkts < 1)
580 priv->params_ethtool.rx_coalesce_pkts = 0;
581 else if (priv->params_ethtool.rx_coalesce_pkts >
582 MLX5E_FLD_MAX(cqc, cq_max_count)) {
583 priv->params_ethtool.rx_coalesce_pkts =
584 MLX5E_FLD_MAX(cqc, cq_max_count);
586 priv->params.rx_cq_moderation_pkts =
587 priv->params_ethtool.rx_coalesce_pkts;
589 /* check to avoid down and up the network interface */
591 error = mlx5e_refresh_channel_params(priv);
594 case MLX5_PARAM_OFFSET(tx_coalesce_usecs):
595 /* import TX coal time */
/* Clamp to 0..MLX5E_FLD_MAX(cqc, cq_period). */
596 if (priv->params_ethtool.tx_coalesce_usecs < 1)
597 priv->params_ethtool.tx_coalesce_usecs = 0;
598 else if (priv->params_ethtool.tx_coalesce_usecs >
599 MLX5E_FLD_MAX(cqc, cq_period)) {
600 priv->params_ethtool.tx_coalesce_usecs =
601 MLX5E_FLD_MAX(cqc, cq_period);
603 priv->params.tx_cq_moderation_usec =
604 priv->params_ethtool.tx_coalesce_usecs;
606 /* check to avoid down and up the network interface */
608 error = mlx5e_refresh_channel_params(priv);
611 case MLX5_PARAM_OFFSET(tx_coalesce_pkts):
612 /* import TX coal pkts */
/* Clamp to 0..MLX5E_FLD_MAX(cqc, cq_max_count). */
613 if (priv->params_ethtool.tx_coalesce_pkts < 1)
614 priv->params_ethtool.tx_coalesce_pkts = 0;
615 else if (priv->params_ethtool.tx_coalesce_pkts >
616 MLX5E_FLD_MAX(cqc, cq_max_count)) {
617 priv->params_ethtool.tx_coalesce_pkts =
618 MLX5E_FLD_MAX(cqc, cq_max_count);
620 priv->params.tx_cq_moderation_pkts =
621 priv->params_ethtool.tx_coalesce_pkts;
623 /* check to avoid down and up the network interface */
625 error = mlx5e_refresh_channel_params(priv);
628 case MLX5_PARAM_OFFSET(tx_queue_size):
629 /* network interface must be down */
631 mlx5e_close_locked(priv->ifp);
633 /* import TX queue size */
/* Clamp between the minimum SQ size and tx_queue_size_max. */
634 if (priv->params_ethtool.tx_queue_size <
635 (1 << MLX5E_PARAMS_MINIMUM_LOG_SQ_SIZE)) {
636 priv->params_ethtool.tx_queue_size =
637 (1 << MLX5E_PARAMS_MINIMUM_LOG_SQ_SIZE);
638 } else if (priv->params_ethtool.tx_queue_size >
639 priv->params_ethtool.tx_queue_size_max) {
640 priv->params_ethtool.tx_queue_size =
641 priv->params_ethtool.tx_queue_size_max;
643 /* store actual TX queue size */
/* The size is stored as a log2 and the exposed value is rewritten as
 * the matching power of two. */
644 priv->params.log_sq_size =
645 order_base_2(priv->params_ethtool.tx_queue_size);
646 priv->params_ethtool.tx_queue_size =
647 1 << priv->params.log_sq_size;
649 /* verify TX completion factor */
650 mlx5e_ethtool_sync_tx_completion_fact(priv);
652 /* restart network interface, if any */
654 mlx5e_open_locked(priv->ifp);
657 case MLX5_PARAM_OFFSET(rx_queue_size):
658 /* network interface must be down */
660 mlx5e_close_locked(priv->ifp);
662 /* import RX queue size */
/* Clamp between the minimum RQ size and rx_queue_size_max. */
663 if (priv->params_ethtool.rx_queue_size <
664 (1 << MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE)) {
665 priv->params_ethtool.rx_queue_size =
666 (1 << MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE);
667 } else if (priv->params_ethtool.rx_queue_size >
668 priv->params_ethtool.rx_queue_size_max) {
669 priv->params_ethtool.rx_queue_size =
670 priv->params_ethtool.rx_queue_size_max;
672 /* store actual RX queue size */
673 priv->params.log_rq_size =
674 order_base_2(priv->params_ethtool.rx_queue_size);
675 priv->params_ethtool.rx_queue_size =
676 1 << priv->params.log_rq_size;
678 /* update least number of RX WQEs */
679 priv->params.min_rx_wqes = min(
680 priv->params_ethtool.rx_queue_size - 1,
681 MLX5E_PARAMS_DEFAULT_MIN_RX_WQES);
683 /* restart network interface, if any */
685 mlx5e_open_locked(priv->ifp);
688 case MLX5_PARAM_OFFSET(channels_rsss):
689 /* network interface must be down */
691 mlx5e_close_locked(priv->ifp);
693 /* import number of channels */
/* Clamp to 1..128. */
694 if (priv->params_ethtool.channels_rsss < 1)
695 priv->params_ethtool.channels_rsss = 1;
696 else if (priv->params_ethtool.channels_rsss > 128)
697 priv->params_ethtool.channels_rsss = 128;
699 priv->params.channels_rsss = priv->params_ethtool.channels_rsss;
701 /* restart network interface, if any */
703 mlx5e_open_locked(priv->ifp);
706 case MLX5_PARAM_OFFSET(channels):
707 /* network interface must be down */
709 mlx5e_close_locked(priv->ifp);
711 /* import number of channels */
/* Clamp to 1..number of completion vectors of the device. */
712 if (priv->params_ethtool.channels < 1)
713 priv->params_ethtool.channels = 1;
714 else if (priv->params_ethtool.channels >
715 (u64) priv->mdev->priv.eq_table.num_comp_vectors) {
716 priv->params_ethtool.channels =
717 (u64) priv->mdev->priv.eq_table.num_comp_vectors;
719 priv->params.num_channels = priv->params_ethtool.channels;
721 /* restart network interface, if any */
723 mlx5e_open_locked(priv->ifp);
726 case MLX5_PARAM_OFFSET(rx_coalesce_mode):
727 /* network interface must be down */
/* A restart is only needed when the device cannot modify the mode. */
728 if (was_opened != 0 && mode_modify == 0)
729 mlx5e_close_locked(priv->ifp);
731 /* import RX coalesce mode */
/* Values above 3 are clamped to 3. */
732 if (priv->params_ethtool.rx_coalesce_mode > 3)
733 priv->params_ethtool.rx_coalesce_mode = 3;
734 priv->params.rx_cq_moderation_mode =
735 priv->params_ethtool.rx_coalesce_mode;
737 /* restart network interface, if any */
738 if (was_opened != 0) {
739 if (mode_modify == 0)
740 mlx5e_open_locked(priv->ifp);
742 error = mlx5e_refresh_channel_params(priv);
746 case MLX5_PARAM_OFFSET(tx_coalesce_mode):
747 /* network interface must be down */
748 if (was_opened != 0 && mode_modify == 0)
749 mlx5e_close_locked(priv->ifp);
751 /* import TX coalesce mode */
/* Any non-zero value is normalised to 1. */
752 if (priv->params_ethtool.tx_coalesce_mode != 0)
753 priv->params_ethtool.tx_coalesce_mode = 1;
754 priv->params.tx_cq_moderation_mode =
755 priv->params_ethtool.tx_coalesce_mode;
757 /* restart network interface, if any */
758 if (was_opened != 0) {
759 if (mode_modify == 0)
760 mlx5e_open_locked(priv->ifp);
762 error = mlx5e_refresh_channel_params(priv);
766 case MLX5_PARAM_OFFSET(hw_lro):
767 /* network interface must be down */
769 mlx5e_close_locked(priv->ifp);
771 /* import HW LRO mode */
/* Enabling requires both a non-zero request and the lro_cap bit. */
772 if (priv->params_ethtool.hw_lro != 0 &&
773 MLX5_CAP_ETH(priv->mdev, lro_cap)) {
774 priv->params_ethtool.hw_lro = 1;
775 /* check if feature should actually be enabled */
776 if (priv->ifp->if_capenable & IFCAP_LRO) {
777 priv->params.hw_lro_en = true;
779 priv->params.hw_lro_en = false;
781 mlx5_en_warn(priv->ifp, "To enable HW LRO "
782 "please also enable LRO via ifconfig(8).\n");
785 /* return an error if HW does not support this feature */
786 if (priv->params_ethtool.hw_lro != 0)
788 priv->params.hw_lro_en = false;
789 priv->params_ethtool.hw_lro = 0;
791 /* restart network interface, if any */
793 mlx5e_open_locked(priv->ifp);
796 case MLX5_PARAM_OFFSET(cqe_zipping):
797 /* network interface must be down */
799 mlx5e_close_locked(priv->ifp);
801 /* import CQE zipping mode */
/* Enabled only when requested and the device has cqe_compression. */
802 if (priv->params_ethtool.cqe_zipping &&
803 MLX5_CAP_GEN(priv->mdev, cqe_compression)) {
804 priv->params.cqe_zipping_en = true;
805 priv->params_ethtool.cqe_zipping = 1;
807 priv->params.cqe_zipping_en = false;
808 priv->params_ethtool.cqe_zipping = 0;
810 /* restart network interface, if any */
812 mlx5e_open_locked(priv->ifp);
815 case MLX5_PARAM_OFFSET(tx_completion_fact):
816 /* network interface must be down */
818 mlx5e_close_locked(priv->ifp);
820 /* verify parameter */
821 mlx5e_ethtool_sync_tx_completion_fact(priv);
823 /* restart network interface, if any */
825 mlx5e_open_locked(priv->ifp);
828 case MLX5_PARAM_OFFSET(modify_tx_dma):
829 /* check if network interface is opened */
/* The stored flag is normalised to 0 or 1. */
831 priv->params_ethtool.modify_tx_dma =
832 priv->params_ethtool.modify_tx_dma ? 1 : 0;
833 /* modify tx according to value */
834 mlx5e_modify_tx_dma(priv, value != 0);
836 /* if closed force enable tx */
837 priv->params_ethtool.modify_tx_dma = 0;
841 case MLX5_PARAM_OFFSET(modify_rx_dma):
842 /* check if network interface is opened */
/* The stored flag is normalised to 0 or 1. */
844 priv->params_ethtool.modify_rx_dma =
845 priv->params_ethtool.modify_rx_dma ? 1 : 0;
846 /* modify rx according to value */
847 mlx5e_modify_rx_dma(priv, value != 0);
849 /* if closed force enable rx */
850 priv->params_ethtool.modify_rx_dma = 0;
/* Both diagnostics cases normalise their own flag and then push the
 * pair of flags to the device in one call. */
854 case MLX5_PARAM_OFFSET(diag_pci_enable):
855 priv->params_ethtool.diag_pci_enable =
856 priv->params_ethtool.diag_pci_enable ? 1 : 0;
858 error = -mlx5_core_set_diagnostics_full(priv->mdev,
859 priv->params_ethtool.diag_pci_enable,
860 priv->params_ethtool.diag_general_enable);
863 case MLX5_PARAM_OFFSET(diag_general_enable):
864 priv->params_ethtool.diag_general_enable =
865 priv->params_ethtool.diag_general_enable ? 1 : 0;
867 error = -mlx5_core_set_diagnostics_full(priv->mdev,
868 priv->params_ethtool.diag_pci_enable,
869 priv->params_ethtool.diag_general_enable);
872 case MLX5_PARAM_OFFSET(mc_local_lb):
873 priv->params_ethtool.mc_local_lb =
874 priv->params_ethtool.mc_local_lb ? 1 : 0;
/*
 * NOTE(review): unlike the diagnostics calls above, the result of
 * mlx5_nic_vport_modify_local_lb() is stored without negation in this
 * case and the next one; confirm the sign convention of that function.
 */
876 if (MLX5_CAP_GEN(priv->mdev, disable_local_lb)) {
877 error = mlx5_nic_vport_modify_local_lb(priv->mdev,
878 MLX5_LOCAL_MC_LB, priv->params_ethtool.mc_local_lb);
884 case MLX5_PARAM_OFFSET(uc_local_lb):
885 priv->params_ethtool.uc_local_lb =
886 priv->params_ethtool.uc_local_lb ? 1 : 0;
888 if (MLX5_CAP_GEN(priv->mdev, disable_local_lb)) {
889 error = mlx5_nic_vport_modify_local_lb(priv->mdev,
890 MLX5_LOCAL_UC_LB, priv->params_ethtool.uc_local_lb);
/*
 * Name/description string table for the configuration parameters,
 * generated by expanding MLX5E_PARAMS with MLX5E_STATS_DESC. Users in
 * this file read entry 2 * x as the name of parameter x and entry
 * 2 * x + 1 as its description.
 */
904 static const char *mlx5e_params_desc[] = {
905 MLX5E_PARAMS(MLX5E_STATS_DESC)
/*
 * Name/description string table for the port debug statistics, generated
 * by expanding MLX5E_PORT_STATS_DEBUG with MLX5E_STATS_DESC. It is passed
 * as the desc argument of mlx5e_create_stats() in this file.
 */
908 static const char *mlx5e_port_stats_debug_desc[] = {
909 MLX5E_PORT_STATS_DEBUG(MLX5E_STATS_DESC)
/*
 * mlx5e_ethtool_debug_channel_info: read-only sysctl handler that prints
 * the interrupt, queue and completion queue numbers used by the driver.
 *
 * The text is produced through an sbuf bound to the sysctl request. It
 * contains one line each for the pages, command and async interrupts,
 * then one line per channel for the receive queue and one line per
 * channel and traffic class for the send queue. When the interface is
 * not open, queue and completion queue numbers are printed as -1.
 *
 * NOTE(review): the assignment of priv, locking, several declarations,
 * the statements taken on the error paths, one argument of the second
 * per-channel sbuf_printf() call, the sbuf teardown and the return
 * statement are absent from this listing.
 */
913 mlx5e_ethtool_debug_channel_info(SYSCTL_HANDLER_ARGS)
915 struct mlx5e_priv *priv;
917 struct mlx5e_channel *c;
924 error = sysctl_wire_old_buffer(req, 0);
927 if (sbuf_new_for_sysctl(&sb, NULL, 1024, req) == NULL)
929 sbuf_clear_flags(&sb, SBUF_INCLUDENUL);
/* Queue objects are only dereferenced below when this is non-zero. */
932 opened = test_bit(MLX5E_STATE_OPENED, &priv->state);
934 sbuf_printf(&sb, "pages irq %d\n",
935 priv->mdev->priv.msix_arr[MLX5_EQ_VEC_PAGES].vector);
936 sbuf_printf(&sb, "command irq %d\n",
937 priv->mdev->priv.msix_arr[MLX5_EQ_VEC_CMD].vector);
938 sbuf_printf(&sb, "async irq %d\n",
939 priv->mdev->priv.msix_arr[MLX5_EQ_VEC_ASYNC].vector);
941 for (i = 0; i != priv->params.num_channels; i++) {
942 int eqn_not_used = -1;
943 int irqn = MLX5_EQ_VEC_COMP_BASE;
/* Look up the interrupt index for channel i; the EQ number is unused. */
945 if (mlx5_vector2eqn(priv->mdev, i, &eqn_not_used, &irqn) != 0)
948 c = opened ? &priv->channel[i] : NULL;
949 rq = opened ? &c->rq : NULL;
950 sbuf_printf(&sb, "channel %d rq %d cq %d irq %d\n", i,
951 opened ? rq->rqn : -1,
952 opened ? rq->cq.mcq.cqn : -1,
953 priv->mdev->priv.msix_arr[irqn].vector);
955 for (tc = 0; tc != priv->num_tc; tc++) {
956 sq = opened ? &c->sq[tc] : NULL;
957 sbuf_printf(&sb, "channel %d tc %d sq %d cq %d irq %d\n",
959 opened ? sq->sqn : -1,
960 opened ? sq->cq.mcq.cqn : -1,
961 priv->mdev->priv.msix_arr[irqn].vector);
965 error = sbuf_finish(&sb);
/*
 * mlx5e_ethtool_debug_stats: sysctl handler that switches the extended
 * debug statistics on and off.
 *
 * arg1 is the struct mlx5e_priv. The current setting, priv->sysctl_debug,
 * is exposed through sysctl_handle_int(). A written value is normalised
 * to 0 or 1. When it differs from the current setting it is stored and
 * the debug sysctl entries are either created in the
 * stats.port_stats_debug.ctx context or that context is freed.
 *
 * NOTE(review): locking, the statements taken when the device is gone or
 * nothing changed, the name argument of the SYSCTL_ADD_PROC call, the
 * else keyword before the free and the return statement are absent from
 * this listing.
 */
971 mlx5e_ethtool_debug_stats(SYSCTL_HANDLER_ARGS)
973 struct mlx5e_priv *priv = arg1;
978 if (priv->gone != 0) {
982 sys_debug = priv->sysctl_debug;
983 error = sysctl_handle_int(oidp, &sys_debug, 0, req);
984 if (error != 0 || !req->newptr)
986 sys_debug = sys_debug ? 1 : 0;
987 if (sys_debug == priv->sysctl_debug)
/* Store the new setting and branch on it in one expression. */
990 if ((priv->sysctl_debug = sys_debug)) {
991 mlx5e_create_stats(&priv->stats.port_stats_debug.ctx,
992 SYSCTL_CHILDREN(priv->sysctl_ifnet), "debug_stats",
993 mlx5e_port_stats_debug_desc, MLX5E_PORT_STATS_DEBUG_NUM,
994 priv->stats.port_stats_debug.arg);
/* The channel info entry shares the context so it is freed with it. */
995 SYSCTL_ADD_PROC(&priv->stats.port_stats_debug.ctx,
996 SYSCTL_CHILDREN(priv->sysctl_ifnet), OID_AUTO,
998 CTLFLAG_RD | CTLFLAG_MPSAFE | CTLTYPE_STRING, priv, 0,
999 mlx5e_ethtool_debug_channel_info, "S", "");
1001 sysctl_ctx_free(&priv->stats.port_stats_debug.ctx);
/*
 * mlx5e_create_diagnostics: create the read-only diagnostics sysctl node
 * and one unsigned 64-bit leaf per diagnostics counter.
 *
 * The node is added under priv->sysctl_ifnet in the priv->sysctl_ctx
 * context. PCI counters are backed by priv->params_pci.array and general
 * counters by priv->params_general.array, both indexed by the position of
 * the counter in its table. Each counter is first passed to
 * mlx5_core_supports_diagnostics().
 *
 * NOTE(review): the statement taken when that support check yields zero
 * is absent from this listing (presumably the counter is skipped), as
 * are the check of node, the declaration of x and the braces.
 */
1009 mlx5e_create_diagnostics(struct mlx5e_priv *priv)
1011 struct mlx5_core_diagnostics_entry entry;
1012 struct sysctl_ctx_list *ctx;
1013 struct sysctl_oid *node;
1016 /* sysctl context we are using */
1017 ctx = &priv->sysctl_ctx;
1019 /* create root node */
1020 node = SYSCTL_ADD_NODE(ctx,
1021 SYSCTL_CHILDREN(priv->sysctl_ifnet), OID_AUTO,
1022 "diagnostics", CTLFLAG_RD, NULL, "Diagnostics");
1026 /* create PCI diagnostics */
1027 for (x = 0; x != MLX5_CORE_PCI_DIAGNOSTICS_NUM; x++) {
1028 entry = mlx5_core_pci_diagnostics_table[x];
1029 if (mlx5_core_supports_diagnostics(priv->mdev, entry.counter_id) == 0)
/* The leaf is named after the description string of the table entry. */
1031 SYSCTL_ADD_UQUAD(ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1032 entry.desc, CTLFLAG_RD, priv->params_pci.array + x,
1033 "PCI diagnostics counter");
1036 /* create general diagnostics */
1037 for (x = 0; x != MLX5_CORE_GENERAL_DIAGNOSTICS_NUM; x++) {
1038 entry = mlx5_core_general_diagnostics_table[x];
1039 if (mlx5_core_supports_diagnostics(priv->mdev, entry.counter_id) == 0)
1041 SYSCTL_ADD_UQUAD(ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1042 entry.desc, CTLFLAG_RD, priv->params_general.array + x,
1043 "General diagnostics counter");
/*
 * mlx5e_create_ethtool: initialise params_ethtool from the active
 * parameters and create the configuration sysctl tree.
 *
 * Visible steps, in order:
 *  - seed the params_ethtool fields from priv->params and from fixed
 *    limits, then normalise the TX completion factor;
 *  - when the device reports disable_local_lb, query the multicast and
 *    unicast local loopback defaults;
 *  - create the conf node and one 64-bit entry per parameter, all served
 *    by mlx5e_ethtool_handler with the parameter index as arg2;
 *  - add the debug_stats and device_name entries and the diagnostics
 *    node;
 *  - create the qos node and, for each QoS feature whose initial query
 *    returns zero, the matching handler entry.
 *
 * NOTE(review): this listing omits short lines throughout (braces, error
 * checks, else keywords, endif lines, several declarations and parts of
 * some argument lists) and the end of the function is not visible.
 */
1048 mlx5e_create_ethtool(struct mlx5e_priv *priv)
1050 struct sysctl_oid *node, *qos_node;
1051 const char *pnameunit;
1052 struct mlx5e_port_buffer port_buffer;
1056 /* set some defaults */
1057 priv->params_ethtool.tx_queue_size_max = 1 << MLX5E_PARAMS_MAXIMUM_LOG_SQ_SIZE;
1058 priv->params_ethtool.rx_queue_size_max = 1 << MLX5E_PARAMS_MAXIMUM_LOG_RQ_SIZE;
1059 priv->params_ethtool.tx_queue_size = 1 << priv->params.log_sq_size;
1060 priv->params_ethtool.rx_queue_size = 1 << priv->params.log_rq_size;
1061 priv->params_ethtool.channels = priv->params.num_channels;
1062 priv->params_ethtool.channels_rsss = priv->params.channels_rsss;
1063 priv->params_ethtool.coalesce_pkts_max = MLX5E_FLD_MAX(cqc, cq_max_count);
1064 priv->params_ethtool.coalesce_usecs_max = MLX5E_FLD_MAX(cqc, cq_period);
1065 priv->params_ethtool.rx_coalesce_mode = priv->params.rx_cq_moderation_mode;
1066 priv->params_ethtool.rx_coalesce_usecs = priv->params.rx_cq_moderation_usec;
1067 priv->params_ethtool.rx_coalesce_pkts = priv->params.rx_cq_moderation_pkts;
1068 priv->params_ethtool.tx_coalesce_mode = priv->params.tx_cq_moderation_mode;
1069 priv->params_ethtool.tx_coalesce_usecs = priv->params.tx_cq_moderation_usec;
1070 priv->params_ethtool.tx_coalesce_pkts = priv->params.tx_cq_moderation_pkts;
1071 priv->params_ethtool.hw_lro = priv->params.hw_lro_en;
1072 priv->params_ethtool.cqe_zipping = priv->params.cqe_zipping_en;
/* Derives tx_completion_fact_max and clamps tx_completion_fact. */
1073 mlx5e_ethtool_sync_tx_completion_fact(priv);
1075 /* get default values for local loopback, if any */
1076 if (MLX5_CAP_GEN(priv->mdev, disable_local_lb)) {
1080 err = mlx5_nic_vport_query_local_lb(priv->mdev, MLX5_LOCAL_MC_LB, &val);
1082 priv->params_ethtool.mc_local_lb = val;
1084 err = mlx5_nic_vport_query_local_lb(priv->mdev, MLX5_LOCAL_UC_LB, &val);
1086 priv->params_ethtool.uc_local_lb = val;
1089 /* create root node */
1090 node = SYSCTL_ADD_NODE(&priv->sysctl_ctx,
1091 SYSCTL_CHILDREN(priv->sysctl_ifnet), OID_AUTO,
1092 "conf", CTLFLAG_RW, NULL, "Configuration");
1095 for (x = 0; x != MLX5E_PARAMS_NUM; x++) {
1096 /* check for read-only parameter */
/* Read-only status is decided purely by the parameter name. */
1097 if (strstr(mlx5e_params_desc[2 * x], "_max") != NULL ||
1098 strstr(mlx5e_params_desc[2 * x], "_mtu") != NULL) {
1099 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1100 mlx5e_params_desc[2 * x], CTLTYPE_U64 | CTLFLAG_RD |
1101 CTLFLAG_MPSAFE, priv, x, &mlx5e_ethtool_handler, "QU",
1102 mlx5e_params_desc[2 * x + 1]);
1104 #if (__FreeBSD_version < 1100000)
1108 * NOTE: In FreeBSD-11 and newer the
1109 * CTLFLAG_RWTUN flag will take care of
1110 * loading default sysctl value from the
1111 * kernel environment, if any:
1113 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1114 mlx5e_params_desc[2 * x], CTLTYPE_U64 | CTLFLAG_RWTUN |
1115 CTLFLAG_MPSAFE, priv, x, &mlx5e_ethtool_handler, "QU",
1116 mlx5e_params_desc[2 * x + 1]);
1118 #if (__FreeBSD_version < 1100000)
1119 /* compute path for sysctl */
1120 snprintf(path, sizeof(path), "dev.mce.%d.conf.%s",
1121 device_get_unit(priv->mdev->pdev->dev.bsddev),
1122 mlx5e_params_desc[2 * x]);
1124 /* try to fetch tunable, if any */
/* On older systems the handler is invoked directly, without a request,
 * to apply a value fetched from the kernel environment. */
1125 if (TUNABLE_QUAD_FETCH(path, &priv->params_ethtool.arg[x]))
1126 mlx5e_ethtool_handler(NULL, priv, x, NULL);
1131 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(node), OID_AUTO,
1132 "debug_stats", CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, priv,
1133 0, &mlx5e_ethtool_debug_stats, "I", "Extended debug statistics");
1135 pnameunit = device_get_nameunit(priv->mdev->pdev->dev.bsddev);
1137 SYSCTL_ADD_STRING(&priv->sysctl_ctx, SYSCTL_CHILDREN(node),
1138 OID_AUTO, "device_name", CTLFLAG_RD,
1139 __DECONST(void *, pnameunit), 0,
1142 /* Diagnostics support */
1143 mlx5e_create_diagnostics(priv);
1145 /* create qos node */
1146 qos_node = SYSCTL_ADD_NODE(&priv->sysctl_ctx,
1147 SYSCTL_CHILDREN(node), OID_AUTO,
1148 "qos", CTLFLAG_RW, NULL, "Quality Of Service configuration");
1149 if (qos_node == NULL)
1152 /* Priority rate limit support */
1153 if (mlx5e_getmaxrate(priv) == 0) {
1154 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1155 OID_AUTO, "tc_max_rate", CTLTYPE_U64 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1156 priv, 0, mlx5e_tc_maxrate_handler, "QU",
1157 "Max rate for priority, specified in kilobits, where kilo=1000, "
1158 "max_rate must be divisible by 100000");
1161 /* Bandwidth limiting by ratio */
/*
 * NOTE(review): the format string below is QU while the type flag is
 * CTLTYPE_U8 and the other 8-bit entries in this function use CU;
 * confirm which one is intended.
 */
1162 if (mlx5e_get_max_alloc(priv) == 0) {
1163 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1164 OID_AUTO, "tc_rate_share", CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1165 priv, 0, mlx5e_tc_rate_share_handler, "QU",
1166 "Specify bandwidth ratio from 1 to 100 "
1167 "for the available traffic classes");
1170 /* Priority to traffic class mapping */
1171 if (mlx5e_get_prio_tc(priv) == 0) {
1172 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1173 OID_AUTO, "prio_0_7_tc", CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1174 priv, 0, mlx5e_prio_to_tc_handler, "CU",
1175 "Set traffic class 0 to 7 for priority 0 to 7 inclusivly");
/* One entry per group of eight DSCP values; the first index of the
 * group is passed to the handler as arg2. */
1179 if (mlx5e_get_dscp(priv) == 0) {
1180 for (i = 0; i != MLX5_MAX_SUPPORTED_DSCP; i += 8) {
1182 snprintf(name, sizeof(name), "dscp_%d_%d_prio", i, i + 7);
1183 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1184 OID_AUTO, name, CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1185 priv, i, mlx5e_dscp_prio_handler, "CU",
1186 "Set DSCP to priority mapping, 0..7");
1188 #define A "Set trust state, 1:PCP 2:DSCP"
/* The description text depends on the qpts_trust_both feature bit; the
 * remaining operands of the conditional are not visible in this
 * listing. */
1190 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1191 OID_AUTO, "trust_state", CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1192 priv, 0, mlx5e_trust_state_handler, "CU",
1193 MLX5_CAP_QCAM_FEATURE(priv->mdev, qpts_trust_both) ?
/* The three buffer entries are created only when the port buffer query
 * returns zero. */
1199 if (mlx5e_port_query_buffer(priv, &port_buffer) == 0) {
1200 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1201 OID_AUTO, "buffers_size",
1202 CTLTYPE_U32 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1203 priv, 0, mlx5e_buf_size_handler, "IU",
1204 "Set buffers sizes");
1205 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1206 OID_AUTO, "buffers_prio",
1207 CTLTYPE_U8 | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1208 priv, 0, mlx5e_buf_prio_handler, "CU",
1209 "Set prio to buffers mapping");
1210 SYSCTL_ADD_PROC(&priv->sysctl_ctx, SYSCTL_CHILDREN(qos_node),
1211 OID_AUTO, "cable_length",
1212 CTLTYPE_UINT | CTLFLAG_RWTUN | CTLFLAG_MPSAFE,
1213 priv, 0, mlx5e_cable_length_handler, "IU",
1214 "Set cable length in meters for xoff threshold calculation");