2 * Copyright (c) 2016, Mellanox Technologies. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
32 #include <linux/device.h>
33 #include <linux/netdevice.h>
36 #include "en/port_buffer.h"
38 #define MLX5E_MAX_BW_ALLOC 100 /* Max percentage of BW allocation */
40 #define MLX5E_100MB (100000)
41 #define MLX5E_1GB (1000000)
43 #define MLX5E_CEE_STATE_UP 1
44 #define MLX5E_CEE_STATE_DOWN 0
46 /* Max supported cable length is 1000 meters */
47 #define MLX5E_MAX_CABLE_LENGTH 1000
50 MLX5E_VENDOR_TC_GROUP_NUM = 7,
51 MLX5E_LOWEST_PRIO_GROUP = 0,
57 MLX5_DCB_CHG_NO_RESET,
60 #define MLX5_DSCP_SUPPORTED(mdev) (MLX5_CAP_GEN(mdev, qcam_reg) && \
61 MLX5_CAP_QCAM_REG(mdev, qpts) && \
62 MLX5_CAP_QCAM_REG(mdev, qpdpm))
64 static int mlx5e_set_trust_state(struct mlx5e_priv *priv, u8 trust_state);
65 static int mlx5e_set_dscp2prio(struct mlx5e_priv *priv, u8 dscp, u8 prio);
67 /* If dcbx mode is non-host set the dcbx mode to host.
69 static int mlx5e_dcbnl_set_dcbx_mode(struct mlx5e_priv *priv,
70 enum mlx5_dcbx_oper_mode mode)
72 struct mlx5_core_dev *mdev = priv->mdev;
73 u32 param[MLX5_ST_SZ_DW(dcbx_param)];
76 err = mlx5_query_port_dcbx_param(mdev, param);
80 MLX5_SET(dcbx_param, param, version_admin, mode);
81 if (mode != MLX5E_DCBX_PARAM_VER_OPER_HOST)
82 MLX5_SET(dcbx_param, param, willing_admin, 1);
84 return mlx5_set_port_dcbx_param(mdev, param);
87 static int mlx5e_dcbnl_switch_to_host_mode(struct mlx5e_priv *priv)
89 struct mlx5e_dcbx *dcbx = &priv->dcbx;
92 if (!MLX5_CAP_GEN(priv->mdev, dcbx))
95 if (dcbx->mode == MLX5E_DCBX_PARAM_VER_OPER_HOST)
98 err = mlx5e_dcbnl_set_dcbx_mode(priv, MLX5E_DCBX_PARAM_VER_OPER_HOST);
102 dcbx->mode = MLX5E_DCBX_PARAM_VER_OPER_HOST;
106 static int mlx5e_dcbnl_ieee_getets(struct net_device *netdev,
107 struct ieee_ets *ets)
109 struct mlx5e_priv *priv = netdev_priv(netdev);
110 struct mlx5_core_dev *mdev = priv->mdev;
111 u8 tc_group[IEEE_8021QAZ_MAX_TCS];
112 bool is_tc_group_6_exist = false;
113 bool is_zero_bw_ets_tc = false;
117 if (!MLX5_CAP_GEN(priv->mdev, ets))
120 ets->ets_cap = mlx5_max_tc(priv->mdev) + 1;
121 for (i = 0; i < ets->ets_cap; i++) {
122 err = mlx5_query_port_prio_tc(mdev, i, &ets->prio_tc[i]);
126 err = mlx5_query_port_tc_group(mdev, i, &tc_group[i]);
130 err = mlx5_query_port_tc_bw_alloc(mdev, i, &ets->tc_tx_bw[i]);
134 if (ets->tc_tx_bw[i] < MLX5E_MAX_BW_ALLOC &&
135 tc_group[i] == (MLX5E_LOWEST_PRIO_GROUP + 1))
136 is_zero_bw_ets_tc = true;
138 if (tc_group[i] == (MLX5E_VENDOR_TC_GROUP_NUM - 1))
139 is_tc_group_6_exist = true;
142 /* Report 0% ets tc if exits*/
143 if (is_zero_bw_ets_tc) {
144 for (i = 0; i < ets->ets_cap; i++)
145 if (tc_group[i] == MLX5E_LOWEST_PRIO_GROUP)
146 ets->tc_tx_bw[i] = 0;
149 /* Update tc_tsa based on fw setting*/
150 for (i = 0; i < ets->ets_cap; i++) {
151 if (ets->tc_tx_bw[i] < MLX5E_MAX_BW_ALLOC)
152 priv->dcbx.tc_tsa[i] = IEEE_8021QAZ_TSA_ETS;
153 else if (tc_group[i] == MLX5E_VENDOR_TC_GROUP_NUM &&
154 !is_tc_group_6_exist)
155 priv->dcbx.tc_tsa[i] = IEEE_8021QAZ_TSA_VENDOR;
157 memcpy(ets->tc_tsa, priv->dcbx.tc_tsa, sizeof(ets->tc_tsa));
162 static void mlx5e_build_tc_group(struct ieee_ets *ets, u8 *tc_group, int max_tc)
164 bool any_tc_mapped_to_ets = false;
165 bool ets_zero_bw = false;
169 for (i = 0; i <= max_tc; i++) {
170 if (ets->tc_tsa[i] == IEEE_8021QAZ_TSA_ETS) {
171 any_tc_mapped_to_ets = true;
172 if (!ets->tc_tx_bw[i])
177 /* strict group has higher priority than ets group */
178 strict_group = MLX5E_LOWEST_PRIO_GROUP;
179 if (any_tc_mapped_to_ets)
184 for (i = 0; i <= max_tc; i++) {
185 switch (ets->tc_tsa[i]) {
186 case IEEE_8021QAZ_TSA_VENDOR:
187 tc_group[i] = MLX5E_VENDOR_TC_GROUP_NUM;
189 case IEEE_8021QAZ_TSA_STRICT:
190 tc_group[i] = strict_group++;
192 case IEEE_8021QAZ_TSA_ETS:
193 tc_group[i] = MLX5E_LOWEST_PRIO_GROUP;
194 if (ets->tc_tx_bw[i] && ets_zero_bw)
195 tc_group[i] = MLX5E_LOWEST_PRIO_GROUP + 1;
201 static void mlx5e_build_tc_tx_bw(struct ieee_ets *ets, u8 *tc_tx_bw,
202 u8 *tc_group, int max_tc)
204 int bw_for_ets_zero_bw_tc = 0;
205 int last_ets_zero_bw_tc = -1;
206 int num_ets_zero_bw = 0;
209 for (i = 0; i <= max_tc; i++) {
210 if (ets->tc_tsa[i] == IEEE_8021QAZ_TSA_ETS &&
213 last_ets_zero_bw_tc = i;
218 bw_for_ets_zero_bw_tc = MLX5E_MAX_BW_ALLOC / num_ets_zero_bw;
220 for (i = 0; i <= max_tc; i++) {
221 switch (ets->tc_tsa[i]) {
222 case IEEE_8021QAZ_TSA_VENDOR:
223 tc_tx_bw[i] = MLX5E_MAX_BW_ALLOC;
225 case IEEE_8021QAZ_TSA_STRICT:
226 tc_tx_bw[i] = MLX5E_MAX_BW_ALLOC;
228 case IEEE_8021QAZ_TSA_ETS:
229 tc_tx_bw[i] = ets->tc_tx_bw[i] ?
231 bw_for_ets_zero_bw_tc;
236 /* Make sure the total bw for ets zero bw group is 100% */
237 if (last_ets_zero_bw_tc != -1)
238 tc_tx_bw[last_ets_zero_bw_tc] +=
239 MLX5E_MAX_BW_ALLOC % num_ets_zero_bw;
242 /* If there are ETS BW 0,
243 * Set ETS group # to 1 for all ETS non zero BW tcs. Their sum must be 100%.
244 * Set group #0 to all the ETS BW 0 tcs and
245 * equally splits the 100% BW between them
246 * Report both group #0 and #1 as ETS type.
247 * All the tcs in group #0 will be reported with 0% BW.
249 static int mlx5e_dcbnl_ieee_setets_core(struct mlx5e_priv *priv, struct ieee_ets *ets)
251 struct mlx5_core_dev *mdev = priv->mdev;
252 u8 tc_tx_bw[IEEE_8021QAZ_MAX_TCS];
253 u8 tc_group[IEEE_8021QAZ_MAX_TCS];
254 int max_tc = mlx5_max_tc(mdev);
257 mlx5e_build_tc_group(ets, tc_group, max_tc);
258 mlx5e_build_tc_tx_bw(ets, tc_tx_bw, tc_group, max_tc);
260 err = mlx5_set_port_prio_tc(mdev, ets->prio_tc);
264 err = mlx5_set_port_tc_group(mdev, tc_group);
268 err = mlx5_set_port_tc_bw_alloc(mdev, tc_tx_bw);
273 memcpy(priv->dcbx.tc_tsa, ets->tc_tsa, sizeof(ets->tc_tsa));
275 for (i = 0; i < IEEE_8021QAZ_MAX_TCS; i++) {
276 mlx5e_dbg(HW, priv, "%s: prio_%d <=> tc_%d\n",
277 __func__, i, ets->prio_tc[i]);
278 mlx5e_dbg(HW, priv, "%s: tc_%d <=> tx_bw_%d%%, group_%d\n",
279 __func__, i, tc_tx_bw[i], tc_group[i]);
285 static int mlx5e_dbcnl_validate_ets(struct net_device *netdev,
286 struct ieee_ets *ets,
287 bool zero_sum_allowed)
289 bool have_ets_tc = false;
293 /* Validate Priority */
294 for (i = 0; i < IEEE_8021QAZ_MAX_TCS; i++) {
295 if (ets->prio_tc[i] >= MLX5E_MAX_PRIORITY) {
297 "Failed to validate ETS: priority value greater than max(%d)\n",
303 /* Validate Bandwidth Sum */
304 for (i = 0; i < IEEE_8021QAZ_MAX_TCS; i++) {
305 if (ets->tc_tsa[i] == IEEE_8021QAZ_TSA_ETS) {
307 bw_sum += ets->tc_tx_bw[i];
311 if (have_ets_tc && bw_sum != 100) {
312 if (bw_sum || (!bw_sum && !zero_sum_allowed))
314 "Failed to validate ETS: BW sum is illegal\n");
320 static int mlx5e_dcbnl_ieee_setets(struct net_device *netdev,
321 struct ieee_ets *ets)
323 struct mlx5e_priv *priv = netdev_priv(netdev);
326 if (!MLX5_CAP_GEN(priv->mdev, ets))
329 err = mlx5e_dbcnl_validate_ets(netdev, ets, false);
333 err = mlx5e_dcbnl_ieee_setets_core(priv, ets);
340 static int mlx5e_dcbnl_ieee_getpfc(struct net_device *dev,
341 struct ieee_pfc *pfc)
343 struct mlx5e_priv *priv = netdev_priv(dev);
344 struct mlx5_core_dev *mdev = priv->mdev;
345 struct mlx5e_pport_stats *pstats = &priv->stats.pport;
348 pfc->pfc_cap = mlx5_max_tc(mdev) + 1;
349 for (i = 0; i < IEEE_8021QAZ_MAX_TCS; i++) {
350 pfc->requests[i] = PPORT_PER_PRIO_GET(pstats, i, tx_pause);
351 pfc->indications[i] = PPORT_PER_PRIO_GET(pstats, i, rx_pause);
354 if (MLX5_BUFFER_SUPPORTED(mdev))
355 pfc->delay = priv->dcbx.cable_len;
357 return mlx5_query_port_pfc(mdev, &pfc->pfc_en, NULL);
360 static int mlx5e_dcbnl_ieee_setpfc(struct net_device *dev,
361 struct ieee_pfc *pfc)
363 struct mlx5e_priv *priv = netdev_priv(dev);
364 struct mlx5_core_dev *mdev = priv->mdev;
365 u32 old_cable_len = priv->dcbx.cable_len;
366 struct ieee_pfc pfc_new;
372 mlx5_query_port_pfc(mdev, &curr_pfc_en, NULL);
373 if (pfc->pfc_en != curr_pfc_en) {
374 ret = mlx5_set_port_pfc(mdev, pfc->pfc_en, pfc->pfc_en);
377 mlx5_toggle_port_link(mdev);
378 changed |= MLX5E_PORT_BUFFER_PFC;
382 pfc->delay < MLX5E_MAX_CABLE_LENGTH &&
383 pfc->delay != priv->dcbx.cable_len) {
384 priv->dcbx.cable_len = pfc->delay;
385 changed |= MLX5E_PORT_BUFFER_CABLE_LEN;
388 if (MLX5_BUFFER_SUPPORTED(mdev)) {
389 pfc_new.pfc_en = (changed & MLX5E_PORT_BUFFER_PFC) ? pfc->pfc_en : curr_pfc_en;
390 if (priv->dcbx.manual_buffer)
391 ret = mlx5e_port_manual_buffer_config(priv, changed,
395 if (ret && (changed & MLX5E_PORT_BUFFER_CABLE_LEN))
396 priv->dcbx.cable_len = old_cable_len;
401 "%s: PFC per priority bit mask: 0x%x\n",
402 __func__, pfc->pfc_en);
407 static u8 mlx5e_dcbnl_getdcbx(struct net_device *dev)
409 struct mlx5e_priv *priv = netdev_priv(dev);
411 return priv->dcbx.cap;
414 static u8 mlx5e_dcbnl_setdcbx(struct net_device *dev, u8 mode)
416 struct mlx5e_priv *priv = netdev_priv(dev);
417 struct mlx5e_dcbx *dcbx = &priv->dcbx;
419 if (mode & DCB_CAP_DCBX_LLD_MANAGED)
422 if ((!mode) && MLX5_CAP_GEN(priv->mdev, dcbx)) {
423 if (dcbx->mode == MLX5E_DCBX_PARAM_VER_OPER_AUTO)
426 /* set dcbx to fw controlled */
427 if (!mlx5e_dcbnl_set_dcbx_mode(priv, MLX5E_DCBX_PARAM_VER_OPER_AUTO)) {
428 dcbx->mode = MLX5E_DCBX_PARAM_VER_OPER_AUTO;
429 dcbx->cap &= ~DCB_CAP_DCBX_HOST;
436 if (!(mode & DCB_CAP_DCBX_HOST))
439 if (mlx5e_dcbnl_switch_to_host_mode(netdev_priv(dev)))
447 static int mlx5e_dcbnl_ieee_setapp(struct net_device *dev, struct dcb_app *app)
449 struct mlx5e_priv *priv = netdev_priv(dev);
454 if (!MLX5_CAP_GEN(priv->mdev, vport_group_manager) ||
455 !MLX5_DSCP_SUPPORTED(priv->mdev))
458 if ((app->selector != IEEE_8021QAZ_APP_SEL_DSCP) ||
459 (app->protocol >= MLX5E_MAX_DSCP))
462 /* Save the old entry info */
463 temp.selector = IEEE_8021QAZ_APP_SEL_DSCP;
464 temp.protocol = app->protocol;
465 temp.priority = priv->dcbx_dp.dscp2prio[app->protocol];
467 /* Check if need to switch to dscp trust state */
468 if (!priv->dcbx.dscp_app_cnt) {
469 err = mlx5e_set_trust_state(priv, MLX5_QPTS_TRUST_DSCP);
474 /* Skip the fw command if new and old mapping are the same */
475 if (app->priority != priv->dcbx_dp.dscp2prio[app->protocol]) {
476 err = mlx5e_set_dscp2prio(priv, app->protocol, app->priority);
481 /* Delete the old entry if exists */
483 err = dcb_ieee_delapp(dev, &temp);
487 /* Add new entry and update counter */
488 err = dcb_ieee_setapp(dev, app);
493 priv->dcbx.dscp_app_cnt++;
498 mlx5e_set_trust_state(priv, MLX5_QPTS_TRUST_PCP);
502 static int mlx5e_dcbnl_ieee_delapp(struct net_device *dev, struct dcb_app *app)
504 struct mlx5e_priv *priv = netdev_priv(dev);
507 if (!MLX5_CAP_GEN(priv->mdev, vport_group_manager) ||
508 !MLX5_DSCP_SUPPORTED(priv->mdev))
511 if ((app->selector != IEEE_8021QAZ_APP_SEL_DSCP) ||
512 (app->protocol >= MLX5E_MAX_DSCP))
515 /* Skip if no dscp app entry */
516 if (!priv->dcbx.dscp_app_cnt)
519 /* Check if the entry matches fw setting */
520 if (app->priority != priv->dcbx_dp.dscp2prio[app->protocol])
523 /* Delete the app entry */
524 err = dcb_ieee_delapp(dev, app);
528 /* Reset the priority mapping back to zero */
529 err = mlx5e_set_dscp2prio(priv, app->protocol, 0);
533 priv->dcbx.dscp_app_cnt--;
535 /* Check if need to switch to pcp trust state */
536 if (!priv->dcbx.dscp_app_cnt)
537 err = mlx5e_set_trust_state(priv, MLX5_QPTS_TRUST_PCP);
542 mlx5e_set_trust_state(priv, MLX5_QPTS_TRUST_PCP);
546 static int mlx5e_dcbnl_ieee_getmaxrate(struct net_device *netdev,
547 struct ieee_maxrate *maxrate)
549 struct mlx5e_priv *priv = netdev_priv(netdev);
550 struct mlx5_core_dev *mdev = priv->mdev;
551 u8 max_bw_value[IEEE_8021QAZ_MAX_TCS];
552 u8 max_bw_unit[IEEE_8021QAZ_MAX_TCS];
556 err = mlx5_query_port_ets_rate_limit(mdev, max_bw_value, max_bw_unit);
560 memset(maxrate->tc_maxrate, 0, sizeof(maxrate->tc_maxrate));
562 for (i = 0; i <= mlx5_max_tc(mdev); i++) {
563 switch (max_bw_unit[i]) {
564 case MLX5_100_MBPS_UNIT:
565 maxrate->tc_maxrate[i] = max_bw_value[i] * MLX5E_100MB;
568 maxrate->tc_maxrate[i] = max_bw_value[i] * MLX5E_1GB;
570 case MLX5_BW_NO_LIMIT:
573 WARN(true, "non-supported BW unit");
581 static int mlx5e_dcbnl_ieee_setmaxrate(struct net_device *netdev,
582 struct ieee_maxrate *maxrate)
584 struct mlx5e_priv *priv = netdev_priv(netdev);
585 struct mlx5_core_dev *mdev = priv->mdev;
586 u8 max_bw_value[IEEE_8021QAZ_MAX_TCS];
587 u8 max_bw_unit[IEEE_8021QAZ_MAX_TCS];
588 __u64 upper_limit_mbps = roundup(255 * MLX5E_100MB, MLX5E_1GB);
591 memset(max_bw_value, 0, sizeof(max_bw_value));
592 memset(max_bw_unit, 0, sizeof(max_bw_unit));
594 for (i = 0; i <= mlx5_max_tc(mdev); i++) {
595 if (!maxrate->tc_maxrate[i]) {
596 max_bw_unit[i] = MLX5_BW_NO_LIMIT;
599 if (maxrate->tc_maxrate[i] < upper_limit_mbps) {
600 max_bw_value[i] = div_u64(maxrate->tc_maxrate[i],
602 max_bw_value[i] = max_bw_value[i] ? max_bw_value[i] : 1;
603 max_bw_unit[i] = MLX5_100_MBPS_UNIT;
605 max_bw_value[i] = div_u64(maxrate->tc_maxrate[i],
607 max_bw_unit[i] = MLX5_GBPS_UNIT;
611 for (i = 0; i < IEEE_8021QAZ_MAX_TCS; i++) {
612 mlx5e_dbg(HW, priv, "%s: tc_%d <=> max_bw %d Gbps\n",
613 __func__, i, max_bw_value[i]);
616 return mlx5_modify_port_ets_rate_limit(mdev, max_bw_value, max_bw_unit);
619 static u8 mlx5e_dcbnl_setall(struct net_device *netdev)
621 struct mlx5e_priv *priv = netdev_priv(netdev);
622 struct mlx5e_cee_config *cee_cfg = &priv->dcbx.cee_cfg;
623 struct mlx5_core_dev *mdev = priv->mdev;
626 int err = -EOPNOTSUPP;
629 if (!MLX5_CAP_GEN(mdev, ets))
632 memset(&ets, 0, sizeof(ets));
633 memset(&pfc, 0, sizeof(pfc));
635 ets.ets_cap = IEEE_8021QAZ_MAX_TCS;
636 for (i = 0; i < CEE_DCBX_MAX_PGS; i++) {
637 ets.tc_tx_bw[i] = cee_cfg->pg_bw_pct[i];
638 ets.tc_rx_bw[i] = cee_cfg->pg_bw_pct[i];
639 ets.tc_tsa[i] = IEEE_8021QAZ_TSA_ETS;
640 ets.prio_tc[i] = cee_cfg->prio_to_pg_map[i];
642 "%s: Priority group %d: tx_bw %d, rx_bw %d, prio_tc %d\n",
643 __func__, i, ets.tc_tx_bw[i], ets.tc_rx_bw[i],
647 err = mlx5e_dbcnl_validate_ets(netdev, &ets, true);
651 err = mlx5e_dcbnl_ieee_setets_core(priv, &ets);
654 "%s, Failed to set ETS: %d\n", __func__, err);
659 pfc.pfc_cap = mlx5_max_tc(mdev) + 1;
660 if (!cee_cfg->pfc_enable)
663 for (i = 0; i < CEE_DCBX_MAX_PRIO; i++)
664 pfc.pfc_en |= cee_cfg->pfc_setting[i] << i;
666 err = mlx5e_dcbnl_ieee_setpfc(netdev, &pfc);
669 "%s, Failed to set PFC: %d\n", __func__, err);
673 return err ? MLX5_DCB_NO_CHG : MLX5_DCB_CHG_RESET;
676 static u8 mlx5e_dcbnl_getstate(struct net_device *netdev)
678 return MLX5E_CEE_STATE_UP;
681 static void mlx5e_dcbnl_getpermhwaddr(struct net_device *netdev,
684 struct mlx5e_priv *priv = netdev_priv(netdev);
689 memset(perm_addr, 0xff, MAX_ADDR_LEN);
691 mlx5_query_mac_address(priv->mdev, perm_addr);
694 static void mlx5e_dcbnl_setpgtccfgtx(struct net_device *netdev,
695 int priority, u8 prio_type,
696 u8 pgid, u8 bw_pct, u8 up_map)
698 struct mlx5e_priv *priv = netdev_priv(netdev);
699 struct mlx5e_cee_config *cee_cfg = &priv->dcbx.cee_cfg;
701 if (priority >= CEE_DCBX_MAX_PRIO) {
703 "%s, priority is out of range\n", __func__);
707 if (pgid >= CEE_DCBX_MAX_PGS) {
709 "%s, priority group is out of range\n", __func__);
713 cee_cfg->prio_to_pg_map[priority] = pgid;
716 static void mlx5e_dcbnl_setpgbwgcfgtx(struct net_device *netdev,
719 struct mlx5e_priv *priv = netdev_priv(netdev);
720 struct mlx5e_cee_config *cee_cfg = &priv->dcbx.cee_cfg;
722 if (pgid >= CEE_DCBX_MAX_PGS) {
724 "%s, priority group is out of range\n", __func__);
728 cee_cfg->pg_bw_pct[pgid] = bw_pct;
731 static void mlx5e_dcbnl_getpgtccfgtx(struct net_device *netdev,
732 int priority, u8 *prio_type,
733 u8 *pgid, u8 *bw_pct, u8 *up_map)
735 struct mlx5e_priv *priv = netdev_priv(netdev);
736 struct mlx5_core_dev *mdev = priv->mdev;
738 if (!MLX5_CAP_GEN(priv->mdev, ets)) {
739 netdev_err(netdev, "%s, ets is not supported\n", __func__);
743 if (priority >= CEE_DCBX_MAX_PRIO) {
745 "%s, priority is out of range\n", __func__);
753 if (mlx5_query_port_prio_tc(mdev, priority, pgid))
757 static void mlx5e_dcbnl_getpgbwgcfgtx(struct net_device *netdev,
758 int pgid, u8 *bw_pct)
762 if (pgid >= CEE_DCBX_MAX_PGS) {
764 "%s, priority group is out of range\n", __func__);
768 mlx5e_dcbnl_ieee_getets(netdev, &ets);
769 *bw_pct = ets.tc_tx_bw[pgid];
772 static void mlx5e_dcbnl_setpfccfg(struct net_device *netdev,
773 int priority, u8 setting)
775 struct mlx5e_priv *priv = netdev_priv(netdev);
776 struct mlx5e_cee_config *cee_cfg = &priv->dcbx.cee_cfg;
778 if (priority >= CEE_DCBX_MAX_PRIO) {
780 "%s, priority is out of range\n", __func__);
787 cee_cfg->pfc_setting[priority] = setting;
791 mlx5e_dcbnl_get_priority_pfc(struct net_device *netdev,
792 int priority, u8 *setting)
797 err = mlx5e_dcbnl_ieee_getpfc(netdev, &pfc);
802 *setting = (pfc.pfc_en >> priority) & 0x01;
807 static void mlx5e_dcbnl_getpfccfg(struct net_device *netdev,
808 int priority, u8 *setting)
810 if (priority >= CEE_DCBX_MAX_PRIO) {
812 "%s, priority is out of range\n", __func__);
819 mlx5e_dcbnl_get_priority_pfc(netdev, priority, setting);
822 static u8 mlx5e_dcbnl_getcap(struct net_device *netdev,
825 struct mlx5e_priv *priv = netdev_priv(netdev);
826 struct mlx5_core_dev *mdev = priv->mdev;
830 case DCB_CAP_ATTR_PG:
833 case DCB_CAP_ATTR_PFC:
836 case DCB_CAP_ATTR_UP2TC:
839 case DCB_CAP_ATTR_PG_TCS:
840 *cap = 1 << mlx5_max_tc(mdev);
842 case DCB_CAP_ATTR_PFC_TCS:
843 *cap = 1 << mlx5_max_tc(mdev);
845 case DCB_CAP_ATTR_GSP:
848 case DCB_CAP_ATTR_BCN:
851 case DCB_CAP_ATTR_DCBX:
852 *cap = priv->dcbx.cap |
853 DCB_CAP_DCBX_VER_CEE |
854 DCB_CAP_DCBX_VER_IEEE;
865 static int mlx5e_dcbnl_getnumtcs(struct net_device *netdev,
868 struct mlx5e_priv *priv = netdev_priv(netdev);
869 struct mlx5_core_dev *mdev = priv->mdev;
872 case DCB_NUMTCS_ATTR_PG:
873 case DCB_NUMTCS_ATTR_PFC:
874 *num = mlx5_max_tc(mdev) + 1;
883 static u8 mlx5e_dcbnl_getpfcstate(struct net_device *netdev)
887 if (mlx5e_dcbnl_ieee_getpfc(netdev, &pfc))
888 return MLX5E_CEE_STATE_DOWN;
890 return pfc.pfc_en ? MLX5E_CEE_STATE_UP : MLX5E_CEE_STATE_DOWN;
893 static void mlx5e_dcbnl_setpfcstate(struct net_device *netdev, u8 state)
895 struct mlx5e_priv *priv = netdev_priv(netdev);
896 struct mlx5e_cee_config *cee_cfg = &priv->dcbx.cee_cfg;
898 if ((state != MLX5E_CEE_STATE_UP) && (state != MLX5E_CEE_STATE_DOWN))
901 cee_cfg->pfc_enable = state;
904 static int mlx5e_dcbnl_getbuffer(struct net_device *dev,
905 struct dcbnl_buffer *dcb_buffer)
907 struct mlx5e_priv *priv = netdev_priv(dev);
908 struct mlx5_core_dev *mdev = priv->mdev;
909 struct mlx5e_port_buffer port_buffer;
910 u8 buffer[MLX5E_MAX_PRIORITY];
913 if (!MLX5_BUFFER_SUPPORTED(mdev))
916 err = mlx5e_port_query_priority2buffer(mdev, buffer);
920 for (i = 0; i < MLX5E_MAX_PRIORITY; i++)
921 dcb_buffer->prio2buffer[i] = buffer[i];
923 err = mlx5e_port_query_buffer(priv, &port_buffer);
927 for (i = 0; i < MLX5E_MAX_BUFFER; i++)
928 dcb_buffer->buffer_size[i] = port_buffer.buffer[i].size;
929 dcb_buffer->total_size = port_buffer.port_buffer_size;
934 static int mlx5e_dcbnl_setbuffer(struct net_device *dev,
935 struct dcbnl_buffer *dcb_buffer)
937 struct mlx5e_priv *priv = netdev_priv(dev);
938 struct mlx5_core_dev *mdev = priv->mdev;
939 struct mlx5e_port_buffer port_buffer;
940 u8 old_prio2buffer[MLX5E_MAX_PRIORITY];
941 u32 *buffer_size = NULL;
942 u8 *prio2buffer = NULL;
946 if (!MLX5_BUFFER_SUPPORTED(mdev))
949 for (i = 0; i < DCBX_MAX_BUFFERS; i++)
950 mlx5_core_dbg(mdev, "buffer[%d]=%d\n", i, dcb_buffer->buffer_size[i]);
952 for (i = 0; i < MLX5E_MAX_PRIORITY; i++)
953 mlx5_core_dbg(mdev, "priority %d buffer%d\n", i, dcb_buffer->prio2buffer[i]);
955 err = mlx5e_port_query_priority2buffer(mdev, old_prio2buffer);
959 for (i = 0; i < MLX5E_MAX_PRIORITY; i++) {
960 if (dcb_buffer->prio2buffer[i] != old_prio2buffer[i]) {
961 changed |= MLX5E_PORT_BUFFER_PRIO2BUFFER;
962 prio2buffer = dcb_buffer->prio2buffer;
967 err = mlx5e_port_query_buffer(priv, &port_buffer);
971 for (i = 0; i < MLX5E_MAX_BUFFER; i++) {
972 if (port_buffer.buffer[i].size != dcb_buffer->buffer_size[i]) {
973 changed |= MLX5E_PORT_BUFFER_SIZE;
974 buffer_size = dcb_buffer->buffer_size;
982 priv->dcbx.manual_buffer = true;
983 err = mlx5e_port_manual_buffer_config(priv, changed, dev->mtu, NULL,
984 buffer_size, prio2buffer);
988 static const struct dcbnl_rtnl_ops mlx5e_dcbnl_ops = {
989 .ieee_getets = mlx5e_dcbnl_ieee_getets,
990 .ieee_setets = mlx5e_dcbnl_ieee_setets,
991 .ieee_getmaxrate = mlx5e_dcbnl_ieee_getmaxrate,
992 .ieee_setmaxrate = mlx5e_dcbnl_ieee_setmaxrate,
993 .ieee_getpfc = mlx5e_dcbnl_ieee_getpfc,
994 .ieee_setpfc = mlx5e_dcbnl_ieee_setpfc,
995 .ieee_setapp = mlx5e_dcbnl_ieee_setapp,
996 .ieee_delapp = mlx5e_dcbnl_ieee_delapp,
997 .getdcbx = mlx5e_dcbnl_getdcbx,
998 .setdcbx = mlx5e_dcbnl_setdcbx,
999 .dcbnl_getbuffer = mlx5e_dcbnl_getbuffer,
1000 .dcbnl_setbuffer = mlx5e_dcbnl_setbuffer,
1002 /* CEE interfaces */
1003 .setall = mlx5e_dcbnl_setall,
1004 .getstate = mlx5e_dcbnl_getstate,
1005 .getpermhwaddr = mlx5e_dcbnl_getpermhwaddr,
1007 .setpgtccfgtx = mlx5e_dcbnl_setpgtccfgtx,
1008 .setpgbwgcfgtx = mlx5e_dcbnl_setpgbwgcfgtx,
1009 .getpgtccfgtx = mlx5e_dcbnl_getpgtccfgtx,
1010 .getpgbwgcfgtx = mlx5e_dcbnl_getpgbwgcfgtx,
1012 .setpfccfg = mlx5e_dcbnl_setpfccfg,
1013 .getpfccfg = mlx5e_dcbnl_getpfccfg,
1014 .getcap = mlx5e_dcbnl_getcap,
1015 .getnumtcs = mlx5e_dcbnl_getnumtcs,
1016 .getpfcstate = mlx5e_dcbnl_getpfcstate,
1017 .setpfcstate = mlx5e_dcbnl_setpfcstate,
1020 void mlx5e_dcbnl_build_netdev(struct net_device *netdev)
1022 struct mlx5e_priv *priv = netdev_priv(netdev);
1023 struct mlx5_core_dev *mdev = priv->mdev;
1025 if (MLX5_CAP_GEN(mdev, vport_group_manager) && MLX5_CAP_GEN(mdev, qos))
1026 netdev->dcbnl_ops = &mlx5e_dcbnl_ops;
1029 void mlx5e_dcbnl_build_rep_netdev(struct net_device *netdev)
1031 struct mlx5e_priv *priv = netdev_priv(netdev);
1032 struct mlx5_core_dev *mdev = priv->mdev;
1034 if (MLX5_CAP_GEN(mdev, qos))
1035 netdev->dcbnl_ops = &mlx5e_dcbnl_ops;
1038 static void mlx5e_dcbnl_query_dcbx_mode(struct mlx5e_priv *priv,
1039 enum mlx5_dcbx_oper_mode *mode)
1041 u32 out[MLX5_ST_SZ_DW(dcbx_param)];
1043 *mode = MLX5E_DCBX_PARAM_VER_OPER_HOST;
1045 if (!mlx5_query_port_dcbx_param(priv->mdev, out))
1046 *mode = MLX5_GET(dcbx_param, out, version_oper);
1048 /* From driver's point of view, we only care if the mode
1049 * is host (HOST) or non-host (AUTO)
1051 if (*mode != MLX5E_DCBX_PARAM_VER_OPER_HOST)
1052 *mode = MLX5E_DCBX_PARAM_VER_OPER_AUTO;
1055 static void mlx5e_ets_init(struct mlx5e_priv *priv)
1057 struct ieee_ets ets;
1061 if (!MLX5_CAP_GEN(priv->mdev, ets))
1064 memset(&ets, 0, sizeof(ets));
1065 ets.ets_cap = mlx5_max_tc(priv->mdev) + 1;
1066 for (i = 0; i < ets.ets_cap; i++) {
1067 ets.tc_tx_bw[i] = MLX5E_MAX_BW_ALLOC;
1068 ets.tc_tsa[i] = IEEE_8021QAZ_TSA_VENDOR;
1072 if (ets.ets_cap > 1) {
1073 /* tclass[prio=0]=1, tclass[prio=1]=0, tclass[prio=i]=i (for i>1) */
1078 err = mlx5e_dcbnl_ieee_setets_core(priv, &ets);
1080 netdev_err(priv->netdev,
1081 "%s, Failed to init ETS: %d\n", __func__, err);
1089 static void mlx5e_dcbnl_dscp_app(struct mlx5e_priv *priv, int action)
1091 struct dcb_app temp;
1094 if (!MLX5_CAP_GEN(priv->mdev, vport_group_manager))
1097 if (!MLX5_DSCP_SUPPORTED(priv->mdev))
1100 /* No SEL_DSCP entry in non DSCP state */
1101 if (priv->dcbx_dp.trust_state != MLX5_QPTS_TRUST_DSCP)
1104 temp.selector = IEEE_8021QAZ_APP_SEL_DSCP;
1105 for (i = 0; i < MLX5E_MAX_DSCP; i++) {
1107 temp.priority = priv->dcbx_dp.dscp2prio[i];
1109 dcb_ieee_setapp(priv->netdev, &temp);
1111 dcb_ieee_delapp(priv->netdev, &temp);
1114 priv->dcbx.dscp_app_cnt = (action == INIT) ? MLX5E_MAX_DSCP : 0;
1117 void mlx5e_dcbnl_init_app(struct mlx5e_priv *priv)
1119 mlx5e_dcbnl_dscp_app(priv, INIT);
1122 void mlx5e_dcbnl_delete_app(struct mlx5e_priv *priv)
1124 mlx5e_dcbnl_dscp_app(priv, DELETE);
1127 static void mlx5e_params_calc_trust_tx_min_inline_mode(struct mlx5_core_dev *mdev,
1128 struct mlx5e_params *params,
1131 mlx5_query_min_inline(mdev, ¶ms->tx_min_inline_mode);
1132 if (trust_state == MLX5_QPTS_TRUST_DSCP &&
1133 params->tx_min_inline_mode == MLX5_INLINE_MODE_L2)
1134 params->tx_min_inline_mode = MLX5_INLINE_MODE_IP;
1137 static int mlx5e_update_trust_state_hw(struct mlx5e_priv *priv, void *context)
1139 u8 *trust_state = context;
1142 err = mlx5_set_trust_state(priv->mdev, *trust_state);
1145 WRITE_ONCE(priv->dcbx_dp.trust_state, *trust_state);
1150 static int mlx5e_set_trust_state(struct mlx5e_priv *priv, u8 trust_state)
1152 struct mlx5e_params new_params;
1156 mutex_lock(&priv->state_lock);
1158 new_params = priv->channels.params;
1159 mlx5e_params_calc_trust_tx_min_inline_mode(priv->mdev, &new_params,
1162 /* Skip if tx_min_inline is the same */
1163 if (new_params.tx_min_inline_mode == priv->channels.params.tx_min_inline_mode)
1166 err = mlx5e_safe_switch_params(priv, &new_params,
1167 mlx5e_update_trust_state_hw,
1168 &trust_state, reset);
1170 mutex_unlock(&priv->state_lock);
1175 static int mlx5e_set_dscp2prio(struct mlx5e_priv *priv, u8 dscp, u8 prio)
1179 err = mlx5_set_dscp2prio(priv->mdev, dscp, prio);
1183 priv->dcbx_dp.dscp2prio[dscp] = prio;
1187 static int mlx5e_trust_initialize(struct mlx5e_priv *priv)
1189 struct mlx5_core_dev *mdev = priv->mdev;
1193 if (!MLX5_DSCP_SUPPORTED(mdev)) {
1194 WRITE_ONCE(priv->dcbx_dp.trust_state, MLX5_QPTS_TRUST_PCP);
1198 err = mlx5_query_trust_state(priv->mdev, &trust_state);
1201 WRITE_ONCE(priv->dcbx_dp.trust_state, trust_state);
1203 mlx5e_params_calc_trust_tx_min_inline_mode(priv->mdev, &priv->channels.params,
1204 priv->dcbx_dp.trust_state);
1206 err = mlx5_query_dscp2prio(priv->mdev, priv->dcbx_dp.dscp2prio);
1213 #define MLX5E_BUFFER_CELL_SHIFT 7
1215 static u16 mlx5e_query_port_buffers_cell_size(struct mlx5e_priv *priv)
1217 struct mlx5_core_dev *mdev = priv->mdev;
1218 u32 out[MLX5_ST_SZ_DW(sbcam_reg)] = {};
1219 u32 in[MLX5_ST_SZ_DW(sbcam_reg)] = {};
1221 if (!MLX5_CAP_GEN(mdev, sbcam_reg))
1222 return (1 << MLX5E_BUFFER_CELL_SHIFT);
1224 if (mlx5_core_access_reg(mdev, in, sizeof(in), out, sizeof(out),
1225 MLX5_REG_SBCAM, 0, 0))
1226 return (1 << MLX5E_BUFFER_CELL_SHIFT);
1228 return MLX5_GET(sbcam_reg, out, cap_cell_size);
1231 void mlx5e_dcbnl_initialize(struct mlx5e_priv *priv)
1233 struct mlx5e_dcbx *dcbx = &priv->dcbx;
1235 mlx5e_trust_initialize(priv);
1237 if (!MLX5_CAP_GEN(priv->mdev, qos))
1240 if (MLX5_CAP_GEN(priv->mdev, dcbx))
1241 mlx5e_dcbnl_query_dcbx_mode(priv, &dcbx->mode);
1243 priv->dcbx.cap = DCB_CAP_DCBX_VER_CEE |
1244 DCB_CAP_DCBX_VER_IEEE;
1245 if (priv->dcbx.mode == MLX5E_DCBX_PARAM_VER_OPER_HOST)
1246 priv->dcbx.cap |= DCB_CAP_DCBX_HOST;
1248 priv->dcbx.port_buff_cell_sz = mlx5e_query_port_buffers_cell_size(priv);
1249 priv->dcbx.manual_buffer = false;
1250 priv->dcbx.cable_len = MLX5E_DEFAULT_CABLE_LEN;
1252 mlx5e_ets_init(priv);