dpdk/drivers/net/mlx5/mlx5_trigger.c
/* SPDX-License-Identifier: BSD-3-Clause
 * Copyright 2015 6WIND S.A.
 * Copyright 2015 Mellanox Technologies, Ltd
 */

#include <unistd.h>

#include <rte_ether.h>
#include <ethdev_driver.h>
#include <rte_interrupts.h>
#include <rte_alarm.h>
#include <rte_cycles.h>

#include <mlx5_malloc.h>

#include "mlx5.h"
#include "mlx5_mr.h"
#include "mlx5_rx.h"
#include "mlx5_tx.h"
#include "mlx5_utils.h"
#include "rte_pmd_mlx5.h"

/**
 * Stop traffic on Tx queues.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 */
static void
mlx5_txq_stop(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        unsigned int i;

        for (i = 0; i != priv->txqs_n; ++i)
                mlx5_txq_release(dev, i);
}

/**
 * Start traffic on Tx queues.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
static int
mlx5_txq_start(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        unsigned int i;
        int ret;

        for (i = 0; i != priv->txqs_n; ++i) {
                struct mlx5_txq_ctrl *txq_ctrl = mlx5_txq_get(dev, i);
                struct mlx5_txq_data *txq_data;
                uint32_t flags = MLX5_MEM_RTE | MLX5_MEM_ZERO;

                if (!txq_ctrl)
                        continue;
                txq_data = &txq_ctrl->txq;
                if (txq_ctrl->type == MLX5_TXQ_TYPE_STANDARD)
                        txq_alloc_elts(txq_ctrl);
                MLX5_ASSERT(!txq_ctrl->obj);
                txq_ctrl->obj = mlx5_malloc(flags, sizeof(struct mlx5_txq_obj),
                                            0, txq_ctrl->socket);
                if (!txq_ctrl->obj) {
                        DRV_LOG(ERR, "Port %u Tx queue %u cannot allocate "
                                "memory resources.", dev->data->port_id,
                                txq_data->idx);
                        rte_errno = ENOMEM;
                        goto error;
                }
                ret = priv->obj_ops.txq_obj_new(dev, i);
                if (ret < 0) {
                        mlx5_free(txq_ctrl->obj);
                        txq_ctrl->obj = NULL;
                        goto error;
                }
                if (txq_ctrl->type == MLX5_TXQ_TYPE_STANDARD) {
                        size_t size = txq_data->cqe_s * sizeof(*txq_data->fcqs);

                        txq_data->fcqs = mlx5_malloc(flags, size,
                                                     RTE_CACHE_LINE_SIZE,
                                                     txq_ctrl->socket);
                        if (!txq_data->fcqs) {
                                DRV_LOG(ERR, "Port %u Tx queue %u cannot "
                                        "allocate memory (FCQ).",
                                        dev->data->port_id, i);
                                rte_errno = ENOMEM;
                                goto error;
                        }
                }
                DRV_LOG(DEBUG, "Port %u txq %u updated with %p.",
                        dev->data->port_id, i, (void *)&txq_ctrl->obj);
                LIST_INSERT_HEAD(&priv->txqsobj, txq_ctrl->obj, next);
        }
        return 0;
error:
        ret = rte_errno; /* Save rte_errno before cleanup. */
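        /*
         * Release the reference taken by mlx5_txq_get() for the failing
         * queue (index i) first, then walk back over all the queues
         * started before it.
         */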
        do {
                mlx5_txq_release(dev, i);
        } while (i-- != 0);
        rte_errno = ret; /* Restore rte_errno. */
        return -rte_errno;
}

/**
 * Stop traffic on Rx queues.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 */
static void
mlx5_rxq_stop(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        unsigned int i;

        for (i = 0; i != priv->rxqs_n; ++i)
                mlx5_rxq_release(dev, i);
}

/**
 * Start traffic on Rx queues.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
static int
mlx5_rxq_start(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        unsigned int i;
        int ret = 0;

        /* Allocate/reuse/resize mempool for Multi-Packet RQ. */
        if (mlx5_mprq_alloc_mp(dev)) {
                /* Should not release Rx queues but return immediately. */
                return -rte_errno;
        }
        DRV_LOG(DEBUG, "Port %u device_attr.max_qp_wr is %d.",
                dev->data->port_id, priv->sh->device_attr.max_qp_wr);
        DRV_LOG(DEBUG, "Port %u device_attr.max_sge is %d.",
                dev->data->port_id, priv->sh->device_attr.max_sge);
        for (i = 0; i != priv->rxqs_n; ++i) {
                struct mlx5_rxq_ctrl *rxq_ctrl = mlx5_rxq_get(dev, i);

                if (!rxq_ctrl)
                        continue;
                if (rxq_ctrl->type == MLX5_RXQ_TYPE_STANDARD) {
                        /* Pre-register Rx mempools. */
                        if (mlx5_rxq_mprq_enabled(&rxq_ctrl->rxq)) {
                                mlx5_mr_update_mp(dev, &rxq_ctrl->rxq.mr_ctrl,
                                                  rxq_ctrl->rxq.mprq_mp);
                        } else {
                                uint32_t s;

                                for (s = 0; s < rxq_ctrl->rxq.rxseg_n; s++)
                                        mlx5_mr_update_mp
                                                (dev, &rxq_ctrl->rxq.mr_ctrl,
                                                rxq_ctrl->rxq.rxseg[s].mp);
                        }
                        ret = rxq_alloc_elts(rxq_ctrl);
                        if (ret)
                                goto error;
                }
                MLX5_ASSERT(!rxq_ctrl->obj);
                rxq_ctrl->obj = mlx5_malloc(MLX5_MEM_RTE | MLX5_MEM_ZERO,
                                            sizeof(*rxq_ctrl->obj), 0,
                                            rxq_ctrl->socket);
                if (!rxq_ctrl->obj) {
                        DRV_LOG(ERR,
                                "Port %u Rx queue %u can't allocate resources.",
                                dev->data->port_id, (*priv->rxqs)[i]->idx);
                        rte_errno = ENOMEM;
                        goto error;
                }
                ret = priv->obj_ops.rxq_obj_new(dev, i);
                if (ret) {
                        mlx5_free(rxq_ctrl->obj);
                        rxq_ctrl->obj = NULL;
                        goto error;
                }
                DRV_LOG(DEBUG, "Port %u rxq %u updated with %p.",
                        dev->data->port_id, i, (void *)&rxq_ctrl->obj);
                LIST_INSERT_HEAD(&priv->rxqsobj, rxq_ctrl->obj, next);
        }
        return 0;
error:
        ret = rte_errno; /* Save rte_errno before cleanup. */
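        /* Walk back from the failing queue, dropping the references. */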
        do {
                mlx5_rxq_release(dev, i);
        } while (i-- != 0);
        rte_errno = ret; /* Restore rte_errno. */
        return -rte_errno;
}

/**
 * Binds Tx queues to their target Rx queues for hairpin auto binding.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
static int
mlx5_hairpin_auto_bind(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_devx_modify_sq_attr sq_attr = { 0 };
        struct mlx5_devx_modify_rq_attr rq_attr = { 0 };
        struct mlx5_txq_ctrl *txq_ctrl;
        struct mlx5_rxq_ctrl *rxq_ctrl;
        struct mlx5_devx_obj *sq;
        struct mlx5_devx_obj *rq;
        unsigned int i;
        int ret = 0;
        bool need_auto = false;
        uint16_t self_port = dev->data->port_id;

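        /*
         * First pass: scan the Tx queues. If any hairpin queue peering with
         * this same port uses manual bind, skip auto binding entirely;
         * otherwise remember whether any queue actually needs it.
         */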
        for (i = 0; i != priv->txqs_n; ++i) {
                txq_ctrl = mlx5_txq_get(dev, i);
                if (!txq_ctrl)
                        continue;
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN ||
                    txq_ctrl->hairpin_conf.peers[0].port != self_port) {
                        mlx5_txq_release(dev, i);
                        continue;
                }
                if (txq_ctrl->hairpin_conf.manual_bind) {
                        mlx5_txq_release(dev, i);
                        return 0;
                }
                need_auto = true;
                mlx5_txq_release(dev, i);
        }
        if (!need_auto)
                return 0;
        for (i = 0; i != priv->txqs_n; ++i) {
                txq_ctrl = mlx5_txq_get(dev, i);
                if (!txq_ctrl)
                        continue;
                /* Skip hairpin queues with other peer ports. */
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN ||
                    txq_ctrl->hairpin_conf.peers[0].port != self_port) {
                        mlx5_txq_release(dev, i);
                        continue;
                }
                if (!txq_ctrl->obj) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u no txq object found: %d",
                                dev->data->port_id, i);
                        mlx5_txq_release(dev, i);
                        return -rte_errno;
                }
                sq = txq_ctrl->obj->sq;
                rxq_ctrl = mlx5_rxq_get(dev,
                                        txq_ctrl->hairpin_conf.peers[0].queue);
                if (!rxq_ctrl) {
                        mlx5_txq_release(dev, i);
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u no rxq object found: %d",
                                dev->data->port_id,
                                txq_ctrl->hairpin_conf.peers[0].queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->type != MLX5_RXQ_TYPE_HAIRPIN ||
                    rxq_ctrl->hairpin_conf.peers[0].queue != i) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u Tx queue %d cannot be bound to "
                                "Rx queue %d", dev->data->port_id,
                                i, txq_ctrl->hairpin_conf.peers[0].queue);
                        goto error;
                }
                rq = rxq_ctrl->obj->rq;
                if (!rq) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u hairpin no matching rxq: %d",
                                dev->data->port_id,
                                txq_ctrl->hairpin_conf.peers[0].queue);
                        goto error;
                }
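                /* Move the SQ and RQ from RST to RDY, exchanging peer IDs. */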
                sq_attr.state = MLX5_SQC_STATE_RDY;
                sq_attr.sq_state = MLX5_SQC_STATE_RST;
                sq_attr.hairpin_peer_rq = rq->id;
                sq_attr.hairpin_peer_vhca = priv->config.hca_attr.vhca_id;
                ret = mlx5_devx_cmd_modify_sq(sq, &sq_attr);
                if (ret)
                        goto error;
                rq_attr.state = MLX5_SQC_STATE_RDY;
                rq_attr.rq_state = MLX5_SQC_STATE_RST;
                rq_attr.hairpin_peer_sq = sq->id;
                rq_attr.hairpin_peer_vhca = priv->config.hca_attr.vhca_id;
                ret = mlx5_devx_cmd_modify_rq(rq, &rq_attr);
                if (ret)
                        goto error;
                /* Queues bound automatically will be destroyed directly. */
                rxq_ctrl->hairpin_status = 1;
                txq_ctrl->hairpin_status = 1;
                mlx5_txq_release(dev, i);
                mlx5_rxq_release(dev, txq_ctrl->hairpin_conf.peers[0].queue);
        }
        return 0;
error:
        mlx5_txq_release(dev, i);
        mlx5_rxq_release(dev, txq_ctrl->hairpin_conf.peers[0].queue);
        return -rte_errno;
}

/*
 * Fetch the peer queue's SW & HW information.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 * @param peer_queue
 *   Index of the queue to fetch the information from.
 * @param current_info
 *   Pointer to the input peer information, not used currently.
 * @param peer_info
 *   Pointer to the structure to store the information, output.
 * @param direction
 *   Positive to get the RxQ information, zero to get the TxQ information.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
int
mlx5_hairpin_queue_peer_update(struct rte_eth_dev *dev, uint16_t peer_queue,
                               struct rte_hairpin_peer_info *current_info,
                               struct rte_hairpin_peer_info *peer_info,
                               uint32_t direction)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        RTE_SET_USED(current_info);

        if (dev->data->dev_started == 0) {
                rte_errno = EBUSY;
                DRV_LOG(ERR, "peer port %u is not started",
                        dev->data->port_id);
                return -rte_errno;
        }
        /*
         * The peer port (this device) is used as egress. In the current
         * design, the hairpin Tx queue will be bound to the peer Rx queue,
         * so only the Tx queue information needs to be fetched here.
         */
        if (direction == 0) {
                struct mlx5_txq_ctrl *txq_ctrl;

                txq_ctrl = mlx5_txq_get(dev, peer_queue);
                if (txq_ctrl == NULL) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "Failed to get port %u Tx queue %d",
                                dev->data->port_id, peer_queue);
                        return -rte_errno;
                }
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u queue %d is not a hairpin Txq",
                                dev->data->port_id, peer_queue);
                        mlx5_txq_release(dev, peer_queue);
                        return -rte_errno;
                }
                if (txq_ctrl->obj == NULL || txq_ctrl->obj->sq == NULL) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u no Txq object found: %d",
                                dev->data->port_id, peer_queue);
                        mlx5_txq_release(dev, peer_queue);
                        return -rte_errno;
                }
                peer_info->qp_id = txq_ctrl->obj->sq->id;
                peer_info->vhca_id = priv->config.hca_attr.vhca_id;
                /* 1-to-1 mapping, only the first one is used. */
                peer_info->peer_q = txq_ctrl->hairpin_conf.peers[0].queue;
                peer_info->tx_explicit = txq_ctrl->hairpin_conf.tx_explicit;
                peer_info->manual_bind = txq_ctrl->hairpin_conf.manual_bind;
                mlx5_txq_release(dev, peer_queue);
        } else { /* Peer port used as ingress. */
                struct mlx5_rxq_ctrl *rxq_ctrl;

                rxq_ctrl = mlx5_rxq_get(dev, peer_queue);
                if (rxq_ctrl == NULL) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "Failed to get port %u Rx queue %d",
                                dev->data->port_id, peer_queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->type != MLX5_RXQ_TYPE_HAIRPIN) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u queue %d is not a hairpin Rxq",
                                dev->data->port_id, peer_queue);
                        mlx5_rxq_release(dev, peer_queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->obj == NULL || rxq_ctrl->obj->rq == NULL) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u no Rxq object found: %d",
                                dev->data->port_id, peer_queue);
                        mlx5_rxq_release(dev, peer_queue);
                        return -rte_errno;
                }
                peer_info->qp_id = rxq_ctrl->obj->rq->id;
                peer_info->vhca_id = priv->config.hca_attr.vhca_id;
                peer_info->peer_q = rxq_ctrl->hairpin_conf.peers[0].queue;
                peer_info->tx_explicit = rxq_ctrl->hairpin_conf.tx_explicit;
                peer_info->manual_bind = rxq_ctrl->hairpin_conf.manual_bind;
                mlx5_rxq_release(dev, peer_queue);
        }
        return 0;
}

/*
 * Bind the hairpin queue with the peer HW information.
 * This needs to be called twice, once for the Tx queue and once for the Rx
 * queue of a pair. If the queue is already bound, it is considered successful.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 * @param cur_queue
 *   Index of the queue to change the HW configuration to bind.
 * @param peer_info
 *   Pointer to information of the peer queue.
 * @param direction
 *   Positive to configure the TxQ, zero to configure the RxQ.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
int
mlx5_hairpin_queue_peer_bind(struct rte_eth_dev *dev, uint16_t cur_queue,
                             struct rte_hairpin_peer_info *peer_info,
                             uint32_t direction)
{
        int ret = 0;

        /*
         * Consistency check of the peer queue: the opposite direction was
         * used when fetching the peer queue info by ethdev port ID, so no
         * extra check of the peer port is needed here.
         */
        if (peer_info->peer_q != cur_queue) {
                rte_errno = EINVAL;
                DRV_LOG(ERR, "port %u queue %d and peer queue %d mismatch",
                        dev->data->port_id, cur_queue, peer_info->peer_q);
                return -rte_errno;
        }
        if (direction != 0) {
                struct mlx5_txq_ctrl *txq_ctrl;
                struct mlx5_devx_modify_sq_attr sq_attr = { 0 };

                txq_ctrl = mlx5_txq_get(dev, cur_queue);
                if (txq_ctrl == NULL) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "Failed to get port %u Tx queue %d",
                                dev->data->port_id, cur_queue);
                        return -rte_errno;
                }
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u queue %d not a hairpin Txq",
                                dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return -rte_errno;
                }
                if (txq_ctrl->obj == NULL || txq_ctrl->obj->sq == NULL) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u no Txq object found: %d",
                                dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return -rte_errno;
                }
                if (txq_ctrl->hairpin_status != 0) {
                        DRV_LOG(DEBUG, "port %u Tx queue %d is already bound",
                                dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return 0;
                }
                /*
                 * Consistency checking of all the queues of one port is done
                 * in the bind() function, and that check is optional.
                 */
                if (peer_info->tx_explicit !=
                    txq_ctrl->hairpin_conf.tx_explicit) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u Tx queue %d and peer Tx rule mode"
                                " mismatch", dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return -rte_errno;
                }
                if (peer_info->manual_bind !=
                    txq_ctrl->hairpin_conf.manual_bind) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u Tx queue %d and peer binding mode"
                                " mismatch", dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return -rte_errno;
                }
                sq_attr.state = MLX5_SQC_STATE_RDY;
                sq_attr.sq_state = MLX5_SQC_STATE_RST;
                sq_attr.hairpin_peer_rq = peer_info->qp_id;
                sq_attr.hairpin_peer_vhca = peer_info->vhca_id;
                ret = mlx5_devx_cmd_modify_sq(txq_ctrl->obj->sq, &sq_attr);
                if (ret == 0)
                        txq_ctrl->hairpin_status = 1;
                mlx5_txq_release(dev, cur_queue);
        } else {
                struct mlx5_rxq_ctrl *rxq_ctrl;
                struct mlx5_devx_modify_rq_attr rq_attr = { 0 };

                rxq_ctrl = mlx5_rxq_get(dev, cur_queue);
                if (rxq_ctrl == NULL) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "Failed to get port %u Rx queue %d",
                                dev->data->port_id, cur_queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->type != MLX5_RXQ_TYPE_HAIRPIN) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u queue %d not a hairpin Rxq",
                                dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->obj == NULL || rxq_ctrl->obj->rq == NULL) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u no Rxq object found: %d",
                                dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->hairpin_status != 0) {
                        DRV_LOG(DEBUG, "port %u Rx queue %d is already bound",
                                dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return 0;
                }
                if (peer_info->tx_explicit !=
                    rxq_ctrl->hairpin_conf.tx_explicit) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u Rx queue %d and peer Tx rule mode"
                                " mismatch", dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return -rte_errno;
                }
                if (peer_info->manual_bind !=
                    rxq_ctrl->hairpin_conf.manual_bind) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u Rx queue %d and peer binding mode"
                                " mismatch", dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return -rte_errno;
                }
                rq_attr.state = MLX5_SQC_STATE_RDY;
                rq_attr.rq_state = MLX5_SQC_STATE_RST;
                rq_attr.hairpin_peer_sq = peer_info->qp_id;
                rq_attr.hairpin_peer_vhca = peer_info->vhca_id;
                ret = mlx5_devx_cmd_modify_rq(rxq_ctrl->obj->rq, &rq_attr);
                if (ret == 0)
                        rxq_ctrl->hairpin_status = 1;
                mlx5_rxq_release(dev, cur_queue);
        }
        return ret;
}
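
/*
 * A full pair binding consists of two calls to the function above, one per
 * side. A minimal sketch (assuming both queues belong to started mlx5 ports):
 *
 *   mlx5_hairpin_queue_peer_bind(rx_dev, rx_queue, &txq_info, 0);
 *   mlx5_hairpin_queue_peer_bind(tx_dev, tx_queue, &rxq_info, 1);
 *
 * In practice this is driven through the rte_eth_hairpin_queue_peer_bind()
 * wrapper, see mlx5_hairpin_bind_single_port() below.
 */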

/*
 * Unbind the hairpin queue and reset its HW configuration.
 * This needs to be called twice, once for the Tx queue and once for the Rx
 * queue of a pair. If the queue is already unbound, it is considered
 * successful.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 * @param cur_queue
 *   Index of the queue to change the HW configuration to unbind.
 * @param direction
 *   Positive to reset the TxQ, zero to reset the RxQ.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
int
mlx5_hairpin_queue_peer_unbind(struct rte_eth_dev *dev, uint16_t cur_queue,
                               uint32_t direction)
{
        int ret = 0;

        if (direction != 0) {
                struct mlx5_txq_ctrl *txq_ctrl;
                struct mlx5_devx_modify_sq_attr sq_attr = { 0 };

                txq_ctrl = mlx5_txq_get(dev, cur_queue);
                if (txq_ctrl == NULL) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "Failed to get port %u Tx queue %d",
                                dev->data->port_id, cur_queue);
                        return -rte_errno;
                }
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u queue %d not a hairpin Txq",
                                dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return -rte_errno;
                }
                /* Already unbound, return success before obj checking. */
                if (txq_ctrl->hairpin_status == 0) {
                        DRV_LOG(DEBUG, "port %u Tx queue %d is already unbound",
                                dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return 0;
                }
                if (!txq_ctrl->obj || !txq_ctrl->obj->sq) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u no Txq object found: %d",
                                dev->data->port_id, cur_queue);
                        mlx5_txq_release(dev, cur_queue);
                        return -rte_errno;
                }
                sq_attr.state = MLX5_SQC_STATE_RST;
                sq_attr.sq_state = MLX5_SQC_STATE_RST;
                ret = mlx5_devx_cmd_modify_sq(txq_ctrl->obj->sq, &sq_attr);
                if (ret == 0)
                        txq_ctrl->hairpin_status = 0;
                mlx5_txq_release(dev, cur_queue);
        } else {
                struct mlx5_rxq_ctrl *rxq_ctrl;
                struct mlx5_devx_modify_rq_attr rq_attr = { 0 };

                rxq_ctrl = mlx5_rxq_get(dev, cur_queue);
                if (rxq_ctrl == NULL) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "Failed to get port %u Rx queue %d",
                                dev->data->port_id, cur_queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->type != MLX5_RXQ_TYPE_HAIRPIN) {
                        rte_errno = EINVAL;
                        DRV_LOG(ERR, "port %u queue %d not a hairpin Rxq",
                                dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return -rte_errno;
                }
                if (rxq_ctrl->hairpin_status == 0) {
                        DRV_LOG(DEBUG, "port %u Rx queue %d is already unbound",
                                dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return 0;
                }
                if (rxq_ctrl->obj == NULL || rxq_ctrl->obj->rq == NULL) {
                        rte_errno = ENOMEM;
                        DRV_LOG(ERR, "port %u no Rxq object found: %d",
                                dev->data->port_id, cur_queue);
                        mlx5_rxq_release(dev, cur_queue);
                        return -rte_errno;
                }
                rq_attr.state = MLX5_SQC_STATE_RST;
                rq_attr.rq_state = MLX5_SQC_STATE_RST;
                ret = mlx5_devx_cmd_modify_rq(rxq_ctrl->obj->rq, &rq_attr);
                if (ret == 0)
                        rxq_ctrl->hairpin_status = 0;
                mlx5_rxq_release(dev, cur_queue);
        }
        return ret;
}

/*
 * Bind the hairpin port pairs, from the Tx to the peer Rx.
 * This function only supports binding the Tx side to one Rx port.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 * @param rx_port
 *   Port identifier of the Rx port.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
static int
mlx5_hairpin_bind_single_port(struct rte_eth_dev *dev, uint16_t rx_port)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        int ret = 0;
        struct mlx5_txq_ctrl *txq_ctrl;
        uint32_t i;
        struct rte_hairpin_peer_info peer = {0xffffff};
        struct rte_hairpin_peer_info cur;
        const struct rte_eth_hairpin_conf *conf;
        uint16_t num_q = 0;
        uint16_t local_port = priv->dev_data->port_id;
        uint32_t manual;
        uint32_t explicit;
        uint16_t rx_queue;

        if (mlx5_eth_find_next(rx_port, dev->device) != rx_port) {
                rte_errno = ENODEV;
                DRV_LOG(ERR, "Rx port %u does not belong to mlx5", rx_port);
                return -rte_errno;
        }
        /*
         * Before binding TxQ to the peer RxQ, a first pass checks the
         * configuration consistency of all the queues. This is a little
         * time consuming, but better than having to roll back.
         */
        for (i = 0; i != priv->txqs_n; i++) {
                txq_ctrl = mlx5_txq_get(dev, i);
                if (txq_ctrl == NULL)
                        continue;
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
                        mlx5_txq_release(dev, i);
                        continue;
                }
                /*
                 * All hairpin Tx queues of a single port connected to the
                 * same peer Rx port should have the same "auto binding" and
                 * "implicit Tx flow" modes.
                 * Peer consistency checking will be done in per queue binding.
                 */
                conf = &txq_ctrl->hairpin_conf;
                if (conf->peers[0].port == rx_port) {
                        if (num_q == 0) {
                                manual = conf->manual_bind;
                                explicit = conf->tx_explicit;
                        } else {
                                if (manual != conf->manual_bind ||
                                    explicit != conf->tx_explicit) {
                                        rte_errno = EINVAL;
                                        DRV_LOG(ERR, "port %u queue %d mode"
                                                " mismatch: %u %u, %u %u",
                                                local_port, i, manual,
                                                conf->manual_bind, explicit,
                                                conf->tx_explicit);
                                        mlx5_txq_release(dev, i);
                                        return -rte_errno;
                                }
                        }
                        num_q++;
                }
                mlx5_txq_release(dev, i);
        }
        /* If no queue is configured, return success directly. */
        if (num_q == 0)
                return ret;
        /* All the hairpin Tx queues need to be traversed again. */
        for (i = 0; i != priv->txqs_n; i++) {
                txq_ctrl = mlx5_txq_get(dev, i);
                if (txq_ctrl == NULL)
                        continue;
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
                        mlx5_txq_release(dev, i);
                        continue;
                }
                if (txq_ctrl->hairpin_conf.peers[0].port != rx_port) {
                        mlx5_txq_release(dev, i);
                        continue;
                }
                rx_queue = txq_ctrl->hairpin_conf.peers[0].queue;
                /*
                 * Fetch peer RxQ's information.
                 * No need to pass the information of the current queue.
                 */
                ret = rte_eth_hairpin_queue_peer_update(rx_port, rx_queue,
                                                        NULL, &peer, 1);
                if (ret != 0) {
                        mlx5_txq_release(dev, i);
                        goto error;
                }
                /* Accessing its own device, inside mlx5 PMD. */
                ret = mlx5_hairpin_queue_peer_bind(dev, i, &peer, 1);
                if (ret != 0) {
                        mlx5_txq_release(dev, i);
                        goto error;
                }
                /* Pass TxQ's information to peer RxQ and try binding. */
                cur.peer_q = rx_queue;
                cur.qp_id = txq_ctrl->obj->sq->id;
                cur.vhca_id = priv->config.hca_attr.vhca_id;
                cur.tx_explicit = txq_ctrl->hairpin_conf.tx_explicit;
                cur.manual_bind = txq_ctrl->hairpin_conf.manual_bind;
                /*
                 * In order to access another device in a proper way, an RTE
                 * level private function is needed.
                 */
                ret = rte_eth_hairpin_queue_peer_bind(rx_port, rx_queue,
                                                      &cur, 0);
                if (ret != 0) {
                        mlx5_txq_release(dev, i);
                        goto error;
                }
                mlx5_txq_release(dev, i);
        }
        return 0;
error:
        /*
         * Roll back the queues already bound. There is no need to check
         * the return value of the queue unbind function.
         */
        do {
                /* No validation is needed here. */
                txq_ctrl = mlx5_txq_get(dev, i);
                if (txq_ctrl == NULL)
                        continue;
                rx_queue = txq_ctrl->hairpin_conf.peers[0].queue;
                rte_eth_hairpin_queue_peer_unbind(rx_port, rx_queue, 0);
                mlx5_hairpin_queue_peer_unbind(dev, i, 1);
                mlx5_txq_release(dev, i);
        } while (i--);
        return ret;
}

/*
 * Unbind the hairpin port pair. The HW configuration of both devices will be
 * cleared and the status reset for all the queues used between them.
 * This function only supports unbinding the Tx side from one Rx port.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 * @param rx_port
 *   Port identifier of the Rx port.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
static int
mlx5_hairpin_unbind_single_port(struct rte_eth_dev *dev, uint16_t rx_port)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_txq_ctrl *txq_ctrl;
        uint32_t i;
        int ret;
        uint16_t cur_port = priv->dev_data->port_id;

        if (mlx5_eth_find_next(rx_port, dev->device) != rx_port) {
                rte_errno = ENODEV;
                DRV_LOG(ERR, "Rx port %u does not belong to mlx5", rx_port);
                return -rte_errno;
        }
        for (i = 0; i != priv->txqs_n; i++) {
                uint16_t rx_queue;

                txq_ctrl = mlx5_txq_get(dev, i);
                if (txq_ctrl == NULL)
                        continue;
                if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
                        mlx5_txq_release(dev, i);
                        continue;
                }
                if (txq_ctrl->hairpin_conf.peers[0].port != rx_port) {
                        mlx5_txq_release(dev, i);
                        continue;
                }
                /* Indeed, only the first used queue needs to be checked. */
                if (txq_ctrl->hairpin_conf.manual_bind == 0) {
                        if (cur_port != rx_port) {
                                rte_errno = EINVAL;
                                DRV_LOG(ERR, "port %u and port %u are in"
                                        " auto-bind mode", cur_port, rx_port);
                                mlx5_txq_release(dev, i);
                                return -rte_errno;
                        } else {
                                return 0;
                        }
                }
                rx_queue = txq_ctrl->hairpin_conf.peers[0].queue;
                mlx5_txq_release(dev, i);
                ret = rte_eth_hairpin_queue_peer_unbind(rx_port, rx_queue, 0);
                if (ret) {
                        DRV_LOG(ERR, "port %u Rx queue %d unbind - failure",
                                rx_port, rx_queue);
                        return ret;
                }
                ret = mlx5_hairpin_queue_peer_unbind(dev, i, 1);
                if (ret) {
                        DRV_LOG(ERR, "port %u Tx queue %d unbind - failure",
                                cur_port, i);
                        return ret;
                }
        }
        return 0;
}

/*
 * Bind hairpin ports; Rx can be all ports when RTE_MAX_ETHPORTS is used.
 * @see mlx5_hairpin_bind_single_port()
 */
int
mlx5_hairpin_bind(struct rte_eth_dev *dev, uint16_t rx_port)
{
        int ret = 0;
        uint16_t p, pp;

        /*
         * If the Rx port has no hairpin configuration with the current port,
         * the binding will be skipped in the single port bind function.
         * The device started status will be checked only right before the
         * queue information is updated.
         */
        if (rx_port == RTE_MAX_ETHPORTS) {
                MLX5_ETH_FOREACH_DEV(p, dev->device) {
                        ret = mlx5_hairpin_bind_single_port(dev, p);
                        if (ret != 0)
                                goto unbind;
                }
                return ret;
        } else {
                return mlx5_hairpin_bind_single_port(dev, rx_port);
        }
unbind:
        MLX5_ETH_FOREACH_DEV(pp, dev->device)
                if (pp < p)
                        mlx5_hairpin_unbind_single_port(dev, pp);
        return ret;
}

/*
 * Unbind hairpin ports; Rx can be all ports when RTE_MAX_ETHPORTS is used.
 * @see mlx5_hairpin_unbind_single_port()
 */
int
mlx5_hairpin_unbind(struct rte_eth_dev *dev, uint16_t rx_port)
{
        int ret = 0;
        uint16_t p;

        if (rx_port == RTE_MAX_ETHPORTS)
                MLX5_ETH_FOREACH_DEV(p, dev->device) {
                        ret = mlx5_hairpin_unbind_single_port(dev, p);
                        if (ret != 0)
                                return ret;
                }
        else
                ret = mlx5_hairpin_unbind_single_port(dev, rx_port);
        return ret;
}

/*
 * DPDK callback to get the hairpin peer ports list.
 * This will return the actual number of peer ports and save the identifiers
 * into the array (sorted; the order may differ from the one used when
 * setting up the hairpin peer queues).
 * The peer port ID could be the same as the port ID of the current device.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 * @param peer_ports
 *   Pointer to array to save the port identifiers.
 * @param len
 *   The length of the array.
 * @param direction
 *   Current port to peer port direction.
 *   positive - current used as Tx to get all peer Rx ports.
 *   zero - current used as Rx to get all peer Tx ports.
 *
 * @return
 *   0 or positive value on success, actual number of peer ports.
 *   a negative errno value otherwise and rte_errno is set.
 */
int
mlx5_hairpin_get_peer_ports(struct rte_eth_dev *dev, uint16_t *peer_ports,
                            size_t len, uint32_t direction)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_txq_ctrl *txq_ctrl;
        struct mlx5_rxq_ctrl *rxq_ctrl;
        uint32_t i;
        uint16_t pp;
        uint32_t bits[(RTE_MAX_ETHPORTS + 31) / 32] = {0};
        int ret = 0;

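        /* Mark each peer port in a bitmap: one bit per possible port ID. */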
        if (direction) {
                for (i = 0; i < priv->txqs_n; i++) {
                        txq_ctrl = mlx5_txq_get(dev, i);
                        if (!txq_ctrl)
                                continue;
                        if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
                                mlx5_txq_release(dev, i);
                                continue;
                        }
                        pp = txq_ctrl->hairpin_conf.peers[0].port;
                        if (pp >= RTE_MAX_ETHPORTS) {
                                rte_errno = ERANGE;
                                mlx5_txq_release(dev, i);
                                DRV_LOG(ERR, "port %hu queue %u peer port "
                                        "out of range %hu",
                                        priv->dev_data->port_id, i, pp);
                                return -rte_errno;
                        }
                        bits[pp / 32] |= 1u << (pp % 32);
                        mlx5_txq_release(dev, i);
                }
        } else {
                for (i = 0; i < priv->rxqs_n; i++) {
                        rxq_ctrl = mlx5_rxq_get(dev, i);
                        if (!rxq_ctrl)
                                continue;
                        if (rxq_ctrl->type != MLX5_RXQ_TYPE_HAIRPIN) {
                                mlx5_rxq_release(dev, i);
                                continue;
                        }
                        pp = rxq_ctrl->hairpin_conf.peers[0].port;
                        if (pp >= RTE_MAX_ETHPORTS) {
                                rte_errno = ERANGE;
                                mlx5_rxq_release(dev, i);
                                DRV_LOG(ERR, "port %hu queue %u peer port "
                                        "out of range %hu",
                                        priv->dev_data->port_id, i, pp);
                                return -rte_errno;
                        }
                        bits[pp / 32] |= 1u << (pp % 32);
                        mlx5_rxq_release(dev, i);
                }
        }
        for (i = 0; i < RTE_MAX_ETHPORTS; i++) {
                if (bits[i / 32] & (1u << (i % 32))) {
                        if ((size_t)ret >= len) {
                                rte_errno = E2BIG;
                                return -rte_errno;
                        }
                        peer_ports[ret++] = i;
                }
        }
        return ret;
}

/**
 * DPDK callback to start the device.
 *
 * Simulate device start by attaching all configured flows.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
int
mlx5_dev_start(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        int ret;
        int fine_inline;

        DRV_LOG(DEBUG, "port %u starting device", dev->data->port_id);
        fine_inline = rte_mbuf_dynflag_lookup
                (RTE_PMD_MLX5_FINE_GRANULARITY_INLINE, NULL);
        if (fine_inline >= 0)
                rte_net_mlx5_dynf_inline_mask = 1UL << fine_inline;
        else
                rte_net_mlx5_dynf_inline_mask = 0;
        if (dev->data->nb_rx_queues > 0) {
                ret = mlx5_dev_configure_rss_reta(dev);
                if (ret) {
                        DRV_LOG(ERR, "port %u reta config failed: %s",
                                dev->data->port_id, strerror(rte_errno));
                        return -rte_errno;
                }
        }
        ret = mlx5_txpp_start(dev);
        if (ret) {
                DRV_LOG(ERR, "port %u Tx packet pacing init failed: %s",
                        dev->data->port_id, strerror(rte_errno));
                goto error;
        }
        if ((priv->config.devx && priv->config.dv_flow_en &&
            priv->config.dest_tir) && priv->obj_ops.lb_dummy_queue_create) {
                ret = priv->obj_ops.lb_dummy_queue_create(dev);
                if (ret)
                        goto error;
        }
        ret = mlx5_txq_start(dev);
        if (ret) {
                DRV_LOG(ERR, "port %u Tx queue allocation failed: %s",
                        dev->data->port_id, strerror(rte_errno));
                goto error;
        }
        ret = mlx5_rxq_start(dev);
        if (ret) {
                DRV_LOG(ERR, "port %u Rx queue allocation failed: %s",
                        dev->data->port_id, strerror(rte_errno));
                goto error;
        }
        /*
         * This step is skipped if there is no hairpin Tx queue configured
         * with an Rx peer queue from the same device.
         */
        ret = mlx5_hairpin_auto_bind(dev);
        if (ret) {
                DRV_LOG(ERR, "port %u hairpin auto binding failed: %s",
                        dev->data->port_id, strerror(rte_errno));
                goto error;
        }
        /* Set started flag here for the following steps like control flow. */
        dev->data->dev_started = 1;
        ret = mlx5_rx_intr_vec_enable(dev);
        if (ret) {
                DRV_LOG(ERR, "port %u Rx interrupt vector creation failed",
                        dev->data->port_id);
                goto error;
        }
        mlx5_os_stats_init(dev);
        ret = mlx5_traffic_enable(dev);
        if (ret) {
                DRV_LOG(ERR, "port %u failed to set default flows",
                        dev->data->port_id);
                goto error;
        }
        /* Set a mask and offset of dynamic metadata flows into Rx queues. */
        mlx5_flow_rxq_dynf_metadata_set(dev);
        /* Set flags and context to convert Rx timestamps. */
        mlx5_rxq_timestamp_set(dev);
        /* Set a mask and offset of scheduling on timestamp into Tx queues. */
        mlx5_txq_dynf_timestamp_set(dev);
        /*
         * In non-cached mode, only the default mreg copy action needs to be
         * started, since no flow created by an application exists anymore.
         * Still, it is worth wrapping the interface for further usage.
         */
        ret = mlx5_flow_start_default(dev);
        if (ret) {
                DRV_LOG(DEBUG, "port %u failed to start default actions: %s",
                        dev->data->port_id, strerror(rte_errno));
                goto error;
        }
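        /*
         * Make sure the queue and flow states written above are globally
         * visible before the datapath burst functions are exposed.
         */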
        rte_wmb();
        dev->tx_pkt_burst = mlx5_select_tx_function(dev);
        dev->rx_pkt_burst = mlx5_select_rx_function(dev);
        /* Enable datapath on secondary process. */
        mlx5_mp_os_req_start_rxtx(dev);
        if (priv->sh->intr_handle.fd >= 0) {
                priv->sh->port[priv->dev_port - 1].ih_port_id =
                                        (uint32_t)dev->data->port_id;
        } else {
                DRV_LOG(INFO, "port %u starts without LSC and RMV interrupts.",
                        dev->data->port_id);
                dev->data->dev_conf.intr_conf.lsc = 0;
                dev->data->dev_conf.intr_conf.rmv = 0;
        }
        if (priv->sh->intr_handle_devx.fd >= 0)
                priv->sh->port[priv->dev_port - 1].devx_ih_port_id =
                                        (uint32_t)dev->data->port_id;
        return 0;
error:
        ret = rte_errno; /* Save rte_errno before cleanup. */
        /* Rollback. */
        dev->data->dev_started = 0;
        mlx5_flow_stop_default(dev);
        mlx5_traffic_disable(dev);
        mlx5_txq_stop(dev);
        mlx5_rxq_stop(dev);
        if (priv->obj_ops.lb_dummy_queue_release)
                priv->obj_ops.lb_dummy_queue_release(dev);
        mlx5_txpp_stop(dev); /* Stop last. */
        rte_errno = ret; /* Restore rte_errno. */
        return -rte_errno;
}

/**
 * DPDK callback to stop the device.
 *
 * Simulate device stop by detaching all configured flows.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 */
int
mlx5_dev_stop(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;

        dev->data->dev_started = 0;
        /* Prevent crashes when queues are still in use. */
        dev->rx_pkt_burst = removed_rx_burst;
        dev->tx_pkt_burst = removed_tx_burst;
        rte_wmb();
        /* Disable datapath on secondary process. */
        mlx5_mp_os_req_stop_rxtx(dev);
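        /*
         * Give in-flight Rx/Tx bursts time to drain before the queues are
         * destroyed (roughly one millisecond per Rx queue).
         */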
        rte_delay_us_sleep(1000 * priv->rxqs_n);
        DRV_LOG(DEBUG, "port %u stopping device", dev->data->port_id);
        mlx5_flow_stop_default(dev);
        /* Control flows for default traffic can be removed first. */
        mlx5_traffic_disable(dev);
        /* All Rx queue flags will be cleared in the flush interface. */
        mlx5_flow_list_flush(dev, MLX5_FLOW_TYPE_GEN, true);
        mlx5_flow_meter_rxq_flush(dev);
        mlx5_rx_intr_vec_disable(dev);
        priv->sh->port[priv->dev_port - 1].ih_port_id = RTE_MAX_ETHPORTS;
        priv->sh->port[priv->dev_port - 1].devx_ih_port_id = RTE_MAX_ETHPORTS;
        mlx5_txq_stop(dev);
        mlx5_rxq_stop(dev);
        if (priv->obj_ops.lb_dummy_queue_release)
                priv->obj_ops.lb_dummy_queue_release(dev);
        mlx5_txpp_stop(dev);

        return 0;
}

/**
 * Enable traffic flows configured by control plane.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
int
mlx5_traffic_enable(struct rte_eth_dev *dev)
{
        struct mlx5_priv *priv = dev->data->dev_private;
        struct rte_flow_item_eth bcast = {
                .dst.addr_bytes = "\xff\xff\xff\xff\xff\xff",
        };
        struct rte_flow_item_eth ipv6_multi_spec = {
                .dst.addr_bytes = "\x33\x33\x00\x00\x00\x00",
        };
        struct rte_flow_item_eth ipv6_multi_mask = {
                .dst.addr_bytes = "\xff\xff\x00\x00\x00\x00",
        };
        struct rte_flow_item_eth unicast = {
                .src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
        };
        struct rte_flow_item_eth unicast_mask = {
                .dst.addr_bytes = "\xff\xff\xff\xff\xff\xff",
        };
        const unsigned int vlan_filter_n = priv->vlan_filter_n;
        const struct rte_ether_addr cmp = {
                .addr_bytes = "\x00\x00\x00\x00\x00\x00",
        };
        unsigned int i;
        unsigned int j;
        int ret;

        /*
         * The hairpin Txq default flow should be created no matter whether
         * isolated mode is enabled. Otherwise, all the packets to be sent
         * will go out directly without the Tx flow actions, e.g.
         * encapsulation.
         */
        for (i = 0; i != priv->txqs_n; ++i) {
                struct mlx5_txq_ctrl *txq_ctrl = mlx5_txq_get(dev, i);
                if (!txq_ctrl)
                        continue;
                /* Only Tx implicit mode requires the default Tx flow. */
                if (txq_ctrl->type == MLX5_TXQ_TYPE_HAIRPIN &&
                    txq_ctrl->hairpin_conf.tx_explicit == 0 &&
                    txq_ctrl->hairpin_conf.peers[0].port ==
                    priv->dev_data->port_id) {
                        ret = mlx5_ctrl_flow_source_queue(dev, i);
                        if (ret) {
                                mlx5_txq_release(dev, i);
                                goto error;
                        }
                }
                mlx5_txq_release(dev, i);
        }
        if (priv->config.dv_esw_en && !priv->config.vf && !priv->config.sf) {
                if (mlx5_flow_create_esw_table_zero_flow(dev))
                        priv->fdb_def_rule = 1;
                else
                        DRV_LOG(INFO, "port %u FDB default rule cannot be"
                                " configured - only Eswitch group 0 flows are"
                                " supported.", dev->data->port_id);
        }
        if (!priv->config.lacp_by_user && priv->pf_bond >= 0) {
                ret = mlx5_flow_lacp_miss(dev);
                if (ret)
                        DRV_LOG(INFO, "port %u LACP rule cannot be created - "
                                "forward LACP to kernel.", dev->data->port_id);
                else
                        DRV_LOG(INFO, "LACP traffic will be missed in port %u.",
                                dev->data->port_id);
        }
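        /*
         * In isolated mode, only the flows explicitly created by the
         * application are installed; no default Rx flows are added.
         */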
        if (priv->isolated)
                return 0;
        if (dev->data->promiscuous) {
                struct rte_flow_item_eth promisc = {
                        .dst.addr_bytes = "\x00\x00\x00\x00\x00\x00",
                        .src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
                        .type = 0,
                };

                ret = mlx5_ctrl_flow(dev, &promisc, &promisc);
                if (ret)
                        goto error;
        }
        if (dev->data->all_multicast) {
                struct rte_flow_item_eth multicast = {
                        .dst.addr_bytes = "\x01\x00\x00\x00\x00\x00",
                        .src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
                        .type = 0,
                };

                ret = mlx5_ctrl_flow(dev, &multicast, &multicast);
                if (ret)
                        goto error;
        } else {
                /* Add broadcast/multicast flows. */
                for (i = 0; i != vlan_filter_n; ++i) {
                        uint16_t vlan = priv->vlan_filter[i];

                        struct rte_flow_item_vlan vlan_spec = {
                                .tci = rte_cpu_to_be_16(vlan),
                        };
                        struct rte_flow_item_vlan vlan_mask =
                                rte_flow_item_vlan_mask;

                        ret = mlx5_ctrl_flow_vlan(dev, &bcast, &bcast,
                                                  &vlan_spec, &vlan_mask);
                        if (ret)
                                goto error;
                        ret = mlx5_ctrl_flow_vlan(dev, &ipv6_multi_spec,
                                                  &ipv6_multi_mask,
                                                  &vlan_spec, &vlan_mask);
                        if (ret)
                                goto error;
                }
                if (!vlan_filter_n) {
                        ret = mlx5_ctrl_flow(dev, &bcast, &bcast);
                        if (ret)
                                goto error;
                        ret = mlx5_ctrl_flow(dev, &ipv6_multi_spec,
                                             &ipv6_multi_mask);
                        if (ret) {
                                /* Do not fail on IPv6 broadcast creation failure. */
                                DRV_LOG(WARNING,
                                        "IPv6 broadcast is not supported");
                                ret = 0;
                        }
                }
        }
        /* Add MAC address flows. */
        for (i = 0; i != MLX5_MAX_MAC_ADDRESSES; ++i) {
                struct rte_ether_addr *mac = &dev->data->mac_addrs[i];

                if (!memcmp(mac, &cmp, sizeof(*mac)))
                        continue;
                memcpy(&unicast.dst.addr_bytes,
                       mac->addr_bytes,
                       RTE_ETHER_ADDR_LEN);
                for (j = 0; j != vlan_filter_n; ++j) {
                        uint16_t vlan = priv->vlan_filter[j];

                        struct rte_flow_item_vlan vlan_spec = {
                                .tci = rte_cpu_to_be_16(vlan),
                        };
                        struct rte_flow_item_vlan vlan_mask =
                                rte_flow_item_vlan_mask;

                        ret = mlx5_ctrl_flow_vlan(dev, &unicast,
                                                  &unicast_mask,
                                                  &vlan_spec,
                                                  &vlan_mask);
                        if (ret)
                                goto error;
                }
                if (!vlan_filter_n) {
                        ret = mlx5_ctrl_flow(dev, &unicast, &unicast_mask);
                        if (ret)
                                goto error;
                }
        }
        return 0;
error:
        ret = rte_errno; /* Save rte_errno before cleanup. */
        mlx5_flow_list_flush(dev, MLX5_FLOW_TYPE_CTL, false);
        rte_errno = ret; /* Restore rte_errno. */
        return -rte_errno;
}

/**
 * Disable traffic flows configured by control plane.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 */
void
mlx5_traffic_disable(struct rte_eth_dev *dev)
{
        mlx5_flow_list_flush(dev, MLX5_FLOW_TYPE_CTL, false);
}

/**
 * Restart traffic flows configured by control plane.
 *
 * @param dev
 *   Pointer to Ethernet device structure.
 *
 * @return
 *   0 on success, a negative errno value otherwise and rte_errno is set.
 */
int
mlx5_traffic_restart(struct rte_eth_dev *dev)
{
        if (dev->data->dev_started) {
                mlx5_traffic_disable(dev);
                return mlx5_traffic_enable(dev);
        }
        return 0;
}