67f57892f9
Currently the rxe driver has three work queue tasks per qp. These are the req.task, comp.task and resp.task which call rxe_requester(), rxe_completer() and rxe_responder() respectively directly or on work queues. Each of these subroutines checks to see if there is work to be performed on the send queue or on the response packet queue or the request packet queue and will run until there is no work remaining or yield the cpu and reschedule itself until there is no work remaining. This commit combines the req.task and comp.task into a single send.task and renames the resp.task to the recv.task. The combined send.task calls rxe_requester() and rxe_completer() serially and continues until all work on both the send queue and the response packet queue are done. In various benchmarks the performance is either improved or left the same. At high scale there is a significant reduction in the load on the cpu. This is the first step in combining these two tasks. Once they are serialized cross rescheduling of req.task and comp.task can be more efficiently handled by just letting the send.task continue to run. This will be done in the next several patches. Link: https://lore.kernel.org/r/20240329145513.35381-7-rpearsonhpe@gmail.com Signed-off-by: Bob Pearson <rpearsonhpe@gmail.com> Signed-off-by: Jason Gunthorpe <jgg@nvidia.com>
38 lines
870 B
C
38 lines
870 B
C
/* SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB */
|
|
/*
|
|
* Copyright (c) 2017 Mellanox Technologies Ltd. All rights reserved.
|
|
*/
|
|
|
|
#ifndef RXE_HW_COUNTERS_H
|
|
#define RXE_HW_COUNTERS_H
|
|
|
|
/*
|
|
* when adding counters to enum also add
|
|
* them to rxe_counter_name[] vector.
|
|
*/
|
|
enum rxe_counters {
|
|
RXE_CNT_SENT_PKTS,
|
|
RXE_CNT_RCVD_PKTS,
|
|
RXE_CNT_DUP_REQ,
|
|
RXE_CNT_OUT_OF_SEQ_REQ,
|
|
RXE_CNT_RCV_RNR,
|
|
RXE_CNT_SND_RNR,
|
|
RXE_CNT_RCV_SEQ_ERR,
|
|
RXE_CNT_SENDER_SCHED,
|
|
RXE_CNT_RETRY_EXCEEDED,
|
|
RXE_CNT_RNR_RETRY_EXCEEDED,
|
|
RXE_CNT_COMP_RETRY,
|
|
RXE_CNT_SEND_ERR,
|
|
RXE_CNT_LINK_DOWNED,
|
|
RXE_CNT_RDMA_SEND,
|
|
RXE_CNT_RDMA_RECV,
|
|
RXE_NUM_OF_COUNTERS
|
|
};
|
|
|
|
struct rdma_hw_stats *rxe_ib_alloc_hw_port_stats(struct ib_device *ibdev,
|
|
u32 port_num);
|
|
int rxe_ib_get_hw_stats(struct ib_device *ibdev,
|
|
struct rdma_hw_stats *stats,
|
|
u32 port, int index);
|
|
#endif /* RXE_HW_COUNTERS_H */
|