Spdk/include/spdk_internal/rdma.h
Alexey Marchuk 1eae58ff6d rdma: Add statistics per qpair
These statistics can help to estimate efficiency of
Work Requests batching and show busy/idle polls ratio.

Send: the doorbell updates statistics for verbs
provider are incremented per each ibv_post_send call,
for mlx5_dv per each ibv_wr_complete call.

Recv: the doorbell updates statistics for both
providers are updated when either ibv_post_recv
or ibv_post_srq_recv functions are called.

Each qpair on initialization accepts an optional
pointer to shared statistics (nvmf/nvme poll groups).
If the pointer to statistics is not provided then
qpair allocates its own structure. That is done
to support cases when NVME RDMA initiator doesn't
use poll groups, so we can avoid checks that qpair
has statistics in IO path

Change-Id: I07dea603cb870b85ea23c42e8e2c4520b1c66252
Signed-off-by: Alexey Marchuk <alexeymar@mellanox.com>
Reviewed-on: https://review.spdk.io/gerrit/c/spdk/spdk/+/6293
Community-CI: Broadcom CI
Community-CI: Mellanox Build Bot
Tested-by: SPDK CI Jenkins <sys_sgci@intel.com>
Reviewed-by: Ben Walker <benjamin.walker@intel.com>
Reviewed-by: Jim Harris <james.r.harris@intel.com>
2021-03-01 10:17:13 +00:00

291 lines
9.5 KiB
C

/*-
* BSD LICENSE
*
* Copyright (c) Intel Corporation. All rights reserved.
* Copyright (c) Mellanox Technologies LTD. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
* * Neither the name of Intel Corporation nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef SPDK_RDMA_H
#define SPDK_RDMA_H
#include <infiniband/verbs.h>
#include <rdma/rdma_cma.h>
#include <rdma/rdma_verbs.h>
/* Contains hooks definition */
#include "spdk/nvme.h"
struct spdk_rdma_wr_stats {
/* Total number of submitted requests */
uint64_t num_submitted_wrs;
/* Total number of doorbell updates */
uint64_t doorbell_updates;
};
struct spdk_rdma_qp_stats {
struct spdk_rdma_wr_stats send;
struct spdk_rdma_wr_stats recv;
};
struct spdk_rdma_qp_init_attr {
void *qp_context;
struct ibv_cq *send_cq;
struct ibv_cq *recv_cq;
struct ibv_srq *srq;
struct ibv_qp_cap cap;
struct ibv_pd *pd;
struct spdk_rdma_qp_stats *stats;
};
struct spdk_rdma_send_wr_list {
struct ibv_send_wr *first;
struct ibv_send_wr *last;
};
struct spdk_rdma_recv_wr_list {
struct ibv_recv_wr *first;
struct ibv_recv_wr *last;
};
struct spdk_rdma_qp {
struct ibv_qp *qp;
struct rdma_cm_id *cm_id;
struct spdk_rdma_send_wr_list send_wrs;
struct spdk_rdma_recv_wr_list recv_wrs;
struct spdk_rdma_qp_stats *stats;
bool shared_stats;
};
struct spdk_rdma_mem_map;
union spdk_rdma_mr {
struct ibv_mr *mr;
uint64_t key;
};
enum SPDK_RDMA_TRANSLATION_TYPE {
SPDK_RDMA_TRANSLATION_MR = 0,
SPDK_RDMA_TRANSLATION_KEY
};
struct spdk_rdma_memory_translation {
union spdk_rdma_mr mr_or_key;
uint8_t translation_type;
};
struct spdk_rdma_srq_init_attr {
struct ibv_pd *pd;
struct spdk_rdma_wr_stats *stats;
struct ibv_srq_init_attr srq_init_attr;
};
struct spdk_rdma_srq {
struct ibv_srq *srq;
struct spdk_rdma_recv_wr_list recv_wrs;
struct spdk_rdma_wr_stats *stats;
bool shared_stats;
};
/**
* Create RDMA SRQ
*
* \param init_attr Pointer to SRQ init attr
* \return pointer to srq on success or NULL on failure. errno is updated in failure case.
*/
struct spdk_rdma_srq *spdk_rdma_srq_create(struct spdk_rdma_srq_init_attr *init_attr);
/**
* Destroy RDMA SRQ
*
* \param rdma_srq Pointer to SRQ
* \return 0 on succes, errno on failure
*/
int spdk_rdma_srq_destroy(struct spdk_rdma_srq *rdma_srq);
/**
* Append the given recv wr structure to the SRQ's outstanding recv list.
* This function accepts either a single Work Request or the first WR in a linked list.
*
* \param rdma_srq Pointer to SRQ
* \param first pointer to the first Work Request
* \return true if there were no outstanding WRs before, false otherwise
*/
bool spdk_rdma_srq_queue_recv_wrs(struct spdk_rdma_srq *rdma_srq, struct ibv_recv_wr *first);
/**
* Submit all queued receive Work Request
*
* \param rdma_srq Pointer to SRQ
* \param bad_wr Stores a pointer to the first failed WR if this function return nonzero value
* \return 0 on succes, errno on failure
*/
int spdk_rdma_srq_flush_recv_wrs(struct spdk_rdma_srq *rdma_srq, struct ibv_recv_wr **bad_wr);
/**
* Create RDMA provider specific qpair
*
* \param cm_id Pointer to RDMA_CM cm_id
* \param qp_attr Pointer to qpair init attributes
* \return Pointer to a newly created qpair on success or NULL on failure
*/
struct spdk_rdma_qp *spdk_rdma_qp_create(struct rdma_cm_id *cm_id,
struct spdk_rdma_qp_init_attr *qp_attr);
/**
* Accept a connection request. Called by the passive side (NVMEoF target)
*
* \param spdk_rdma_qp Pointer to SPDK RDMA qpair
* \param conn_param Optional information needed to establish the connection
* \return 0 on success, errno on failure
*/
int spdk_rdma_qp_accept(struct spdk_rdma_qp *spdk_rdma_qp, struct rdma_conn_param *conn_param);
/**
* Complete the connection process, must be called by the active
* side (NVMEoF initiator) upon receipt RDMA_CM_EVENT_CONNECT_RESPONSE
*
* \param spdk_rdma_qp Pointer to SPDK RDMA qpair
* \return 0 on success, errno on failure
*/
int spdk_rdma_qp_complete_connect(struct spdk_rdma_qp *spdk_rdma_qp);
/**
* Destroy RDMA provider specific qpair
*
* \param spdk_rdma_qp Pointer to SPDK RDMA qpair to be destroyed
*/
void spdk_rdma_qp_destroy(struct spdk_rdma_qp *spdk_rdma_qp);
/**
* Disconnect a connection and transition associated qpair to error state.
* Generates RDMA_CM_EVENT_DISCONNECTED on both connection sides
*
* \param spdk_rdma_qp Pointer to qpair to be disconnected
*/
int spdk_rdma_qp_disconnect(struct spdk_rdma_qp *spdk_rdma_qp);
/**
* Append the given send wr structure to the qpair's outstanding sends list.
* This function accepts either a single Work Request or the first WR in a linked list.
*
* \param spdk_rdma_qp Pointer to SPDK RDMA qpair
* \param first Pointer to the first Work Request
* \return true if there were no outstanding WRs before, false otherwise
*/
bool spdk_rdma_qp_queue_send_wrs(struct spdk_rdma_qp *spdk_rdma_qp, struct ibv_send_wr *first);
/**
* Submit all queued send Work Request
*
* \param spdk_rdma_qp Pointer to SPDK RDMA qpair
* \param bad_wr Stores a pointer to the first failed WR if this function return nonzero value
* \return 0 on succes, errno on failure
*/
int spdk_rdma_qp_flush_send_wrs(struct spdk_rdma_qp *spdk_rdma_qp, struct ibv_send_wr **bad_wr);
/**
* Append the given recv wr structure to the qpair's outstanding recv list.
* This function accepts either a single Work Request or the first WR in a linked list.
*
* \param spdk_rdma_qp Pointer to SPDK RDMA qpair
* \param first Pointer to the first Work Request
* \return true if there were no outstanding WRs before, false otherwise
*/
bool spdk_rdma_qp_queue_recv_wrs(struct spdk_rdma_qp *spdk_rdma_qp, struct ibv_recv_wr *first);
/**
* Submit all queued recv Work Request
* \param spdk_rdma_qp Pointer to SPDK RDMA qpair
* \param bad_wr Stores a pointer to the first failed WR if this function return nonzero value
* \return 0 on succes, errno on failure
*/
int spdk_rdma_qp_flush_recv_wrs(struct spdk_rdma_qp *spdk_rdma_qp, struct ibv_recv_wr **bad_wr);
/**
* Create a memory map which is used to register Memory Regions and perform address -> memory
* key translations
*
* \param pd Protection Domain which will be used to create Memory Regions
* \param hooks Optional hooks which are used to create Protection Domain or ger RKey
* \return Pointer to memory map or NULL on failure
*/
struct spdk_rdma_mem_map *spdk_rdma_create_mem_map(struct ibv_pd *pd,
struct spdk_nvme_rdma_hooks *hooks);
/**
* Free previously allocated memory map
*
* \param map Pointer to memory map to free
*/
void spdk_rdma_free_mem_map(struct spdk_rdma_mem_map **map);
/**
* Get a translation for the given address and length.
*
* Note: the user of this function should use address returned in \b translation structure
*
* \param map Pointer to translation map
* \param address Memory address for translation
* \param length Length of the memory address
* \param[in,out] translation Pointer to translation result to be filled by this function
* \retval -EINVAL if translation is not found
* \retval 0 translation succeed
*/
int spdk_rdma_get_translation(struct spdk_rdma_mem_map *map, void *address,
size_t length, struct spdk_rdma_memory_translation *translation);
/**
* Helper function for retrieving Local Memory Key. Should be applied to a translation
* returned by \b spdk_rdma_get_translation
*
* \param translation Memory translation
* \return Local Memory Key
*/
static inline uint32_t spdk_rdma_memory_translation_get_lkey(struct spdk_rdma_memory_translation
*translation)
{
return translation->translation_type == SPDK_RDMA_TRANSLATION_MR ?
translation->mr_or_key.mr->lkey : (uint32_t)translation->mr_or_key.key;
}
/**
* Helper function for retrieving Remote Memory Key. Should be applied to a translation
* returned by \b spdk_rdma_get_translation
*
* \param translation Memory translation
* \return Remote Memory Key
*/
static inline uint32_t spdk_rdma_memory_translation_get_rkey(struct spdk_rdma_memory_translation
*translation)
{
return translation->translation_type == SPDK_RDMA_TRANSLATION_MR ?
translation->mr_or_key.mr->rkey : (uint32_t)translation->mr_or_key.key;
}
#endif /* SPDK_RDMA_H */