Spdk/lib/idxd/idxd_user.c

560 lines
16 KiB
C
Raw Normal View History

/* SPDX-License-Identifier: BSD-3-Clause
* Copyright (c) Intel Corporation.
* All rights reserved.
*
*/
#include "spdk/stdinc.h"
#include "spdk/env.h"
#include "spdk/util.h"
#include "spdk/memory.h"
#include "spdk/likely.h"
#include "spdk/log.h"
#include "spdk_internal/idxd.h"
#include "idxd_internal.h"
struct spdk_user_idxd_device {
struct spdk_idxd_device idxd;
struct spdk_pci_device *device;
int sock_id;
struct idxd_registers *registers;
};
#define __user_idxd(idxd) (struct spdk_user_idxd_device *)idxd
pthread_mutex_t g_driver_lock = PTHREAD_MUTEX_INITIALIZER;
static struct spdk_idxd_device *idxd_attach(struct spdk_pci_device *device);
/* Used for control commands, not for descriptor submission. */
static int
idxd_wait_cmd(struct spdk_user_idxd_device *user_idxd, int _timeout)
{
uint32_t timeout = _timeout;
union idxd_cmdsts_register cmd_status = {};
cmd_status.raw = spdk_mmio_read_4(&user_idxd->registers->cmdsts.raw);
while (cmd_status.active && --timeout) {
usleep(1);
cmd_status.raw = spdk_mmio_read_4(&user_idxd->registers->cmdsts.raw);
}
/* Check for timeout */
if (timeout == 0 && cmd_status.active) {
SPDK_ERRLOG("Command timeout, waited %u\n", _timeout);
return -EBUSY;
}
/* Check for error */
if (cmd_status.err) {
SPDK_ERRLOG("Command status reg reports error 0x%x\n", cmd_status.err);
return -EINVAL;
}
return 0;
}
static int
idxd_unmap_pci_bar(struct spdk_user_idxd_device *user_idxd, int bar)
{
int rc = 0;
void *addr = NULL;
if (bar == IDXD_MMIO_BAR) {
addr = (void *)user_idxd->registers;
} else if (bar == IDXD_WQ_BAR) {
addr = (void *)user_idxd->idxd.portal;
}
if (addr) {
rc = spdk_pci_device_unmap_bar(user_idxd->device, 0, addr);
}
return rc;
}
static int
idxd_map_pci_bars(struct spdk_user_idxd_device *user_idxd)
{
int rc;
void *addr;
uint64_t phys_addr, size;
rc = spdk_pci_device_map_bar(user_idxd->device, IDXD_MMIO_BAR, &addr, &phys_addr, &size);
if (rc != 0 || addr == NULL) {
SPDK_ERRLOG("pci_device_map_range failed with error code %d\n", rc);
return -1;
}
user_idxd->registers = (struct idxd_registers *)addr;
rc = spdk_pci_device_map_bar(user_idxd->device, IDXD_WQ_BAR, &addr, &phys_addr, &size);
if (rc != 0 || addr == NULL) {
SPDK_ERRLOG("pci_device_map_range failed with error code %d\n", rc);
rc = idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR);
if (rc) {
SPDK_ERRLOG("unable to unmap MMIO bar\n");
}
return -EINVAL;
}
user_idxd->idxd.portal = addr;
return 0;
}
static void
idxd_disable_dev(struct spdk_user_idxd_device *user_idxd)
{
int rc;
union idxd_cmd_register cmd = {};
cmd.command_code = IDXD_DISABLE_DEV;
assert(&user_idxd->registers->cmd.raw); /* scan-build */
spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw);
rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US);
if (rc < 0) {
SPDK_ERRLOG("Error disabling device %u\n", rc);
}
}
static int
idxd_reset_dev(struct spdk_user_idxd_device *user_idxd)
{
int rc;
union idxd_cmd_register cmd = {};
cmd.command_code = IDXD_RESET_DEVICE;
spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw);
rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US);
if (rc < 0) {
SPDK_ERRLOG("Error resetting device %u\n", rc);
}
return rc;
}
static int
idxd_group_config(struct spdk_user_idxd_device *user_idxd)
{
int i;
union idxd_groupcap_register groupcap;
union idxd_enginecap_register enginecap;
union idxd_wqcap_register wqcap;
union idxd_offsets_register table_offsets;
struct idxd_grptbl *grptbl;
struct idxd_grpcfg grpcfg = {};
groupcap.raw = spdk_mmio_read_8(&user_idxd->registers->groupcap.raw);
enginecap.raw = spdk_mmio_read_8(&user_idxd->registers->enginecap.raw);
wqcap.raw = spdk_mmio_read_8(&user_idxd->registers->wqcap.raw);
if (wqcap.num_wqs < 1) {
return -ENOTSUP;
}
/* Build one group with all of the engines and a single work queue. */
grpcfg.wqs[0] = 1;
grpcfg.flags.read_buffers_allowed = groupcap.read_bufs;
for (i = 0; i < enginecap.num_engines; i++) {
grpcfg.engines |= (1 << i);
}
table_offsets.raw[0] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[0]);
table_offsets.raw[1] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[1]);
grptbl = (struct idxd_grptbl *)((uint8_t *)user_idxd->registers + (table_offsets.grpcfg *
IDXD_TABLE_OFFSET_MULT));
/* Write the group we've configured */
spdk_mmio_write_8(&grptbl->group[0].wqs[0], grpcfg.wqs[0]);
spdk_mmio_write_8(&grptbl->group[0].wqs[1], 0);
spdk_mmio_write_8(&grptbl->group[0].wqs[2], 0);
spdk_mmio_write_8(&grptbl->group[0].wqs[3], 0);
spdk_mmio_write_8(&grptbl->group[0].engines, grpcfg.engines);
spdk_mmio_write_4(&grptbl->group[0].flags.raw, grpcfg.flags.raw);
/* Write zeroes to the rest of the groups */
for (i = 1 ; i < groupcap.num_groups; i++) {
spdk_mmio_write_8(&grptbl->group[i].wqs[0], 0L);
spdk_mmio_write_8(&grptbl->group[i].wqs[1], 0L);
spdk_mmio_write_8(&grptbl->group[i].wqs[2], 0L);
spdk_mmio_write_8(&grptbl->group[i].wqs[3], 0L);
spdk_mmio_write_8(&grptbl->group[i].engines, 0L);
spdk_mmio_write_4(&grptbl->group[i].flags.raw, 0L);
}
return 0;
}
static int
idxd_wq_config(struct spdk_user_idxd_device *user_idxd)
{
uint32_t i;
struct spdk_idxd_device *idxd = &user_idxd->idxd;
union idxd_wqcap_register wqcap;
union idxd_offsets_register table_offsets;
union idxd_wqcfg *wqcfg;
wqcap.raw = spdk_mmio_read_8(&user_idxd->registers->wqcap.raw);
SPDK_DEBUGLOG(idxd, "Total ring slots available 0x%x\n", wqcap.total_wq_size);
idxd->total_wq_size = wqcap.total_wq_size;
/* Spread the channels we allow per device based on the total number of WQE to try
* and achieve optimal performance for common cases.
*/
idxd->chan_per_device = (idxd->total_wq_size >= 128) ? 8 : 4;
table_offsets.raw[0] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[0]);
table_offsets.raw[1] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[1]);
wqcfg = (union idxd_wqcfg *)((uint8_t *)user_idxd->registers + (table_offsets.wqcfg *
IDXD_TABLE_OFFSET_MULT));
for (i = 0 ; i < SPDK_COUNTOF(wqcfg->raw); i++) {
wqcfg->raw[i] = spdk_mmio_read_4(&wqcfg->raw[i]);
}
wqcfg->wq_size = wqcap.total_wq_size;
wqcfg->mode = WQ_MODE_DEDICATED;
wqcfg->max_batch_shift = LOG2_WQ_MAX_BATCH;
wqcfg->max_xfer_shift = LOG2_WQ_MAX_XFER;
wqcfg->wq_state = WQ_ENABLED;
wqcfg->priority = WQ_PRIORITY_1;
for (i = 0; i < SPDK_COUNTOF(wqcfg->raw); i++) {
spdk_mmio_write_4(&wqcfg->raw[i], wqcfg->raw[i]);
}
return 0;
}
static int
idxd_device_configure(struct spdk_user_idxd_device *user_idxd)
{
int rc = 0;
union idxd_gensts_register gensts_reg;
union idxd_cmd_register cmd = {};
/*
* Map BAR0 and BAR2
*/
rc = idxd_map_pci_bars(user_idxd);
if (rc) {
return rc;
}
/*
* Reset the device
*/
rc = idxd_reset_dev(user_idxd);
if (rc) {
goto err_reset;
}
/*
* Save the device version for use in the common library code.
*/
user_idxd->idxd.version = user_idxd->registers->version;
/*
* Configure groups and work queues.
*/
rc = idxd_group_config(user_idxd);
if (rc) {
goto err_group_cfg;
}
rc = idxd_wq_config(user_idxd);
if (rc) {
goto err_wq_cfg;
}
/*
* Enable the device
*/
gensts_reg.raw = spdk_mmio_read_4(&user_idxd->registers->gensts.raw);
assert(gensts_reg.state == IDXD_DEVICE_STATE_DISABLED);
cmd.command_code = IDXD_ENABLE_DEV;
spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw);
rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US);
gensts_reg.raw = spdk_mmio_read_4(&user_idxd->registers->gensts.raw);
if ((rc < 0) || (gensts_reg.state != IDXD_DEVICE_STATE_ENABLED)) {
rc = -EINVAL;
SPDK_ERRLOG("Error enabling device %u\n", rc);
goto err_device_enable;
}
/*
* Enable the work queue that we've configured
*/
cmd.command_code = IDXD_ENABLE_WQ;
cmd.operand = 0;
spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw);
rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US);
if (rc < 0) {
SPDK_ERRLOG("Error enabling work queues 0x%x\n", rc);
goto err_wq_enable;
}
if ((rc == 0) && (gensts_reg.state == IDXD_DEVICE_STATE_ENABLED)) {
SPDK_DEBUGLOG(idxd, "Device enabled VID 0x%x DID 0x%x\n",
user_idxd->device->id.vendor_id, user_idxd->device->id.device_id);
}
return rc;
err_wq_enable:
err_device_enable:
err_wq_cfg:
err_group_cfg:
err_reset:
idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR);
idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR);
return rc;
}
static void
user_idxd_device_destruct(struct spdk_idxd_device *idxd)
{
struct spdk_user_idxd_device *user_idxd = __user_idxd(idxd);
idxd_disable_dev(user_idxd);
idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR);
idxd_unmap_pci_bar(user_idxd, IDXD_WQ_BAR);
spdk_pci_device_detach(user_idxd->device);
if (idxd->type == IDXD_DEV_TYPE_IAA) {
spdk_free(idxd->aecs);
}
free(user_idxd);
}
struct idxd_enum_ctx {
spdk_idxd_probe_cb probe_cb;
spdk_idxd_attach_cb attach_cb;
void *cb_ctx;
};
static bool
probe_cb(void *cb_ctx, struct spdk_pci_device *pci_dev)
{
struct spdk_pci_addr pci_addr __attribute__((unused));
pci_addr = spdk_pci_device_get_addr(pci_dev);
SPDK_DEBUGLOG(idxd,
" Found matching device at %04x:%02x:%02x.%x vendor:0x%04x device:0x%04x\n",
pci_addr.domain,
pci_addr.bus,
pci_addr.dev,
pci_addr.func,
spdk_pci_device_get_vendor_id(pci_dev),
spdk_pci_device_get_device_id(pci_dev));
/* Claim the device in case conflict with other process */
if (spdk_pci_device_claim(pci_dev) < 0) {
return false;
}
return true;
}
/* This function must only be called while holding g_driver_lock */
static int
idxd_enum_cb(void *ctx, struct spdk_pci_device *pci_dev)
{
struct idxd_enum_ctx *enum_ctx = ctx;
struct spdk_idxd_device *idxd;
/* Call the user probe_cb to see if they want this device or not, if not
* skip it with a positive return code.
*/
if (enum_ctx->probe_cb(enum_ctx->cb_ctx, pci_dev) == false) {
return 1;
}
if (probe_cb(enum_ctx->cb_ctx, pci_dev)) {
idxd = idxd_attach(pci_dev);
if (idxd == NULL) {
SPDK_ERRLOG("idxd_attach() failed\n");
return -EINVAL;
}
enum_ctx->attach_cb(enum_ctx->cb_ctx, idxd);
}
return 0;
}
/* The IDXD driver supports 2 distinct HW units, DSA and IAA. */
static int
user_idxd_probe(void *cb_ctx, spdk_idxd_attach_cb attach_cb,
spdk_idxd_probe_cb probe_cb)
{
int rc;
struct idxd_enum_ctx enum_ctx;
enum_ctx.probe_cb = probe_cb;
enum_ctx.attach_cb = attach_cb;
enum_ctx.cb_ctx = cb_ctx;
pthread_mutex_lock(&g_driver_lock);
rc = spdk_pci_enumerate(spdk_pci_idxd_get_driver(), idxd_enum_cb, &enum_ctx);
pthread_mutex_unlock(&g_driver_lock);
assert(rc == 0);
return rc;
}
static void
user_idxd_dump_sw_err(struct spdk_idxd_device *idxd, void *portal)
{
struct spdk_user_idxd_device *user_idxd = __user_idxd(idxd);
union idxd_swerr_register sw_err;
uint16_t i;
SPDK_NOTICELOG("SW Error Raw:");
for (i = 0; i < 4; i++) {
sw_err.raw[i] = spdk_mmio_read_8(&user_idxd->registers->sw_err.raw[i]);
SPDK_NOTICELOG(" 0x%lx\n", sw_err.raw[i]);
}
SPDK_NOTICELOG("SW Error error code: %#x\n", (uint8_t)(sw_err.error));
SPDK_NOTICELOG("SW Error WQ index: %u\n", (uint8_t)(sw_err.wq_idx));
SPDK_NOTICELOG("SW Error Operation: %u\n", (uint8_t)(sw_err.operation));
}
static char *
user_idxd_portal_get_addr(struct spdk_idxd_device *idxd)
{
return (char *)idxd->portal;
}
static struct spdk_idxd_impl g_user_idxd_impl = {
.name = "user",
.probe = user_idxd_probe,
.destruct = user_idxd_device_destruct,
.dump_sw_error = user_idxd_dump_sw_err,
.portal_get_addr = user_idxd_portal_get_addr
};
/*
* Fixed Huffman tables the IAA hardware requires to implement RFC-1951.
*/
const uint32_t fixed_ll_sym[286] = {
0x40030, 0x40031, 0x40032, 0x40033, 0x40034, 0x40035, 0x40036, 0x40037,
0x40038, 0x40039, 0x4003A, 0x4003B, 0x4003C, 0x4003D, 0x4003E, 0x4003F,
0x40040, 0x40041, 0x40042, 0x40043, 0x40044, 0x40045, 0x40046, 0x40047,
0x40048, 0x40049, 0x4004A, 0x4004B, 0x4004C, 0x4004D, 0x4004E, 0x4004F,
0x40050, 0x40051, 0x40052, 0x40053, 0x40054, 0x40055, 0x40056, 0x40057,
0x40058, 0x40059, 0x4005A, 0x4005B, 0x4005C, 0x4005D, 0x4005E, 0x4005F,
0x40060, 0x40061, 0x40062, 0x40063, 0x40064, 0x40065, 0x40066, 0x40067,
0x40068, 0x40069, 0x4006A, 0x4006B, 0x4006C, 0x4006D, 0x4006E, 0x4006F,
0x40070, 0x40071, 0x40072, 0x40073, 0x40074, 0x40075, 0x40076, 0x40077,
0x40078, 0x40079, 0x4007A, 0x4007B, 0x4007C, 0x4007D, 0x4007E, 0x4007F,
0x40080, 0x40081, 0x40082, 0x40083, 0x40084, 0x40085, 0x40086, 0x40087,
0x40088, 0x40089, 0x4008A, 0x4008B, 0x4008C, 0x4008D, 0x4008E, 0x4008F,
0x40090, 0x40091, 0x40092, 0x40093, 0x40094, 0x40095, 0x40096, 0x40097,
0x40098, 0x40099, 0x4009A, 0x4009B, 0x4009C, 0x4009D, 0x4009E, 0x4009F,
0x400A0, 0x400A1, 0x400A2, 0x400A3, 0x400A4, 0x400A5, 0x400A6, 0x400A7,
0x400A8, 0x400A9, 0x400AA, 0x400AB, 0x400AC, 0x400AD, 0x400AE, 0x400AF,
0x400B0, 0x400B1, 0x400B2, 0x400B3, 0x400B4, 0x400B5, 0x400B6, 0x400B7,
0x400B8, 0x400B9, 0x400BA, 0x400BB, 0x400BC, 0x400BD, 0x400BE, 0x400BF,
0x48190, 0x48191, 0x48192, 0x48193, 0x48194, 0x48195, 0x48196, 0x48197,
0x48198, 0x48199, 0x4819A, 0x4819B, 0x4819C, 0x4819D, 0x4819E, 0x4819F,
0x481A0, 0x481A1, 0x481A2, 0x481A3, 0x481A4, 0x481A5, 0x481A6, 0x481A7,
0x481A8, 0x481A9, 0x481AA, 0x481AB, 0x481AC, 0x481AD, 0x481AE, 0x481AF,
0x481B0, 0x481B1, 0x481B2, 0x481B3, 0x481B4, 0x481B5, 0x481B6, 0x481B7,
0x481B8, 0x481B9, 0x481BA, 0x481BB, 0x481BC, 0x481BD, 0x481BE, 0x481BF,
0x481C0, 0x481C1, 0x481C2, 0x481C3, 0x481C4, 0x481C5, 0x481C6, 0x481C7,
0x481C8, 0x481C9, 0x481CA, 0x481CB, 0x481CC, 0x481CD, 0x481CE, 0x481CF,
0x481D0, 0x481D1, 0x481D2, 0x481D3, 0x481D4, 0x481D5, 0x481D6, 0x481D7,
0x481D8, 0x481D9, 0x481DA, 0x481DB, 0x481DC, 0x481DD, 0x481DE, 0x481DF,
0x481E0, 0x481E1, 0x481E2, 0x481E3, 0x481E4, 0x481E5, 0x481E6, 0x481E7,
0x481E8, 0x481E9, 0x481EA, 0x481EB, 0x481EC, 0x481ED, 0x481EE, 0x481EF,
0x481F0, 0x481F1, 0x481F2, 0x481F3, 0x481F4, 0x481F5, 0x481F6, 0x481F7,
0x481F8, 0x481F9, 0x481FA, 0x481FB, 0x481FC, 0x481FD, 0x481FE, 0x481FF,
0x38000, 0x38001, 0x38002, 0x38003, 0x38004, 0x38005, 0x38006, 0x38007,
0x38008, 0x38009, 0x3800A, 0x3800B, 0x3800C, 0x3800D, 0x3800E, 0x3800F,
0x38010, 0x38011, 0x38012, 0x38013, 0x38014, 0x38015, 0x38016, 0x38017,
0x400C0, 0x400C1, 0x400C2, 0x400C3, 0x400C4, 0x400C5
};
const uint32_t fixed_d_sym[30] = {
0x28000, 0x28001, 0x28002, 0x28003, 0x28004, 0x28005, 0x28006, 0x28007,
0x28008, 0x28009, 0x2800A, 0x2800B, 0x2800C, 0x2800D, 0x2800E, 0x2800F,
0x28010, 0x28011, 0x28012, 0x28013, 0x28014, 0x28015, 0x28016, 0x28017,
0x28018, 0x28019, 0x2801A, 0x2801B, 0x2801C, 0x2801D
};
#define DYNAMIC_HDR 0x2
#define DYNAMIC_HDR_SIZE 3
/* Caller must hold g_driver_lock */
static struct spdk_idxd_device *
idxd_attach(struct spdk_pci_device *device)
{
struct spdk_user_idxd_device *user_idxd;
struct spdk_idxd_device *idxd;
uint16_t did = device->id.device_id;
uint32_t cmd_reg;
int rc;
user_idxd = calloc(1, sizeof(struct spdk_user_idxd_device));
if (user_idxd == NULL) {
SPDK_ERRLOG("Failed to allocate memory for user_idxd device.\n");
return NULL;
}
idxd = &user_idxd->idxd;
if (did == PCI_DEVICE_ID_INTEL_DSA) {
idxd->type = IDXD_DEV_TYPE_DSA;
} else if (did == PCI_DEVICE_ID_INTEL_IAA) {
idxd->type = IDXD_DEV_TYPE_IAA;
idxd->aecs = spdk_zmalloc(sizeof(struct iaa_aecs),
0x20, NULL,
SPDK_ENV_LCORE_ID_ANY, SPDK_MALLOC_DMA);
if (idxd->aecs == NULL) {
SPDK_ERRLOG("Failed to allocate iaa aecs\n");
goto err;
}
/* Configure aecs table using fixed Huffman table */
idxd->aecs->output_accum[0] = DYNAMIC_HDR | 1;
idxd->aecs->num_output_accum_bits = DYNAMIC_HDR_SIZE;
/* Add Huffman table to aecs */
memcpy(idxd->aecs->ll_sym, fixed_ll_sym, sizeof(fixed_ll_sym));
memcpy(idxd->aecs->d_sym, fixed_d_sym, sizeof(fixed_d_sym));
}
user_idxd->device = device;
idxd->impl = &g_user_idxd_impl;
idxd->socket_id = device->socket_id;
pthread_mutex_init(&idxd->num_channels_lock, NULL);
/* Enable PCI busmaster. */
spdk_pci_device_cfg_read32(device, &cmd_reg, 4);
cmd_reg |= 0x4;
spdk_pci_device_cfg_write32(device, cmd_reg, 4);
rc = idxd_device_configure(user_idxd);
if (rc) {
goto err;
}
return idxd;
err:
user_idxd_device_destruct(idxd);
return NULL;
}
SPDK_IDXD_IMPL_REGISTER(user, &g_user_idxd_impl);