/*- * BSD LICENSE * * Copyright (c) Intel Corporation. * All rights reserved. * * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * * * Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in * the documentation and/or other materials provided with the * distribution. * * Neither the name of Intel Corporation nor the names of its * contributors may be used to endorse or promote products derived * from this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "spdk/stdinc.h" #include "spdk/env.h" #include "spdk/util.h" #include "spdk/memory.h" #include "spdk/likely.h" #include "spdk/log.h" #include "spdk_internal/idxd.h" #include "idxd.h" struct spdk_user_idxd_device { struct spdk_idxd_device idxd; struct spdk_pci_device *device; int sock_id; struct idxd_registers *registers; }; typedef bool (*spdk_idxd_probe_cb)(void *cb_ctx, struct spdk_pci_device *pci_dev); #define __user_idxd(idxd) (struct spdk_user_idxd_device *)idxd pthread_mutex_t g_driver_lock = PTHREAD_MUTEX_INITIALIZER; static struct spdk_idxd_device *idxd_attach(struct spdk_pci_device *device); /* Used for control commands, not for descriptor submission. */ static int idxd_wait_cmd(struct spdk_user_idxd_device *user_idxd, int _timeout) { uint32_t timeout = _timeout; union idxd_cmdsts_register cmd_status = {}; cmd_status.raw = spdk_mmio_read_4(&user_idxd->registers->cmdsts.raw); while (cmd_status.active && --timeout) { usleep(1); cmd_status.raw = spdk_mmio_read_4(&user_idxd->registers->cmdsts.raw); } /* Check for timeout */ if (timeout == 0 && cmd_status.active) { SPDK_ERRLOG("Command timeout, waited %u\n", _timeout); return -EBUSY; } /* Check for error */ if (cmd_status.err) { SPDK_ERRLOG("Command status reg reports error 0x%x\n", cmd_status.err); return -EINVAL; } return 0; } static int idxd_unmap_pci_bar(struct spdk_user_idxd_device *user_idxd, int bar) { int rc = 0; void *addr = NULL; if (bar == IDXD_MMIO_BAR) { addr = (void *)user_idxd->registers; } else if (bar == IDXD_WQ_BAR) { addr = (void *)user_idxd->idxd.portal; } if (addr) { rc = spdk_pci_device_unmap_bar(user_idxd->device, 0, addr); } return rc; } static int idxd_map_pci_bars(struct spdk_user_idxd_device *user_idxd) { int rc; void *addr; uint64_t phys_addr, size; rc = spdk_pci_device_map_bar(user_idxd->device, IDXD_MMIO_BAR, &addr, &phys_addr, &size); if (rc != 0 || addr == NULL) { SPDK_ERRLOG("pci_device_map_range failed with error code %d\n", rc); return -1; } user_idxd->registers = (struct idxd_registers *)addr; rc = spdk_pci_device_map_bar(user_idxd->device, IDXD_WQ_BAR, &addr, &phys_addr, &size); if (rc != 0 || addr == NULL) { SPDK_ERRLOG("pci_device_map_range failed with error code %d\n", rc); rc = idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR); if (rc) { SPDK_ERRLOG("unable to unmap MMIO bar\n"); } return -EINVAL; } user_idxd->idxd.portal = addr; return 0; } static void idxd_disable_dev(struct spdk_user_idxd_device *user_idxd) { int rc; union idxd_cmd_register cmd = {}; cmd.command_code = IDXD_DISABLE_DEV; spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw); rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US); if (rc < 0) { SPDK_ERRLOG("Error disabling device %u\n", rc); } } static int idxd_reset_dev(struct spdk_user_idxd_device *user_idxd) { int rc; union idxd_cmd_register cmd = {}; cmd.command_code = IDXD_RESET_DEVICE; spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw); rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US); if (rc < 0) { SPDK_ERRLOG("Error resetting device %u\n", rc); } return rc; } static int idxd_group_config(struct spdk_user_idxd_device *user_idxd) { int i; union idxd_groupcap_register groupcap; union idxd_enginecap_register enginecap; union idxd_wqcap_register wqcap; union idxd_offsets_register table_offsets; struct idxd_grptbl *grptbl; struct idxd_grpcfg grpcfg = {}; groupcap.raw = spdk_mmio_read_8(&user_idxd->registers->groupcap.raw); enginecap.raw = spdk_mmio_read_8(&user_idxd->registers->enginecap.raw); wqcap.raw = spdk_mmio_read_8(&user_idxd->registers->wqcap.raw); if (wqcap.num_wqs < 1) { return -ENOTSUP; } /* Build one group with all of the engines and a single work queue. */ grpcfg.wqs[0] = 1; grpcfg.flags.read_buffers_allowed = groupcap.read_bufs; for (i = 0; i < enginecap.num_engines; i++) { grpcfg.engines |= (1 << i); } table_offsets.raw[0] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[0]); table_offsets.raw[1] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[1]); grptbl = (struct idxd_grptbl *)((uint8_t *)user_idxd->registers + (table_offsets.grpcfg * IDXD_TABLE_OFFSET_MULT)); /* Write the group we've configured */ spdk_mmio_write_8(&grptbl->group[0].wqs[0], grpcfg.wqs[0]); spdk_mmio_write_8(&grptbl->group[0].wqs[1], 0); spdk_mmio_write_8(&grptbl->group[0].wqs[2], 0); spdk_mmio_write_8(&grptbl->group[0].wqs[3], 0); spdk_mmio_write_8(&grptbl->group[0].engines, grpcfg.engines); spdk_mmio_write_4(&grptbl->group[0].flags.raw, grpcfg.flags.raw); /* Write zeroes to the rest of the groups */ for (i = 1 ; i < groupcap.num_groups; i++) { spdk_mmio_write_8(&grptbl->group[i].wqs[0], 0L); spdk_mmio_write_8(&grptbl->group[i].wqs[1], 0L); spdk_mmio_write_8(&grptbl->group[i].wqs[2], 0L); spdk_mmio_write_8(&grptbl->group[i].wqs[3], 0L); spdk_mmio_write_8(&grptbl->group[i].engines, 0L); spdk_mmio_write_4(&grptbl->group[i].flags.raw, 0L); } return 0; } static int idxd_wq_config(struct spdk_user_idxd_device *user_idxd) { uint32_t i; struct spdk_idxd_device *idxd = &user_idxd->idxd; union idxd_wqcap_register wqcap; union idxd_offsets_register table_offsets; union idxd_wqcfg *wqcfg; wqcap.raw = spdk_mmio_read_8(&user_idxd->registers->wqcap.raw); SPDK_DEBUGLOG(idxd, "Total ring slots available 0x%x\n", wqcap.total_wq_size); idxd->total_wq_size = wqcap.total_wq_size; /* Spread the channels we allow per device based on the total number of WQE to try * and achieve optimal performance for common cases. */ idxd->chan_per_device = (idxd->total_wq_size >= 128) ? 8 : 4; table_offsets.raw[0] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[0]); table_offsets.raw[1] = spdk_mmio_read_8(&user_idxd->registers->offsets.raw[1]); wqcfg = (union idxd_wqcfg *)((uint8_t *)user_idxd->registers + (table_offsets.wqcfg * IDXD_TABLE_OFFSET_MULT)); for (i = 0 ; i < SPDK_COUNTOF(wqcfg->raw); i++) { wqcfg->raw[i] = spdk_mmio_read_4(&wqcfg->raw[i]); } wqcfg->wq_size = wqcap.total_wq_size; wqcfg->mode = WQ_MODE_DEDICATED; wqcfg->max_batch_shift = LOG2_WQ_MAX_BATCH; wqcfg->max_xfer_shift = LOG2_WQ_MAX_XFER; wqcfg->wq_state = WQ_ENABLED; wqcfg->priority = WQ_PRIORITY_1; for (i = 0; i < SPDK_COUNTOF(wqcfg->raw); i++) { spdk_mmio_write_4(&wqcfg->raw[i], wqcfg->raw[i]); } return 0; } static int idxd_device_configure(struct spdk_user_idxd_device *user_idxd) { int rc = 0; union idxd_gensts_register gensts_reg; union idxd_cmd_register cmd = {}; /* * Map BAR0 and BAR2 */ rc = idxd_map_pci_bars(user_idxd); if (rc) { return rc; } /* * Reset the device */ rc = idxd_reset_dev(user_idxd); if (rc) { goto err_reset; } /* * Configure groups and work queues. */ rc = idxd_group_config(user_idxd); if (rc) { goto err_group_cfg; } rc = idxd_wq_config(user_idxd); if (rc) { goto err_wq_cfg; } /* * Enable the device */ gensts_reg.raw = spdk_mmio_read_4(&user_idxd->registers->gensts.raw); assert(gensts_reg.state == IDXD_DEVICE_STATE_DISABLED); cmd.command_code = IDXD_ENABLE_DEV; spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw); rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US); gensts_reg.raw = spdk_mmio_read_4(&user_idxd->registers->gensts.raw); if ((rc < 0) || (gensts_reg.state != IDXD_DEVICE_STATE_ENABLED)) { rc = -EINVAL; SPDK_ERRLOG("Error enabling device %u\n", rc); goto err_device_enable; } /* * Enable the work queue that we've configured */ cmd.command_code = IDXD_ENABLE_WQ; cmd.operand = 0; spdk_mmio_write_4(&user_idxd->registers->cmd.raw, cmd.raw); rc = idxd_wait_cmd(user_idxd, IDXD_REGISTER_TIMEOUT_US); if (rc < 0) { SPDK_ERRLOG("Error enabling work queues 0x%x\n", rc); goto err_wq_enable; } if ((rc == 0) && (gensts_reg.state == IDXD_DEVICE_STATE_ENABLED)) { SPDK_DEBUGLOG(idxd, "Device enabled\n"); } return rc; err_wq_enable: err_device_enable: err_wq_cfg: err_group_cfg: err_reset: idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR); idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR); return rc; } static void user_idxd_device_destruct(struct spdk_idxd_device *idxd) { struct spdk_user_idxd_device *user_idxd = __user_idxd(idxd); idxd_disable_dev(user_idxd); idxd_unmap_pci_bar(user_idxd, IDXD_MMIO_BAR); idxd_unmap_pci_bar(user_idxd, IDXD_WQ_BAR); spdk_pci_device_detach(user_idxd->device); free(user_idxd); } struct idxd_enum_ctx { spdk_idxd_probe_cb probe_cb; spdk_idxd_attach_cb attach_cb; void *cb_ctx; }; /* This function must only be called while holding g_driver_lock */ static int idxd_enum_cb(void *ctx, struct spdk_pci_device *pci_dev) { struct idxd_enum_ctx *enum_ctx = ctx; struct spdk_idxd_device *idxd; if (enum_ctx->probe_cb(enum_ctx->cb_ctx, pci_dev)) { idxd = idxd_attach(pci_dev); if (idxd == NULL) { SPDK_ERRLOG("idxd_attach() failed\n"); return -EINVAL; } enum_ctx->attach_cb(enum_ctx->cb_ctx, idxd); } return 0; } static bool probe_cb(void *cb_ctx, struct spdk_pci_device *pci_dev) { struct spdk_pci_addr pci_addr __attribute__((unused)); pci_addr = spdk_pci_device_get_addr(pci_dev); SPDK_DEBUGLOG(idxd, " Found matching device at %04x:%02x:%02x.%x vendor:0x%04x device:0x%04x\n", pci_addr.domain, pci_addr.bus, pci_addr.dev, pci_addr.func, spdk_pci_device_get_vendor_id(pci_dev), spdk_pci_device_get_device_id(pci_dev)); /* Claim the device in case conflict with other process */ if (spdk_pci_device_claim(pci_dev) < 0) { return false; } return true; } static int user_idxd_probe(void *cb_ctx, spdk_idxd_attach_cb attach_cb) { int rc; struct idxd_enum_ctx enum_ctx; enum_ctx.probe_cb = probe_cb; enum_ctx.attach_cb = attach_cb; enum_ctx.cb_ctx = cb_ctx; pthread_mutex_lock(&g_driver_lock); rc = spdk_pci_enumerate(spdk_pci_idxd_get_driver(), idxd_enum_cb, &enum_ctx); pthread_mutex_unlock(&g_driver_lock); return rc; } static void user_idxd_dump_sw_err(struct spdk_idxd_device *idxd, void *portal) { struct spdk_user_idxd_device *user_idxd = __user_idxd(idxd); union idxd_swerr_register sw_err; uint16_t i; SPDK_NOTICELOG("SW Error Raw:"); for (i = 0; i < 4; i++) { sw_err.raw[i] = spdk_mmio_read_8(&user_idxd->registers->sw_err.raw[i]); SPDK_NOTICELOG(" 0x%lx\n", sw_err.raw[i]); } SPDK_NOTICELOG("SW Error error code: %#x\n", (uint8_t)(sw_err.error)); SPDK_NOTICELOG("SW Error WQ index: %u\n", (uint8_t)(sw_err.wq_idx)); SPDK_NOTICELOG("SW Error Operation: %u\n", (uint8_t)(sw_err.operation)); } static char * user_idxd_portal_get_addr(struct spdk_idxd_device *idxd) { return (char *)idxd->portal; } static struct spdk_idxd_impl g_user_idxd_impl = { .name = "user", .probe = user_idxd_probe, .destruct = user_idxd_device_destruct, .dump_sw_error = user_idxd_dump_sw_err, .portal_get_addr = user_idxd_portal_get_addr }; /* Caller must hold g_driver_lock */ static struct spdk_idxd_device * idxd_attach(struct spdk_pci_device *device) { struct spdk_user_idxd_device *user_idxd; struct spdk_idxd_device *idxd; uint32_t cmd_reg; int rc; user_idxd = calloc(1, sizeof(struct spdk_user_idxd_device)); if (user_idxd == NULL) { SPDK_ERRLOG("Failed to allocate memory for user_idxd device.\n"); return NULL; } idxd = &user_idxd->idxd; user_idxd->device = device; idxd->impl = &g_user_idxd_impl; idxd->socket_id = device->socket_id; pthread_mutex_init(&idxd->num_channels_lock, NULL); /* Enable PCI busmaster. */ spdk_pci_device_cfg_read32(device, &cmd_reg, 4); cmd_reg |= 0x4; spdk_pci_device_cfg_write32(device, cmd_reg, 4); rc = idxd_device_configure(user_idxd); if (rc) { goto err; } return idxd; err: user_idxd_device_destruct(idxd); return NULL; } SPDK_IDXD_IMPL_REGISTER(user, &g_user_idxd_impl);