17d652d720
Signed-off-by: Tomasz Zawadzki <tomasz.zawadzki@intel.com> Signed-off-by: Piotr Pelplinski <piotr.pelplinski@intel.com> Change-Id: I621a8a3891c8f3829564940219c70c6520c6f9c7 Reviewed-on: https://review.gerrithub.io/427899 Chandler-Test-Pool: SPDK Automated Test System <sys_sgsw@intel.com> Reviewed-by: Jim Harris <james.r.harris@intel.com> Reviewed-by: Shuhei Matsumoto <shuhei.matsumoto.xt@hitachi.com> Reviewed-by: Ben Walker <benjamin.walker@intel.com> Tested-by: SPDK CI Jenkins <sys_sgci@intel.com>
762 lines
19 KiB
C
762 lines
19 KiB
C
/*-
 *   BSD LICENSE
 *
 *   Copyright (c) Intel Corporation.
 *   All rights reserved.
 *
 *   Redistribution and use in source and binary forms, with or without
 *   modification, are permitted provided that the following conditions
 *   are met:
 *
 *     * Redistributions of source code must retain the above copyright
 *       notice, this list of conditions and the following disclaimer.
 *     * Redistributions in binary form must reproduce the above copyright
 *       notice, this list of conditions and the following disclaimer in
 *       the documentation and/or other materials provided with the
 *       distribution.
 *     * Neither the name of Intel Corporation nor the names of its
 *       contributors may be used to endorse or promote products derived
 *       from this software without specific prior written permission.
 *
 *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
|
|
|
|
#include "bdev_aio.h"
|
|
|
|
#include "spdk/stdinc.h"
|
|
|
|
#include "spdk/bdev.h"
|
|
#include "spdk/conf.h"
|
|
#include "spdk/env.h"
|
|
#include "spdk/fd.h"
|
|
#include "spdk/thread.h"
|
|
#include "spdk/json.h"
|
|
#include "spdk/util.h"
|
|
#include "spdk/string.h"
|
|
|
|
#include "spdk_internal/log.h"
|
|
|
|
/* Tunables used by the channel setup and the group poller below. */
#define SPDK_AIO_QUEUE_DEPTH 128
#define MAX_EVENTS_PER_POLL 32

/* Prototypes for functions that are referenced before they are defined. */
static int bdev_aio_initialize(void);
static void bdev_aio_fini(void);
static void bdev_aio_get_spdk_running_config(FILE *fp);
static void aio_free_disk(struct file_disk *fdisk);

/* List of file_disk entries; create_aio_disk() appends, bdev_aio_destruct() removes. */
static TAILQ_HEAD(, file_disk) g_aio_disk_head;
|
|
|
|
static int
|
|
bdev_aio_get_ctx_size(void)
|
|
{
|
|
return sizeof(struct bdev_aio_task);
|
|
}
|
|
|
|
static struct spdk_bdev_module aio_if = {
|
|
.name = "aio",
|
|
.module_init = bdev_aio_initialize,
|
|
.module_fini = bdev_aio_fini,
|
|
.config_text = bdev_aio_get_spdk_running_config,
|
|
.get_ctx_size = bdev_aio_get_ctx_size,
|
|
};
|
|
|
|
/*
 * Context of the module-level I/O channel (io_device &aio_if). The per-disk
 * channels add their eventfds to epfd, and poller drains them.
 */
struct bdev_aio_group_channel {
	/* Poller registered with bdev_aio_group_poll() as its callback. */
	struct spdk_poller	*poller;
	/* epoll instance created in bdev_aio_group_create_cb(). */
	int			epfd;
};
|
|
|
|
/* Hand the aio module descriptor to SPDK's module registration macro (defined outside this file). */
SPDK_BDEV_MODULE_REGISTER(&aio_if)
|
|
|
|
static int
|
|
bdev_aio_open(struct file_disk *disk)
|
|
{
|
|
int fd;
|
|
|
|
fd = open(disk->filename, O_RDWR | O_DIRECT);
|
|
if (fd < 0) {
|
|
/* Try without O_DIRECT for non-disk files */
|
|
fd = open(disk->filename, O_RDWR);
|
|
if (fd < 0) {
|
|
SPDK_ERRLOG("open() failed (file:%s), errno %d: %s\n",
|
|
disk->filename, errno, spdk_strerror(errno));
|
|
disk->fd = -1;
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
disk->fd = fd;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int
|
|
bdev_aio_close(struct file_disk *disk)
|
|
{
|
|
int rc;
|
|
|
|
if (disk->fd == -1) {
|
|
return 0;
|
|
}
|
|
|
|
rc = close(disk->fd);
|
|
if (rc < 0) {
|
|
SPDK_ERRLOG("close() failed (fd=%d), errno %d: %s\n",
|
|
disk->fd, errno, spdk_strerror(errno));
|
|
return -1;
|
|
}
|
|
|
|
disk->fd = -1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int64_t
|
|
bdev_aio_readv(struct file_disk *fdisk, struct spdk_io_channel *ch,
|
|
struct bdev_aio_task *aio_task,
|
|
struct iovec *iov, int iovcnt, uint64_t nbytes, uint64_t offset)
|
|
{
|
|
struct iocb *iocb = &aio_task->iocb;
|
|
struct bdev_aio_io_channel *aio_ch = spdk_io_channel_get_ctx(ch);
|
|
int rc;
|
|
|
|
io_prep_preadv(iocb, fdisk->fd, iov, iovcnt, offset);
|
|
iocb->data = aio_task;
|
|
aio_task->len = nbytes;
|
|
io_set_eventfd(iocb, aio_ch->efd);
|
|
|
|
SPDK_DEBUGLOG(SPDK_LOG_AIO, "read %d iovs size %lu to off: %#lx\n",
|
|
iovcnt, nbytes, offset);
|
|
|
|
rc = io_submit(aio_ch->io_ctx, 1, &iocb);
|
|
if (rc < 0) {
|
|
if (rc == -EAGAIN) {
|
|
spdk_bdev_io_complete(spdk_bdev_io_from_ctx(aio_task), SPDK_BDEV_IO_STATUS_NOMEM);
|
|
} else {
|
|
spdk_bdev_io_complete(spdk_bdev_io_from_ctx(aio_task), SPDK_BDEV_IO_STATUS_FAILED);
|
|
SPDK_ERRLOG("%s: io_submit returned %d\n", __func__, rc);
|
|
}
|
|
return -1;
|
|
}
|
|
aio_ch->io_inflight++;
|
|
return nbytes;
|
|
}
|
|
|
|
static int64_t
|
|
bdev_aio_writev(struct file_disk *fdisk, struct spdk_io_channel *ch,
|
|
struct bdev_aio_task *aio_task,
|
|
struct iovec *iov, int iovcnt, size_t len, uint64_t offset)
|
|
{
|
|
struct iocb *iocb = &aio_task->iocb;
|
|
struct bdev_aio_io_channel *aio_ch = spdk_io_channel_get_ctx(ch);
|
|
int rc;
|
|
|
|
io_prep_pwritev(iocb, fdisk->fd, iov, iovcnt, offset);
|
|
iocb->data = aio_task;
|
|
aio_task->len = len;
|
|
io_set_eventfd(iocb, aio_ch->efd);
|
|
|
|
SPDK_DEBUGLOG(SPDK_LOG_AIO, "write %d iovs size %lu from off: %#lx\n",
|
|
iovcnt, len, offset);
|
|
|
|
rc = io_submit(aio_ch->io_ctx, 1, &iocb);
|
|
if (rc < 0) {
|
|
if (rc == -EAGAIN) {
|
|
spdk_bdev_io_complete(spdk_bdev_io_from_ctx(aio_task), SPDK_BDEV_IO_STATUS_NOMEM);
|
|
} else {
|
|
spdk_bdev_io_complete(spdk_bdev_io_from_ctx(aio_task), SPDK_BDEV_IO_STATUS_FAILED);
|
|
SPDK_ERRLOG("%s: io_submit returned %d\n", __func__, rc);
|
|
}
|
|
return -1;
|
|
}
|
|
aio_ch->io_inflight++;
|
|
return len;
|
|
}
|
|
|
|
static void
|
|
bdev_aio_flush(struct file_disk *fdisk, struct bdev_aio_task *aio_task)
|
|
{
|
|
int rc = fsync(fdisk->fd);
|
|
|
|
spdk_bdev_io_complete(spdk_bdev_io_from_ctx(aio_task),
|
|
rc == 0 ? SPDK_BDEV_IO_STATUS_SUCCESS : SPDK_BDEV_IO_STATUS_FAILED);
|
|
}
|
|
|
|
static int
|
|
bdev_aio_destruct(void *ctx)
|
|
{
|
|
struct file_disk *fdisk = ctx;
|
|
int rc = 0;
|
|
|
|
TAILQ_REMOVE(&g_aio_disk_head, fdisk, link);
|
|
rc = bdev_aio_close(fdisk);
|
|
if (rc < 0) {
|
|
SPDK_ERRLOG("bdev_aio_close() failed\n");
|
|
}
|
|
return rc;
|
|
}
|
|
|
|
static int
|
|
bdev_aio_initialize_io_channel(struct bdev_aio_io_channel *ch)
|
|
{
|
|
ch->efd = eventfd(0, EFD_NONBLOCK | EFD_CLOEXEC);
|
|
if (ch->efd == -1) {
|
|
SPDK_ERRLOG("Cannot create efd\n");
|
|
return -1;
|
|
}
|
|
|
|
if (io_setup(SPDK_AIO_QUEUE_DEPTH, &ch->io_ctx) < 0) {
|
|
close(ch->efd);
|
|
SPDK_ERRLOG("async I/O context setup failure\n");
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int
|
|
bdev_aio_group_poll(void *arg)
|
|
{
|
|
struct bdev_aio_group_channel *group_ch = arg;
|
|
struct bdev_aio_io_channel *ch;
|
|
int nr, i, j, rc, total_nr = 0;
|
|
enum spdk_bdev_io_status status;
|
|
struct bdev_aio_task *aio_task;
|
|
struct timespec timeout;
|
|
struct io_event events[SPDK_AIO_QUEUE_DEPTH];
|
|
struct epoll_event epevents[MAX_EVENTS_PER_POLL];
|
|
|
|
timeout.tv_sec = 0;
|
|
timeout.tv_nsec = 0;
|
|
rc = epoll_wait(group_ch->epfd, epevents, MAX_EVENTS_PER_POLL, 0);
|
|
if (rc == -1) {
|
|
SPDK_ERRLOG("epoll_wait error(%d): %s on ch=%p\n", errno, spdk_strerror(errno), group_ch);
|
|
return -1;
|
|
}
|
|
|
|
for (j = 0; j < rc; j++) {
|
|
ch = epevents[j].data.ptr;
|
|
nr = io_getevents(ch->io_ctx, 1, SPDK_AIO_QUEUE_DEPTH,
|
|
events, &timeout);
|
|
|
|
if (nr < 0) {
|
|
SPDK_ERRLOG("Returned %d on bdev_aio_io_channel %p\n", nr, ch);
|
|
continue;
|
|
}
|
|
|
|
total_nr += nr;
|
|
for (i = 0; i < nr; i++) {
|
|
aio_task = events[i].data;
|
|
if (events[i].res != aio_task->len) {
|
|
status = SPDK_BDEV_IO_STATUS_FAILED;
|
|
} else {
|
|
status = SPDK_BDEV_IO_STATUS_SUCCESS;
|
|
}
|
|
|
|
spdk_bdev_io_complete(spdk_bdev_io_from_ctx(aio_task), status);
|
|
ch->io_inflight--;
|
|
}
|
|
}
|
|
|
|
return total_nr;
|
|
}
|
|
|
|
static void
|
|
_bdev_aio_get_io_inflight(struct spdk_io_channel_iter *i)
|
|
{
|
|
struct spdk_io_channel *ch = spdk_io_channel_iter_get_channel(i);
|
|
struct bdev_aio_io_channel *aio_ch = spdk_io_channel_get_ctx(ch);
|
|
|
|
if (aio_ch->io_inflight) {
|
|
spdk_for_each_channel_continue(i, -1);
|
|
return;
|
|
}
|
|
|
|
spdk_for_each_channel_continue(i, 0);
|
|
}
|
|
|
|
static int bdev_aio_reset_retry_timer(void *arg);
|
|
|
|
static void
|
|
_bdev_aio_get_io_inflight_done(struct spdk_io_channel_iter *i, int status)
|
|
{
|
|
struct file_disk *fdisk = spdk_io_channel_iter_get_ctx(i);
|
|
|
|
if (status == -1) {
|
|
fdisk->reset_retry_timer = spdk_poller_register(bdev_aio_reset_retry_timer, fdisk, 500);
|
|
return;
|
|
}
|
|
|
|
spdk_bdev_io_complete(spdk_bdev_io_from_ctx(fdisk->reset_task), SPDK_BDEV_IO_STATUS_SUCCESS);
|
|
}
|
|
|
|
static int
|
|
bdev_aio_reset_retry_timer(void *arg)
|
|
{
|
|
struct file_disk *fdisk = arg;
|
|
|
|
if (fdisk->reset_retry_timer) {
|
|
spdk_poller_unregister(&fdisk->reset_retry_timer);
|
|
}
|
|
|
|
spdk_for_each_channel(fdisk,
|
|
_bdev_aio_get_io_inflight,
|
|
fdisk,
|
|
_bdev_aio_get_io_inflight_done);
|
|
|
|
return -1;
|
|
}
|
|
|
|
static void
|
|
bdev_aio_reset(struct file_disk *fdisk, struct bdev_aio_task *aio_task)
|
|
{
|
|
fdisk->reset_task = aio_task;
|
|
|
|
bdev_aio_reset_retry_timer(fdisk);
|
|
}
|
|
|
|
static void bdev_aio_get_buf_cb(struct spdk_io_channel *ch, struct spdk_bdev_io *bdev_io)
|
|
{
|
|
switch (bdev_io->type) {
|
|
case SPDK_BDEV_IO_TYPE_READ:
|
|
bdev_aio_readv((struct file_disk *)bdev_io->bdev->ctxt,
|
|
ch,
|
|
(struct bdev_aio_task *)bdev_io->driver_ctx,
|
|
bdev_io->u.bdev.iovs,
|
|
bdev_io->u.bdev.iovcnt,
|
|
bdev_io->u.bdev.num_blocks * bdev_io->bdev->blocklen,
|
|
bdev_io->u.bdev.offset_blocks * bdev_io->bdev->blocklen);
|
|
break;
|
|
case SPDK_BDEV_IO_TYPE_WRITE:
|
|
bdev_aio_writev((struct file_disk *)bdev_io->bdev->ctxt,
|
|
ch,
|
|
(struct bdev_aio_task *)bdev_io->driver_ctx,
|
|
bdev_io->u.bdev.iovs,
|
|
bdev_io->u.bdev.iovcnt,
|
|
bdev_io->u.bdev.num_blocks * bdev_io->bdev->blocklen,
|
|
bdev_io->u.bdev.offset_blocks * bdev_io->bdev->blocklen);
|
|
break;
|
|
default:
|
|
SPDK_ERRLOG("Wrong io type\n");
|
|
break;
|
|
}
|
|
}
|
|
|
|
static int _bdev_aio_submit_request(struct spdk_io_channel *ch, struct spdk_bdev_io *bdev_io)
|
|
{
|
|
switch (bdev_io->type) {
|
|
/* Read and write operations must be performed on buffers aligned to
|
|
* bdev->required_alignment. If user specified unaligned buffers,
|
|
* get the aligned buffer from the pool by calling spdk_bdev_io_get_buf. */
|
|
case SPDK_BDEV_IO_TYPE_READ:
|
|
case SPDK_BDEV_IO_TYPE_WRITE:
|
|
spdk_bdev_io_get_buf(bdev_io, bdev_aio_get_buf_cb,
|
|
bdev_io->u.bdev.num_blocks * bdev_io->bdev->blocklen);
|
|
return 0;
|
|
case SPDK_BDEV_IO_TYPE_FLUSH:
|
|
bdev_aio_flush((struct file_disk *)bdev_io->bdev->ctxt,
|
|
(struct bdev_aio_task *)bdev_io->driver_ctx);
|
|
return 0;
|
|
|
|
case SPDK_BDEV_IO_TYPE_RESET:
|
|
bdev_aio_reset((struct file_disk *)bdev_io->bdev->ctxt,
|
|
(struct bdev_aio_task *)bdev_io->driver_ctx);
|
|
return 0;
|
|
default:
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
static void bdev_aio_submit_request(struct spdk_io_channel *ch, struct spdk_bdev_io *bdev_io)
|
|
{
|
|
if (_bdev_aio_submit_request(ch, bdev_io) < 0) {
|
|
spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_FAILED);
|
|
}
|
|
}
|
|
|
|
static bool
|
|
bdev_aio_io_type_supported(void *ctx, enum spdk_bdev_io_type io_type)
|
|
{
|
|
switch (io_type) {
|
|
case SPDK_BDEV_IO_TYPE_READ:
|
|
case SPDK_BDEV_IO_TYPE_WRITE:
|
|
case SPDK_BDEV_IO_TYPE_FLUSH:
|
|
case SPDK_BDEV_IO_TYPE_RESET:
|
|
return true;
|
|
|
|
default:
|
|
return false;
|
|
}
|
|
}
|
|
|
|
static int
|
|
bdev_aio_create_cb(void *io_device, void *ctx_buf)
|
|
{
|
|
struct bdev_aio_io_channel *ch = ctx_buf;
|
|
struct bdev_aio_group_channel *group_ch_ctx;
|
|
struct epoll_event epevent;
|
|
|
|
if (bdev_aio_initialize_io_channel(ch) != 0) {
|
|
return -1;
|
|
}
|
|
|
|
ch->group_ch = spdk_get_io_channel(&aio_if);
|
|
group_ch_ctx = spdk_io_channel_get_ctx(ch->group_ch);
|
|
|
|
epevent.events = EPOLLIN | EPOLLET;
|
|
epevent.data.ptr = ch;
|
|
if (epoll_ctl(group_ch_ctx->epfd, EPOLL_CTL_ADD, ch->efd, &epevent)) {
|
|
close(ch->efd);
|
|
io_destroy(ch->io_ctx);
|
|
spdk_put_io_channel(ch->group_ch);
|
|
SPDK_ERRLOG("epoll_ctl error\n");
|
|
return -1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
bdev_aio_destroy_cb(void *io_device, void *ctx_buf)
|
|
{
|
|
struct bdev_aio_io_channel *io_channel = ctx_buf;
|
|
struct bdev_aio_group_channel *group_ch_ctx;
|
|
struct epoll_event event;
|
|
|
|
group_ch_ctx = spdk_io_channel_get_ctx(io_channel->group_ch);
|
|
epoll_ctl(group_ch_ctx->epfd, EPOLL_CTL_DEL, io_channel->efd, &event);
|
|
spdk_put_io_channel(io_channel->group_ch);
|
|
close(io_channel->efd);
|
|
io_destroy(io_channel->io_ctx);
|
|
|
|
}
|
|
|
|
/*
 * get_io_channel callback: ctx is the file_disk, which is also the io_device
 * key registered in create_aio_disk().
 */
static struct spdk_io_channel *
bdev_aio_get_io_channel(void *ctx)
{
	struct file_disk *disk = ctx;
	struct spdk_io_channel *channel = spdk_get_io_channel(disk);

	return channel;
}
|
|
|
|
|
|
static int
|
|
bdev_aio_dump_info_json(void *ctx, struct spdk_json_write_ctx *w)
|
|
{
|
|
struct file_disk *fdisk = ctx;
|
|
|
|
spdk_json_write_name(w, "aio");
|
|
spdk_json_write_object_begin(w);
|
|
|
|
spdk_json_write_name(w, "filename");
|
|
spdk_json_write_string(w, fdisk->filename);
|
|
|
|
spdk_json_write_object_end(w);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
bdev_aio_write_json_config(struct spdk_bdev *bdev, struct spdk_json_write_ctx *w)
|
|
{
|
|
struct file_disk *fdisk = bdev->ctxt;
|
|
|
|
spdk_json_write_object_begin(w);
|
|
|
|
spdk_json_write_named_string(w, "method", "construct_aio_bdev");
|
|
|
|
spdk_json_write_named_object_begin(w, "params");
|
|
spdk_json_write_named_string(w, "name", bdev->name);
|
|
if (fdisk->block_size_override) {
|
|
spdk_json_write_named_uint32(w, "block_size", bdev->blocklen);
|
|
}
|
|
spdk_json_write_named_string(w, "filename", fdisk->filename);
|
|
spdk_json_write_object_end(w);
|
|
|
|
spdk_json_write_object_end(w);
|
|
}
|
|
|
|
static const struct spdk_bdev_fn_table aio_fn_table = {
|
|
.destruct = bdev_aio_destruct,
|
|
.submit_request = bdev_aio_submit_request,
|
|
.io_type_supported = bdev_aio_io_type_supported,
|
|
.get_io_channel = bdev_aio_get_io_channel,
|
|
.dump_info_json = bdev_aio_dump_info_json,
|
|
.write_config_json = bdev_aio_write_json_config,
|
|
};
|
|
|
|
static void aio_free_disk(struct file_disk *fdisk)
|
|
{
|
|
if (fdisk == NULL) {
|
|
return;
|
|
}
|
|
free(fdisk->filename);
|
|
free(fdisk->disk.name);
|
|
free(fdisk);
|
|
}
|
|
|
|
static int
|
|
bdev_aio_group_create_cb(void *io_device, void *ctx_buf)
|
|
{
|
|
struct bdev_aio_group_channel *ch = ctx_buf;
|
|
|
|
ch->epfd = epoll_create1(0);
|
|
if (ch->epfd == -1) {
|
|
SPDK_ERRLOG("cannot create epoll fd\n");
|
|
return -1;
|
|
}
|
|
|
|
ch->poller = spdk_poller_register(bdev_aio_group_poll, ch, 0);
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
bdev_aio_group_destroy_cb(void *io_device, void *ctx_buf)
|
|
{
|
|
struct bdev_aio_group_channel *ch = ctx_buf;
|
|
|
|
close(ch->epfd);
|
|
spdk_poller_unregister(&ch->poller);
|
|
}
|
|
|
|
struct spdk_bdev *
|
|
create_aio_disk(const char *name, const char *filename, uint32_t block_size)
|
|
{
|
|
struct file_disk *fdisk;
|
|
uint32_t detected_block_size;
|
|
uint64_t disk_size;
|
|
int rc;
|
|
|
|
fdisk = calloc(1, sizeof(*fdisk));
|
|
if (!fdisk) {
|
|
SPDK_ERRLOG("Unable to allocate enough memory for aio backend\n");
|
|
return NULL;
|
|
}
|
|
|
|
fdisk->filename = strdup(filename);
|
|
if (!fdisk->filename) {
|
|
goto error_return;
|
|
}
|
|
|
|
if (bdev_aio_open(fdisk)) {
|
|
SPDK_ERRLOG("Unable to open file %s. fd: %d errno: %d\n", filename, fdisk->fd, errno);
|
|
goto error_return;
|
|
}
|
|
|
|
disk_size = spdk_fd_get_size(fdisk->fd);
|
|
|
|
fdisk->disk.name = strdup(name);
|
|
if (!fdisk->disk.name) {
|
|
goto error_return;
|
|
}
|
|
fdisk->disk.product_name = "AIO disk";
|
|
fdisk->disk.module = &aio_if;
|
|
|
|
fdisk->disk.write_cache = 1;
|
|
|
|
detected_block_size = spdk_fd_get_blocklen(fdisk->fd);
|
|
if (block_size == 0) {
|
|
/* User did not specify block size - use autodetected block size. */
|
|
if (detected_block_size == 0) {
|
|
SPDK_ERRLOG("Block size could not be auto-detected\n");
|
|
goto error_return;
|
|
}
|
|
fdisk->block_size_override = false;
|
|
block_size = detected_block_size;
|
|
} else {
|
|
if (block_size < detected_block_size) {
|
|
SPDK_ERRLOG("Specified block size %" PRIu32 " is smaller than "
|
|
"auto-detected block size %" PRIu32 "\n",
|
|
block_size, detected_block_size);
|
|
goto error_return;
|
|
} else if (detected_block_size != 0 && block_size != detected_block_size) {
|
|
SPDK_WARNLOG("Specified block size %" PRIu32 " does not match "
|
|
"auto-detected block size %" PRIu32 "\n",
|
|
block_size, detected_block_size);
|
|
}
|
|
fdisk->block_size_override = true;
|
|
}
|
|
|
|
if (block_size < 512) {
|
|
SPDK_ERRLOG("Invalid block size %" PRIu32 " (must be at least 512).\n", block_size);
|
|
goto error_return;
|
|
}
|
|
|
|
if (!spdk_u32_is_pow2(block_size)) {
|
|
SPDK_ERRLOG("Invalid block size %" PRIu32 " (must be a power of 2.)\n", block_size);
|
|
goto error_return;
|
|
}
|
|
|
|
fdisk->disk.blocklen = block_size;
|
|
fdisk->disk.required_alignment = spdk_u32log2(block_size);
|
|
|
|
if (disk_size % fdisk->disk.blocklen != 0) {
|
|
SPDK_ERRLOG("Disk size %" PRIu64 " is not a multiple of block size %" PRIu32 "\n",
|
|
disk_size, fdisk->disk.blocklen);
|
|
goto error_return;
|
|
}
|
|
|
|
fdisk->disk.blockcnt = disk_size / fdisk->disk.blocklen;
|
|
fdisk->disk.ctxt = fdisk;
|
|
|
|
fdisk->disk.fn_table = &aio_fn_table;
|
|
|
|
spdk_io_device_register(fdisk, bdev_aio_create_cb, bdev_aio_destroy_cb,
|
|
sizeof(struct bdev_aio_io_channel),
|
|
fdisk->disk.name);
|
|
rc = spdk_bdev_register(&fdisk->disk);
|
|
if (rc) {
|
|
spdk_io_device_unregister(fdisk, NULL);
|
|
goto error_return;
|
|
}
|
|
|
|
TAILQ_INSERT_TAIL(&g_aio_disk_head, fdisk, link);
|
|
return &fdisk->disk;
|
|
|
|
error_return:
|
|
bdev_aio_close(fdisk);
|
|
aio_free_disk(fdisk);
|
|
return NULL;
|
|
}
|
|
|
|
static void
|
|
aio_io_device_unregister_cb(void *io_device)
|
|
{
|
|
struct file_disk *fdisk = io_device;
|
|
spdk_delete_aio_complete cb_fn = fdisk->delete_cb_fn;
|
|
void *cb_arg = fdisk->delete_cb_arg;
|
|
|
|
aio_free_disk(fdisk);
|
|
cb_fn(cb_arg, 0);
|
|
}
|
|
|
|
static void
|
|
aio_bdev_unregister_cb(void *arg, int bdeverrno)
|
|
{
|
|
struct file_disk *fdisk = arg;
|
|
|
|
if (bdeverrno != 0) {
|
|
fdisk->delete_cb_fn(fdisk->delete_cb_arg, bdeverrno);
|
|
return;
|
|
}
|
|
|
|
spdk_io_device_unregister(fdisk, aio_io_device_unregister_cb);
|
|
}
|
|
|
|
void
|
|
delete_aio_disk(struct spdk_bdev *bdev, spdk_delete_aio_complete cb_fn, void *cb_arg)
|
|
{
|
|
struct file_disk *fdisk;
|
|
|
|
if (!bdev || bdev->module != &aio_if) {
|
|
cb_fn(cb_arg, -ENODEV);
|
|
return;
|
|
}
|
|
|
|
fdisk = bdev->ctxt;
|
|
fdisk->delete_cb_fn = cb_fn;
|
|
fdisk->delete_cb_arg = cb_arg;
|
|
spdk_bdev_unregister(bdev, aio_bdev_unregister_cb, fdisk);
|
|
}
|
|
|
|
static int
|
|
bdev_aio_initialize(void)
|
|
{
|
|
size_t i;
|
|
struct spdk_conf_section *sp;
|
|
struct spdk_bdev *bdev;
|
|
|
|
TAILQ_INIT(&g_aio_disk_head);
|
|
spdk_io_device_register(&aio_if, bdev_aio_group_create_cb, bdev_aio_group_destroy_cb,
|
|
sizeof(struct bdev_aio_group_channel),
|
|
"aio_module");
|
|
|
|
sp = spdk_conf_find_section(NULL, "AIO");
|
|
if (!sp) {
|
|
return 0;
|
|
}
|
|
|
|
i = 0;
|
|
while (true) {
|
|
const char *file;
|
|
const char *name;
|
|
const char *block_size_str;
|
|
uint32_t block_size = 0;
|
|
|
|
file = spdk_conf_section_get_nmval(sp, "AIO", i, 0);
|
|
if (!file) {
|
|
break;
|
|
}
|
|
|
|
name = spdk_conf_section_get_nmval(sp, "AIO", i, 1);
|
|
if (!name) {
|
|
SPDK_ERRLOG("No name provided for AIO disk with file %s\n", file);
|
|
i++;
|
|
continue;
|
|
}
|
|
|
|
block_size_str = spdk_conf_section_get_nmval(sp, "AIO", i, 2);
|
|
if (block_size_str) {
|
|
block_size = atoi(block_size_str);
|
|
}
|
|
|
|
bdev = create_aio_disk(name, file, block_size);
|
|
if (!bdev) {
|
|
SPDK_ERRLOG("Unable to create AIO bdev from file %s\n", file);
|
|
i++;
|
|
continue;
|
|
}
|
|
|
|
i++;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
bdev_aio_fini(void)
|
|
{
|
|
spdk_io_device_unregister(&aio_if, NULL);
|
|
}
|
|
|
|
static void
|
|
bdev_aio_get_spdk_running_config(FILE *fp)
|
|
{
|
|
char *file;
|
|
char *name;
|
|
uint32_t block_size;
|
|
struct file_disk *fdisk;
|
|
|
|
fprintf(fp,
|
|
"\n"
|
|
"# Users must change this section to match the /dev/sdX devices to be\n"
|
|
"# exported as iSCSI LUNs. The devices are accessed using Linux AIO.\n"
|
|
"# The format is:\n"
|
|
"# AIO <file name> <bdev name> [<block size>]\n"
|
|
"# The file name is the backing device\n"
|
|
"# The bdev name can be referenced from elsewhere in the configuration file.\n"
|
|
"# Block size may be omitted to automatically detect the block size of a disk.\n"
|
|
"[AIO]\n");
|
|
|
|
TAILQ_FOREACH(fdisk, &g_aio_disk_head, link) {
|
|
file = fdisk->filename;
|
|
name = fdisk->disk.name;
|
|
block_size = fdisk->disk.blocklen;
|
|
fprintf(fp, " AIO %s %s ", file, name);
|
|
if (fdisk->block_size_override) {
|
|
fprintf(fp, "%d", block_size);
|
|
}
|
|
fprintf(fp, "\n");
|
|
}
|
|
fprintf(fp, "\n");
|
|
}
|
|
|
|
/* Declare the "aio" log component; SPDK_LOG_AIO is the flag passed to SPDK_DEBUGLOG() in this file. */
SPDK_LOG_REGISTER_COMPONENT("aio", SPDK_LOG_AIO)
|