summary refs log tree commit diff stats
path: root/src/spdk/module/bdev/null/bdev_null.c
diff options
context:
space:
mode:
author Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-21 11:54:28 +0000
committer Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-21 11:54:28 +0000
commit e6918187568dbd01842d8d1d2c808ce16a894239 (patch)
tree 64f88b554b444a49f656b6c656111a145cbbaa28 /src/spdk/module/bdev/null/bdev_null.c
parent Initial commit. (diff)
download ceph-e6918187568dbd01842d8d1d2c808ce16a894239.tar.xz
ceph-e6918187568dbd01842d8d1d2c808ce16a894239.zip
Adding upstream version 18.2.2.upstream/18.2.2
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'src/spdk/module/bdev/null/bdev_null.c')
-rw-r--r-- src/spdk/module/bdev/null/bdev_null.c 550
1 files changed, 550 insertions, 0 deletions
diff --git a/src/spdk/module/bdev/null/bdev_null.c b/src/spdk/module/bdev/null/bdev_null.c
new file mode 100644
index 000000000..97aa8b03f
--- /dev/null
+++ b/src/spdk/module/bdev/null/bdev_null.c
@@ -0,0 +1,550 @@
+/*-
+ * BSD LICENSE
+ *
+ * Copyright (c) Intel Corporation. All rights reserved.
+ * Copyright (c) 2019 Mellanox Technologies LTD. All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * * Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * * Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in
+ * the documentation and/or other materials provided with the
+ * distribution.
+ * * Neither the name of Intel Corporation nor the names of its
+ * contributors may be used to endorse or promote products derived
+ * from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+ * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+ * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+ * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+ * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+ * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+ * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include "spdk/stdinc.h"
+
+#include "spdk/bdev.h"
+#include "spdk/conf.h"
+#include "spdk/env.h"
+#include "spdk/thread.h"
+#include "spdk/json.h"
+#include "spdk/string.h"
+#include "spdk/likely.h"
+
+#include "spdk/bdev_module.h"
+#include "spdk_internal/log.h"
+
+#include "bdev_null.h"
+
+struct null_bdev { /* Per-device state for one null bdev; allocated and registered by bdev_null_create(). */
+ struct spdk_bdev bdev; /* Generic bdev object passed to spdk_bdev_register(). */
+ TAILQ_ENTRY(null_bdev) tailq; /* Linkage in the g_null_bdev_head list. */
+};
+
+struct null_io_channel { /* Per-channel context; its size is passed to spdk_io_device_register() in bdev_null_initialize(). */
+ struct spdk_poller *poller; /* Poller running null_io_poll() for this channel. */
+ TAILQ_HEAD(, spdk_bdev_io) io; /* I/O queued by bdev_null_submit_request() and completed by null_io_poll(). */
+};
+
+static TAILQ_HEAD(, null_bdev) g_null_bdev_head; /* List of all null bdevs; its address is also used as the io_device key. */
+static void *g_null_read_buf; /* Shared zeroed buffer given to reads that arrive without a data buffer. */
+
+static int bdev_null_initialize(void); /* Module init hook (see null_if). */
+static void bdev_null_finish(void); /* Module fini hook (see null_if). */
+static void bdev_null_get_spdk_running_config(FILE *fp); /* Legacy config text writer (see null_if). */
+
+static struct spdk_bdev_module null_if = { /* Module descriptor for the "null" bdev module. */
+ .name = "null",
+ .module_init = bdev_null_initialize,
+ .module_fini = bdev_null_finish,
+ .config_text = bdev_null_get_spdk_running_config,
+ .async_fini = true, /* Finish is signalled later, from _bdev_null_finish_cb(), via spdk_bdev_module_finish_done(). */
+};
+
+SPDK_BDEV_MODULE_REGISTER(null, &null_if)
+
+/*
+ * Destruct callback installed in null_fn_table.
+ *
+ * ctx is the null_bdev that bdev_null_create() stored in bdev.ctxt. The
+ * device is unlinked from the global list, then its name and the container
+ * itself are released. Always returns 0.
+ */
+static int
+bdev_null_destruct(void *ctx)
+{
+	struct null_bdev *null_disk = ctx;
+
+	TAILQ_REMOVE(&g_null_bdev_head, null_disk, tailq);
+
+	free(null_disk->bdev.name);
+	free(null_disk);
+
+	return 0;
+}
+
+/*
+ * Try to abort an I/O that is still waiting on the channel's queue.
+ *
+ * ch            channel whose pending queue is searched
+ * bio_to_abort  the I/O the caller wants aborted
+ *
+ * Returns true when the I/O was found; in that case it has been removed from
+ * the queue and completed with SPDK_BDEV_IO_STATUS_ABORTED. Returns false
+ * when the I/O is not on this channel's queue.
+ */
+static bool
+bdev_null_abort_io(struct null_io_channel *ch, struct spdk_bdev_io *bio_to_abort)
+{
+	struct spdk_bdev_io *queued;
+
+	TAILQ_FOREACH(queued, &ch->io, module_link) {
+		if (queued != bio_to_abort) {
+			continue;
+		}
+
+		/* Found it: we return right away, so removing inside the loop is safe. */
+		TAILQ_REMOVE(&ch->io, queued, module_link);
+		spdk_bdev_io_complete(queued, SPDK_BDEV_IO_STATUS_ABORTED);
+		return true;
+	}
+
+	return false;
+}
+
+/*
+ * submit_request callback installed in null_fn_table.
+ *
+ * READ, WRITE, WRITE_ZEROES and RESET requests are appended to the channel's
+ * queue; null_io_poll() later completes them with SUCCESS. ABORT is handled
+ * inline by searching that queue. Every other I/O type is completed with
+ * FAILED immediately.
+ *
+ * When the bdev has DIF enabled, protection information is generated into
+ * the read buffers and verified on the write buffers before the request is
+ * queued; a failure in either step completes the request with FAILED.
+ *
+ * _ch      I/O channel whose context is a struct null_io_channel
+ * bdev_io  the request to process
+ */
+static void
+bdev_null_submit_request(struct spdk_io_channel *_ch, struct spdk_bdev_io *bdev_io)
+{
+	struct null_io_channel *ch = spdk_io_channel_get_ctx(_ch);
+	struct spdk_bdev *bdev = bdev_io->bdev;
+	struct spdk_dif_ctx dif_ctx;
+	struct spdk_dif_error err_blk;
+	uint64_t nbytes;
+	int rc;
+
+	/* The DIF context is only needed (and only initialized) for READ/WRITE. */
+	if (SPDK_DIF_DISABLE != bdev->dif_type &&
+	    (SPDK_BDEV_IO_TYPE_READ == bdev_io->type ||
+	     SPDK_BDEV_IO_TYPE_WRITE == bdev_io->type)) {
+		rc = spdk_dif_ctx_init(&dif_ctx,
+				       bdev->blocklen,
+				       bdev->md_len,
+				       bdev->md_interleave,
+				       bdev->dif_is_head_of_md,
+				       bdev->dif_type,
+				       bdev->dif_check_flags,
+				       bdev_io->u.bdev.offset_blocks & 0xFFFFFFFF,
+				       0xFFFF, 0, 0, 0);
+		if (0 != rc) {
+			SPDK_ERRLOG("Failed to initialize DIF context, error %d\n", rc);
+			spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_FAILED);
+			return;
+		}
+	}
+
+	switch (bdev_io->type) {
+	case SPDK_BDEV_IO_TYPE_READ:
+		if (bdev_io->u.bdev.iovs[0].iov_base == NULL) {
+			/* No buffer supplied: point the single iovec at the shared read buffer. */
+			assert(bdev_io->u.bdev.iovcnt == 1);
+			nbytes = bdev_io->u.bdev.num_blocks * bdev->blocklen;
+			if (spdk_unlikely(nbytes > SPDK_BDEV_LARGE_BUF_MAX_SIZE)) {
+				SPDK_ERRLOG("Overflow occurred. Read I/O size %" PRIu64 " was larger than permitted %d\n",
+					    nbytes,
+					    SPDK_BDEV_LARGE_BUF_MAX_SIZE);
+				spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_FAILED);
+				return;
+			}
+			bdev_io->u.bdev.iovs[0].iov_base = g_null_read_buf;
+			bdev_io->u.bdev.iovs[0].iov_len = nbytes;
+		}
+		if (SPDK_DIF_DISABLE != bdev->dif_type) {
+			rc = spdk_dif_generate(bdev_io->u.bdev.iovs, bdev_io->u.bdev.iovcnt,
+					       bdev_io->u.bdev.num_blocks, &dif_ctx);
+			if (0 != rc) {
+				/* offset_blocks/num_blocks are uint64_t, so PRIu64 is the matching conversion. */
+				SPDK_ERRLOG("IO DIF generation failed: lba %" PRIu64 ", num_block %" PRIu64 "\n",
+					    bdev_io->u.bdev.offset_blocks,
+					    bdev_io->u.bdev.num_blocks);
+				spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_FAILED);
+				return;
+			}
+		}
+		TAILQ_INSERT_TAIL(&ch->io, bdev_io, module_link);
+		break;
+	case SPDK_BDEV_IO_TYPE_WRITE:
+		if (SPDK_DIF_DISABLE != bdev->dif_type) {
+			rc = spdk_dif_verify(bdev_io->u.bdev.iovs, bdev_io->u.bdev.iovcnt,
+					     bdev_io->u.bdev.num_blocks, &dif_ctx, &err_blk);
+			if (0 != rc) {
+				SPDK_ERRLOG("IO DIF verification failed: lba %" PRIu64 ", num_blocks %" PRIu64 ", "
+					    "err_type %u, expected %u, actual %u, err_offset %u\n",
+					    bdev_io->u.bdev.offset_blocks,
+					    bdev_io->u.bdev.num_blocks,
+					    err_blk.err_type,
+					    err_blk.expected,
+					    err_blk.actual,
+					    err_blk.err_offset);
+				spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_FAILED);
+				return;
+			}
+		}
+		TAILQ_INSERT_TAIL(&ch->io, bdev_io, module_link);
+		break;
+	case SPDK_BDEV_IO_TYPE_WRITE_ZEROES:
+	case SPDK_BDEV_IO_TYPE_RESET:
+		TAILQ_INSERT_TAIL(&ch->io, bdev_io, module_link);
+		break;
+	case SPDK_BDEV_IO_TYPE_ABORT:
+		if (bdev_null_abort_io(ch, bdev_io->u.abort.bio_to_abort)) {
+			spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_SUCCESS);
+		} else {
+			spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_FAILED);
+		}
+		break;
+	case SPDK_BDEV_IO_TYPE_FLUSH:
+	case SPDK_BDEV_IO_TYPE_UNMAP:
+	default:
+		spdk_bdev_io_complete(bdev_io, SPDK_BDEV_IO_STATUS_FAILED);
+		break;
+	}
+}
+
+/*
+ * io_type_supported callback installed in null_fn_table.
+ *
+ * ctx      unused
+ * io_type  the I/O type being queried
+ *
+ * Returns true for READ, WRITE, WRITE_ZEROES, RESET and ABORT; false for
+ * everything else (including FLUSH and UNMAP).
+ */
+static bool
+bdev_null_io_type_supported(void *ctx, enum spdk_bdev_io_type io_type)
+{
+	return io_type == SPDK_BDEV_IO_TYPE_READ ||
+	       io_type == SPDK_BDEV_IO_TYPE_WRITE ||
+	       io_type == SPDK_BDEV_IO_TYPE_WRITE_ZEROES ||
+	       io_type == SPDK_BDEV_IO_TYPE_RESET ||
+	       io_type == SPDK_BDEV_IO_TYPE_ABORT;
+}
+
+/*
+ * get_io_channel callback installed in null_fn_table.
+ *
+ * ctx is unused: the channel is always requested for the one io_device that
+ * bdev_null_initialize() registered under the address of g_null_bdev_head.
+ */
+static struct spdk_io_channel *
+bdev_null_get_io_channel(void *ctx)
+{
+	void *io_device = &g_null_bdev_head;
+
+	return spdk_get_io_channel(io_device);
+}
+
+/*
+ * write_config_json callback installed in null_fn_table.
+ *
+ * Writes one JSON object of the form
+ *   { "method": "bdev_null_create", "params": { ... } }
+ * whose params carry the bdev's name, block count, block size, metadata
+ * size, DIF settings and UUID.
+ *
+ * bdev  the null bdev to describe
+ * w     JSON write context receiving the object
+ */
+static void
+bdev_null_write_config_json(struct spdk_bdev *bdev, struct spdk_json_write_ctx *w)
+{
+	char uuid_text[SPDK_UUID_STRING_LEN];
+
+	/* Format the UUID up front; it is emitted as the last parameter below. */
+	spdk_uuid_fmt_lower(uuid_text, sizeof(uuid_text), &bdev->uuid);
+
+	spdk_json_write_object_begin(w);
+	spdk_json_write_named_string(w, "method", "bdev_null_create");
+
+	spdk_json_write_named_object_begin(w, "params");
+	spdk_json_write_named_string(w, "name", bdev->name);
+	spdk_json_write_named_uint64(w, "num_blocks", bdev->blockcnt);
+	spdk_json_write_named_uint32(w, "block_size", bdev->blocklen);
+	spdk_json_write_named_uint32(w, "md_size", bdev->md_len);
+	spdk_json_write_named_uint32(w, "dif_type", bdev->dif_type);
+	spdk_json_write_named_bool(w, "dif_is_head_of_md", bdev->dif_is_head_of_md);
+	spdk_json_write_named_string(w, "uuid", uuid_text);
+	spdk_json_write_object_end(w);	/* params */
+
+	spdk_json_write_object_end(w);	/* outer object */
+}
+
+static const struct spdk_bdev_fn_table null_fn_table = { /* Callback table assigned to every null bdev in bdev_null_create(). */
+ .destruct = bdev_null_destruct,
+ .submit_request = bdev_null_submit_request,
+ .io_type_supported = bdev_null_io_type_supported,
+ .get_io_channel = bdev_null_get_io_channel,
+ .write_config_json = bdev_null_write_config_json,
+};
+
+/*
+ * Create and register a null bdev described by opts.
+ *
+ * bdev  out parameter; on success receives the newly registered bdev
+ * opts  creation options (name, geometry, metadata and DIF settings)
+ *
+ * Returns 0 on success, or a negative errno:
+ *   -EINVAL   opts or opts->name is missing, interleaved metadata is larger
+ *             than the block, the data block size is zero or not a multiple
+ *             of 512, or num_blocks is zero
+ *   -ENOTSUP  metadata in a separate buffer was requested
+ *   -ENOMEM   allocation failed
+ *   other     whatever spdk_bdev_register() returned
+ */
+int
+bdev_null_create(struct spdk_bdev **bdev, const struct spdk_null_bdev_opts *opts)
+{
+	struct null_bdev *null_disk;
+	uint32_t data_block_size;
+	int rc;
+
+	if (!opts) {
+		SPDK_ERRLOG("No options provided for Null bdev.\n");
+		return -EINVAL;
+	}
+
+	/* The name is duplicated with strdup() below, which must not see NULL. */
+	if (!opts->name) {
+		SPDK_ERRLOG("No name provided for Null bdev.\n");
+		return -EINVAL;
+	}
+
+	if (opts->md_interleave) {
+		if (opts->block_size < opts->md_size) {
+			SPDK_ERRLOG("Interleaved metadata size can not be greater than block size.\n");
+			return -EINVAL;
+		}
+		data_block_size = opts->block_size - opts->md_size;
+	} else {
+		if (opts->md_size != 0) {
+			SPDK_ERRLOG("Metadata in separate buffer is not supported\n");
+			return -ENOTSUP;
+		}
+		data_block_size = opts->block_size;
+	}
+
+	/* Zero would pass the modulo test below but leaves no room for data. */
+	if (data_block_size == 0) {
+		SPDK_ERRLOG("Data block size must be greater than 0.\n");
+		return -EINVAL;
+	}
+
+	if (data_block_size % 512 != 0) {
+		/* Report the value that was actually tested, not the raw block size. */
+		SPDK_ERRLOG("Data block size %u is not a multiple of 512.\n", data_block_size);
+		return -EINVAL;
+	}
+
+	if (opts->num_blocks == 0) {
+		SPDK_ERRLOG("Disk must be more than 0 blocks\n");
+		return -EINVAL;
+	}
+
+	null_disk = calloc(1, sizeof(*null_disk));
+	if (!null_disk) {
+		SPDK_ERRLOG("could not allocate null_bdev\n");
+		return -ENOMEM;
+	}
+
+	null_disk->bdev.name = strdup(opts->name);
+	if (!null_disk->bdev.name) {
+		free(null_disk);
+		return -ENOMEM;
+	}
+	null_disk->bdev.product_name = "Null disk";
+
+	null_disk->bdev.write_cache = 0;
+	null_disk->bdev.blocklen = opts->block_size;
+	null_disk->bdev.blockcnt = opts->num_blocks;
+	null_disk->bdev.md_len = opts->md_size;
+	null_disk->bdev.md_interleave = opts->md_interleave;
+	null_disk->bdev.dif_type = opts->dif_type;
+	null_disk->bdev.dif_is_head_of_md = opts->dif_is_head_of_md;
+	/* Current block device layer API does not propagate
+	 * any DIF related information from user. So, we can
+	 * not generate or verify Application Tag.
+	 */
+	switch (opts->dif_type) {
+	case SPDK_DIF_TYPE1:
+	case SPDK_DIF_TYPE2:
+		null_disk->bdev.dif_check_flags = SPDK_DIF_FLAGS_GUARD_CHECK |
+						  SPDK_DIF_FLAGS_REFTAG_CHECK;
+		break;
+	case SPDK_DIF_TYPE3:
+		null_disk->bdev.dif_check_flags = SPDK_DIF_FLAGS_GUARD_CHECK;
+		break;
+	case SPDK_DIF_DISABLE:
+	default:
+		/* dif_check_flags stays 0 from calloc(). */
+		break;
+	}
+	if (opts->uuid) {
+		null_disk->bdev.uuid = *opts->uuid;
+	} else {
+		spdk_uuid_generate(&null_disk->bdev.uuid);
+	}
+
+	null_disk->bdev.ctxt = null_disk;
+	null_disk->bdev.fn_table = &null_fn_table;
+	null_disk->bdev.module = &null_if;
+
+	rc = spdk_bdev_register(&null_disk->bdev);
+	if (rc) {
+		free(null_disk->bdev.name);
+		free(null_disk);
+		return rc;
+	}
+
+	*bdev = &(null_disk->bdev);
+
+	TAILQ_INSERT_TAIL(&g_null_bdev_head, null_disk, tailq);
+
+	return rc;
+}
+
+/*
+ * Unregister a null bdev.
+ *
+ * bdev    the bdev to delete
+ * cb_fn   completion callback
+ * cb_arg  argument passed to cb_fn
+ *
+ * If bdev is NULL or does not belong to this module, cb_fn is invoked
+ * immediately with -ENODEV. Otherwise the request is handed to
+ * spdk_bdev_unregister() together with cb_fn and cb_arg.
+ */
+void
+bdev_null_delete(struct spdk_bdev *bdev, spdk_delete_null_complete cb_fn, void *cb_arg)
+{
+	bool is_null_bdev = (bdev != NULL) && (bdev->module == &null_if);
+
+	if (is_null_bdev) {
+		spdk_bdev_unregister(bdev, cb_fn, cb_arg);
+	} else {
+		cb_fn(cb_arg, -ENODEV);
+	}
+}
+
+/*
+ * Channel poller: complete everything currently queued on the channel.
+ *
+ * arg is the struct null_io_channel the poller was registered with.
+ *
+ * The pending queue is first moved onto a local list, so any I/O that is
+ * added to ch->io while this batch is being completed is left for the next
+ * poll. Returns SPDK_POLLER_IDLE when nothing was queued, otherwise
+ * SPDK_POLLER_BUSY after completing every request with SUCCESS.
+ */
+static int
+null_io_poll(void *arg)
+{
+	struct null_io_channel *ch = arg;
+	TAILQ_HEAD(, spdk_bdev_io) pending;
+	struct spdk_bdev_io *cur;
+
+	TAILQ_INIT(&pending);
+	TAILQ_SWAP(&ch->io, &pending, spdk_bdev_io, module_link);
+
+	if (TAILQ_EMPTY(&pending)) {
+		return SPDK_POLLER_IDLE;
+	}
+
+	/* The list is known to be non-empty here, so pop-then-test is safe. */
+	do {
+		cur = TAILQ_FIRST(&pending);
+		TAILQ_REMOVE(&pending, cur, module_link);
+		spdk_bdev_io_complete(cur, SPDK_BDEV_IO_STATUS_SUCCESS);
+	} while (!TAILQ_EMPTY(&pending));
+
+	return SPDK_POLLER_BUSY;
+}
+
+/*
+ * I/O channel create callback registered in bdev_null_initialize().
+ *
+ * io_device  unused
+ * ctx_buf    storage for this channel's struct null_io_channel
+ *
+ * Initializes the pending queue and registers the poller that drains it.
+ * Returns 0 on success, or -ENOMEM when the poller could not be registered;
+ * without a poller, queued I/O on this channel would never be completed.
+ */
+static int
+null_bdev_create_cb(void *io_device, void *ctx_buf)
+{
+	struct null_io_channel *ch = ctx_buf;
+
+	TAILQ_INIT(&ch->io);
+	ch->poller = SPDK_POLLER_REGISTER(null_io_poll, ch, 0);
+	if (ch->poller == NULL) {
+		SPDK_ERRLOG("Could not register poller for null bdev I/O channel\n");
+		return -ENOMEM;
+	}
+
+	return 0;
+}
+
+/*
+ * I/O channel destroy callback registered in bdev_null_initialize().
+ *
+ * io_device  unused
+ * ctx_buf    this channel's struct null_io_channel
+ *
+ * Unregisters the poller that null_bdev_create_cb() set up.
+ */
+static void
+null_bdev_destroy_cb(void *io_device, void *ctx_buf)
+{
+	struct null_io_channel *null_ch = ctx_buf;
+
+	spdk_poller_unregister(&null_ch->poller);
+}
+
+/*
+ * io_device unregister callback used when bdev_null_initialize() fails.
+ *
+ * arg is unused. Releases the shared read buffer and clears the global so
+ * that no stale pointer is left behind for a later free or read.
+ */
+static void
+_bdev_null_cleanup_cb(void *arg)
+{
+	spdk_free(g_null_read_buf);
+	g_null_read_buf = NULL;
+}
+
+/*
+ * Module init hook (null_if.module_init).
+ *
+ * Allocates the shared zeroed read buffer, registers the module's io_device
+ * and then creates one null bdev per "Dev" entry of the legacy "[Null]"
+ * configuration section, if that section exists. Each entry has the form
+ *   Dev <name> <size in MB> [block size] [metadata size] [DIF type]
+ * Entries with a missing or invalid field are logged and skipped.
+ *
+ * Returns 0 on success, -ENOMEM when the read buffer cannot be allocated,
+ * or the error from bdev_null_create(); in the latter case the io_device is
+ * unregistered again and the read buffer is freed by the cleanup callback.
+ */
+static int
+bdev_null_initialize(void)
+{
+	struct spdk_conf_section *sp = spdk_conf_find_section(NULL, "Null");
+	uint64_t size_in_mb, num_blocks;
+	int block_size, i, rc = 0;
+	int md_size, dif_type;
+	struct spdk_bdev *bdev;
+	const char *name, *val;
+	char *end;
+	struct spdk_null_bdev_opts opts = {};
+
+	TAILQ_INIT(&g_null_bdev_head);
+
+	/*
+	 * This will be used if upper layer expects us to allocate the read buffer.
+	 * Instead of using a real rbuf from the bdev pool, just always point to
+	 * this same zeroed buffer.
+	 */
+	g_null_read_buf = spdk_zmalloc(SPDK_BDEV_LARGE_BUF_MAX_SIZE, 0, NULL,
+				       SPDK_ENV_SOCKET_ID_ANY, SPDK_MALLOC_DMA);
+	if (g_null_read_buf == NULL) {
+		/* Without this buffer, buffer-less reads would be handed a NULL iov_base. */
+		SPDK_ERRLOG("Could not allocate read buffer for null bdev module\n");
+		return -ENOMEM;
+	}
+
+	/*
+	 * We need to pick some unique address as our "io device" - so just use the
+	 * address of the global tailq.
+	 */
+	spdk_io_device_register(&g_null_bdev_head, null_bdev_create_cb, null_bdev_destroy_cb,
+				sizeof(struct null_io_channel),
+				"null_bdev");
+
+	if (sp == NULL) {
+		goto end;
+	}
+
+	for (i = 0; ; ++i) {
+		val = spdk_conf_section_get_nval(sp, "Dev", i);
+		if (val == NULL) {
+			break;
+		}
+
+		name = spdk_conf_section_get_nmval(sp, "Dev", i, 0);
+		if (name == NULL) {
+			SPDK_ERRLOG("Null entry %d: Name must be provided\n", i);
+			continue;
+		}
+
+		val = spdk_conf_section_get_nmval(sp, "Dev", i, 1);
+		if (val == NULL) {
+			SPDK_ERRLOG("Null entry %d: Size in MB must be provided\n", i);
+			continue;
+		}
+
+		/*
+		 * Reject empty/non-numeric input and trailing garbage, and make
+		 * sure the later conversion from MiB to bytes cannot wrap.
+		 */
+		errno = 0;
+		size_in_mb = strtoull(val, &end, 10);
+		if (errno || end == val || *end != '\0' ||
+		    size_in_mb > UINT64_MAX / (1024 * 1024)) {
+			SPDK_ERRLOG("Null entry %d: Invalid size in MB %s\n", i, val);
+			continue;
+		}
+
+		val = spdk_conf_section_get_nmval(sp, "Dev", i, 2);
+		if (val == NULL) {
+			block_size = 512;
+		} else {
+			block_size = (int)spdk_strtol(val, 10);
+			if (block_size <= 0) {
+				SPDK_ERRLOG("Null entry %d: Invalid block size %s\n", i, val);
+				continue;
+			}
+		}
+
+		val = spdk_conf_section_get_nmval(sp, "Dev", i, 3);
+		if (val == NULL) {
+			md_size = 0;
+		} else {
+			md_size = (int)spdk_strtol(val, 10);
+			if (md_size < 0) {
+				SPDK_ERRLOG("Null entry %d: Invalid metadata size %s\n", i, val);
+				continue;
+			}
+		}
+
+		val = spdk_conf_section_get_nmval(sp, "Dev", i, 4);
+		if (val == NULL) {
+			dif_type = SPDK_DIF_DISABLE;
+		} else {
+			dif_type = (int)spdk_strtol(val, 10);
+			if (dif_type < SPDK_DIF_DISABLE || dif_type > SPDK_DIF_TYPE3) {
+				SPDK_ERRLOG("Null entry %d: Invalid data protection type %s\n", i, val);
+				continue;
+			}
+		}
+		/* block_size is > 0 here, so the division is well defined. */
+		num_blocks = size_in_mb * (1024 * 1024) / block_size;
+
+		opts.name = name;
+		opts.num_blocks = num_blocks;
+		opts.block_size = block_size;
+		opts.md_size = md_size;
+		opts.md_interleave = true;
+		opts.dif_type = dif_type;
+		opts.dif_is_head_of_md = false;
+		rc = bdev_null_create(&bdev, &opts);
+		if (rc) {
+			SPDK_ERRLOG("Could not create null bdev\n");
+			goto end;
+		}
+	}
+end:
+	if (rc) {
+		/*
+		 * NOTE(review): bdevs created by earlier loop iterations are not
+		 * unregistered on this path - confirm that is intended.
+		 */
+		spdk_io_device_unregister(&g_null_bdev_head, _bdev_null_cleanup_cb);
+	}
+	return rc;
+}
+
+/*
+ * io_device unregister callback used by bdev_null_finish().
+ *
+ * arg is unused. Releases the shared read buffer, clears the global so no
+ * stale pointer remains, and then reports that this module's asynchronous
+ * finish is done.
+ */
+static void
+_bdev_null_finish_cb(void *arg)
+{
+	spdk_free(g_null_read_buf);
+	g_null_read_buf = NULL;
+	spdk_bdev_module_finish_done();
+}
+
+/*
+ * Module fini hook (null_if.module_fini).
+ *
+ * Starts unregistering the module's io_device; the remaining teardown is
+ * done in _bdev_null_finish_cb() once the unregister callback fires.
+ */
+static void
+bdev_null_finish(void)
+{
+	void *io_device = &g_null_bdev_head;
+
+	spdk_io_device_unregister(io_device, _bdev_null_finish_cb);
+}
+
+/*
+ * Legacy config writer (null_if.config_text).
+ *
+ * fp  stream receiving the text
+ *
+ * Emits a "[Null]" section header followed by one line per null bdev:
+ *   Dev <name> <size in MB> <block size> <metadata size> <DIF type>
+ * The size is blocklen * blockcnt, truncated to whole MiB.
+ */
+static void
+bdev_null_get_spdk_running_config(FILE *fp)
+{
+	struct null_bdev *null_disk;
+	uint64_t size_in_mb;
+
+	fprintf(fp, "\n[Null]\n");
+
+	TAILQ_FOREACH(null_disk, &g_null_bdev_head, tailq) {
+		size_in_mb = (uint64_t)null_disk->bdev.blocklen * null_disk->bdev.blockcnt;
+		size_in_mb /= (1024 * 1024);
+		/* blocklen and md_len are unsigned 32-bit; use matching conversions. */
+		fprintf(fp, " Dev %s %" PRIu64 " %" PRIu32 " %" PRIu32 " %d\n",
+			null_disk->bdev.name, size_in_mb, null_disk->bdev.blocklen,
+			null_disk->bdev.md_len, (int)null_disk->bdev.dif_type);
+	}
+}
+
+SPDK_LOG_REGISTER_COMPONENT("bdev_null", SPDK_LOG_BDEV_NULL) /* NOTE(review): presumably registers the "bdev_null" log flag for this module - confirm against spdk_internal/log.h. */