diff options
Diffstat (limited to 'storage/tokudb/PerconaFT/ft/tests/ft-serialize-test.cc')
-rw-r--r-- | storage/tokudb/PerconaFT/ft/tests/ft-serialize-test.cc | 1299 |
1 files changed, 1299 insertions, 0 deletions
diff --git a/storage/tokudb/PerconaFT/ft/tests/ft-serialize-test.cc b/storage/tokudb/PerconaFT/ft/tests/ft-serialize-test.cc new file mode 100644 index 00000000..4fca8efa --- /dev/null +++ b/storage/tokudb/PerconaFT/ft/tests/ft-serialize-test.cc @@ -0,0 +1,1299 @@ +/* -*- mode: C++; c-basic-offset: 4; indent-tabs-mode: nil -*- */ +// vim: ft=cpp:expandtab:ts=8:sw=4:softtabstop=4: +#ident "$Id$" +/*====== +This file is part of PerconaFT. + + +Copyright (c) 2006, 2015, Percona and/or its affiliates. All rights reserved. + + PerconaFT is free software: you can redistribute it and/or modify + it under the terms of the GNU General Public License, version 2, + as published by the Free Software Foundation. + + PerconaFT is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with PerconaFT. If not, see <http://www.gnu.org/licenses/>. + +---------------------------------------- + + PerconaFT is free software: you can redistribute it and/or modify + it under the terms of the GNU Affero General Public License, version 3, + as published by the Free Software Foundation. + + PerconaFT is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU Affero General Public License for more details. + + You should have received a copy of the GNU Affero General Public License + along with PerconaFT. If not, see <http://www.gnu.org/licenses/>. +======= */ + +#ident "Copyright (c) 2006, 2015, Percona and/or its affiliates. All rights reserved." + +#include "test.h" +#include "bndata.h" + +#ifndef MIN +#define MIN(x, y) (((x) < (y)) ? (x) : (y)) +#endif + +static size_t le_add_to_bn(bn_data *bn, + uint32_t idx, + const char *key, + int keysize, + const char *val, + int valsize) { + LEAFENTRY r = NULL; + uint32_t size_needed = LE_CLEAN_MEMSIZE(valsize); + void *maybe_free = nullptr; + bn->get_space_for_insert(idx, key, keysize, size_needed, &r, &maybe_free); + if (maybe_free) { + toku_free(maybe_free); + } + resource_assert(r); + r->type = LE_CLEAN; + r->u.clean.vallen = valsize; + memcpy(r->u.clean.val, val, valsize); + return size_needed + keysize + sizeof(uint32_t); +} + +class test_key_le_pair { + public: + uint32_t keylen; + char *keyp; + LEAFENTRY le; + + test_key_le_pair() : keylen(), keyp(), le() {} + void init(const char *_keyp, const char *_val) { + init(_keyp, strlen(_keyp) + 1, _val, strlen(_val) + 1); + } + void init(const char *_keyp, + uint32_t _keylen, + const char *_val, + uint32_t _vallen) { + keylen = _keylen; + + CAST_FROM_VOIDP(le, toku_malloc(LE_CLEAN_MEMSIZE(_vallen))); + le->type = LE_CLEAN; + le->u.clean.vallen = _vallen; + memcpy(le->u.clean.val, _val, _vallen); + + CAST_FROM_VOIDP(keyp, toku_xmemdup(_keyp, keylen)); + } + ~test_key_le_pair() { + toku_free(le); + toku_free(keyp); + } +}; + +enum ftnode_verify_type { read_all = 1, read_compressed, read_none }; + +static int string_key_cmp(DB *UU(e), const DBT *a, const DBT *b) { + char *CAST_FROM_VOIDP(s, a->data); + char *CAST_FROM_VOIDP(t, b->data); + return strcmp(s, t); +} + +static void setup_dn(enum ftnode_verify_type bft, + int fd, + FT ft_h, + FTNODE *dn, + FTNODE_DISK_DATA *ndd) { + int r; + if (bft == read_all) { + ftnode_fetch_extra bfe; + bfe.create_for_full_read(ft_h); + r = toku_deserialize_ftnode_from( + fd, make_blocknum(20), 0 /*pass zero for hash*/, dn, ndd, &bfe); + invariant(r == 0); + } else if (bft == read_compressed || bft == read_none) { + ftnode_fetch_extra bfe; + bfe.create_for_min_read(ft_h); + r = toku_deserialize_ftnode_from( + fd, make_blocknum(20), 0 /*pass zero for hash*/, dn, ndd, &bfe); + invariant(r == 0); + // invariant all bp's are compressed or on disk. + for (int i = 0; i < (*dn)->n_children; i++) { + invariant(BP_STATE(*dn, i) == PT_COMPRESSED || + BP_STATE(*dn, i) == PT_ON_DISK); + } + // if read_none, get rid of the compressed bp's + if (bft == read_none) { + if ((*dn)->height == 0) { + toku_ftnode_pe_callback(*dn, + make_pair_attr(0xffffffff), + ft_h, + def_pe_finalize_impl, + nullptr); + // invariant all bp's are on disk + for (int i = 0; i < (*dn)->n_children; i++) { + if ((*dn)->height == 0) { + invariant(BP_STATE(*dn, i) == PT_ON_DISK); + invariant(is_BNULL(*dn, i)); + } else { + invariant(BP_STATE(*dn, i) == PT_COMPRESSED); + } + } + } else { + // first decompress everything, and make sure + // that it is available + // then run partial eviction to get it compressed + PAIR_ATTR attr; + bfe.create_for_full_read(ft_h); + invariant(toku_ftnode_pf_req_callback(*dn, &bfe)); + r = toku_ftnode_pf_callback(*dn, *ndd, &bfe, fd, &attr); + invariant(r == 0); + // invariant all bp's are available + for (int i = 0; i < (*dn)->n_children; i++) { + invariant(BP_STATE(*dn, i) == PT_AVAIL); + } + toku_ftnode_pe_callback(*dn, + make_pair_attr(0xffffffff), + ft_h, + def_pe_finalize_impl, + nullptr); + for (int i = 0; i < (*dn)->n_children; i++) { + // invariant all bp's are still available, because we touched + // the clock + invariant(BP_STATE(*dn, i) == PT_AVAIL); + // now invariant all should be evicted + invariant(BP_SHOULD_EVICT(*dn, i)); + } + toku_ftnode_pe_callback(*dn, + make_pair_attr(0xffffffff), + ft_h, + def_pe_finalize_impl, + nullptr); + for (int i = 0; i < (*dn)->n_children; i++) { + invariant(BP_STATE(*dn, i) == PT_COMPRESSED); + } + } + } + // now decompress them + bfe.create_for_full_read(ft_h); + invariant(toku_ftnode_pf_req_callback(*dn, &bfe)); + PAIR_ATTR attr; + r = toku_ftnode_pf_callback(*dn, *ndd, &bfe, fd, &attr); + invariant(r == 0); + // invariant all bp's are available + for (int i = 0; i < (*dn)->n_children; i++) { + invariant(BP_STATE(*dn, i) == PT_AVAIL); + } + // continue on with test + } else { + // if we get here, this is a test bug, NOT a bug in development code + invariant(false); + } +} + +static void write_sn_to_disk(int fd, + FT_HANDLE ft, + FTNODE sn, + FTNODE_DISK_DATA *src_ndd, + bool do_clone) { + int r; + if (do_clone) { + void *cloned_node_v = NULL; + PAIR_ATTR attr; + long clone_size; + toku_ftnode_clone_callback( + sn, &cloned_node_v, &clone_size, &attr, false, ft->ft); + FTNODE CAST_FROM_VOIDP(cloned_node, cloned_node_v); + r = toku_serialize_ftnode_to( + fd, make_blocknum(20), cloned_node, src_ndd, false, ft->ft, false); + invariant(r == 0); + toku_ftnode_free(&cloned_node); + } else { + r = toku_serialize_ftnode_to( + fd, make_blocknum(20), sn, src_ndd, true, ft->ft, false); + invariant(r == 0); + } +} + +static void test_serialize_leaf_check_msn(enum ftnode_verify_type bft, + bool do_clone) { + // struct ft_handle source_ft; + struct ftnode sn, *dn; + + int fd = open(TOKU_TEST_FILENAME, + O_RDWR | O_CREAT | O_BINARY, + S_IRWXU | S_IRWXG | S_IRWXO); + invariant(fd >= 0); + + int r; + +#define PRESERIALIZE_MSN_ON_DISK ((MSN){MIN_MSN.msn + 42}) +#define POSTSERIALIZE_MSN_ON_DISK ((MSN){MIN_MSN.msn + 84}) + + sn.max_msn_applied_to_node_on_disk = PRESERIALIZE_MSN_ON_DISK; + sn.flags = 0x11223344; + sn.blocknum.b = 20; + sn.layout_version = FT_LAYOUT_VERSION; + sn.layout_version_original = FT_LAYOUT_VERSION; + sn.height = 0; + sn.n_children = 2; + sn.set_dirty(); + sn.oldest_referenced_xid_known = TXNID_NONE; + MALLOC_N(sn.n_children, sn.bp); + DBT pivotkey; + sn.pivotkeys.create_from_dbts(toku_fill_dbt(&pivotkey, "b", 2), 1); + BP_STATE(&sn, 0) = PT_AVAIL; + BP_STATE(&sn, 1) = PT_AVAIL; + set_BLB(&sn, 0, toku_create_empty_bn()); + set_BLB(&sn, 1, toku_create_empty_bn()); + le_add_to_bn(BLB_DATA(&sn, 0), 0, "a", 2, "aval", 5); + le_add_to_bn(BLB_DATA(&sn, 0), 1, "b", 2, "bval", 5); + le_add_to_bn(BLB_DATA(&sn, 1), 0, "x", 2, "xval", 5); + BLB_MAX_MSN_APPLIED(&sn, 0) = ((MSN){MIN_MSN.msn + 73}); + BLB_MAX_MSN_APPLIED(&sn, 1) = POSTSERIALIZE_MSN_ON_DISK; + + FT_HANDLE XMALLOC(ft); + FT XCALLOC(ft_h); + toku_ft_init(ft_h, + make_blocknum(0), + ZERO_LSN, + TXNID_NONE, + 4 * 1024 * 1024, + 128 * 1024, + TOKU_DEFAULT_COMPRESSION_METHOD, + 16); + ft->ft = ft_h; + ft_h->blocktable.create(); + { + int r_truncate = ftruncate(fd, 0); + CKERR(r_truncate); + } + + // Want to use block #20 + BLOCKNUM b = make_blocknum(0); + while (b.b < 20) { + ft_h->blocktable.allocate_blocknum(&b, ft_h); + } + invariant(b.b == 20); + + { + DISKOFF offset; + DISKOFF size; + ft_h->blocktable.realloc_on_disk(b, 100, &offset, ft_h, fd, false); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + + ft_h->blocktable.translate_blocknum_to_offset_size(b, &offset, &size); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + invariant(size == 100); + } + FTNODE_DISK_DATA src_ndd = NULL; + FTNODE_DISK_DATA dest_ndd = NULL; + + write_sn_to_disk(fd, ft, &sn, &src_ndd, do_clone); + + setup_dn(bft, fd, ft_h, &dn, &dest_ndd); + + invariant(dn->blocknum.b == 20); + + invariant(dn->layout_version == FT_LAYOUT_VERSION); + invariant(dn->layout_version_original == FT_LAYOUT_VERSION); + invariant(dn->layout_version_read_from_disk == FT_LAYOUT_VERSION); + invariant(dn->height == 0); + invariant(dn->n_children >= 1); + invariant(dn->max_msn_applied_to_node_on_disk.msn == + POSTSERIALIZE_MSN_ON_DISK.msn); + { + // Man, this is way too ugly. This entire test suite needs to be + // refactored. + // Create a dummy mempool and put the leaves there. Ugh. + test_key_le_pair elts[3]; + elts[0].init("a", "aval"); + elts[1].init("b", "bval"); + elts[2].init("x", "xval"); + const uint32_t npartitions = dn->n_children; + uint32_t last_i = 0; + for (uint32_t bn = 0; bn < npartitions; ++bn) { + invariant(BLB_MAX_MSN_APPLIED(dn, bn).msn == + POSTSERIALIZE_MSN_ON_DISK.msn); + invariant(dest_ndd[bn].start > 0); + invariant(dest_ndd[bn].size > 0); + if (bn > 0) { + invariant(dest_ndd[bn].start >= + dest_ndd[bn - 1].start + dest_ndd[bn - 1].size); + } + for (uint32_t i = 0; i < BLB_DATA(dn, bn)->num_klpairs(); i++) { + LEAFENTRY curr_le; + uint32_t curr_keylen; + void *curr_key; + BLB_DATA(dn, bn) + ->fetch_klpair(i, &curr_le, &curr_keylen, &curr_key); + invariant(leafentry_memsize(curr_le) == + leafentry_memsize(elts[last_i].le)); + invariant(memcmp(curr_le, + elts[last_i].le, + leafentry_memsize(curr_le)) == 0); + if (bn < npartitions - 1) { + invariant(strcmp((char *)dn->pivotkeys.get_pivot(bn).data, + elts[last_i].keyp) <= 0); + } + // TODO for later, get a key comparison here as well + last_i++; + } + } + invariant(last_i == 3); + } + + toku_ftnode_free(&dn); + toku_destroy_ftnode_internals(&sn); + + ft_h->blocktable.block_free( + BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE, 100); + ft_h->blocktable.destroy(); + toku_free(ft_h->h); + toku_free(ft_h); + toku_free(ft); + toku_free(src_ndd); + toku_free(dest_ndd); + + r = close(fd); + invariant(r != -1); +} + +static void test_serialize_leaf_with_large_pivots(enum ftnode_verify_type bft, + bool do_clone) { + int r; + struct ftnode sn, *dn; + const int keylens = 256 * 1024, vallens = 0; + const uint32_t nrows = 8; + // invariant(val_size > BN_MAX_SIZE); // BN_MAX_SIZE isn't visible + int fd = open(TOKU_TEST_FILENAME, + O_RDWR | O_CREAT | O_BINARY, + S_IRWXU | S_IRWXG | S_IRWXO); + invariant(fd >= 0); + + sn.max_msn_applied_to_node_on_disk.msn = 0; + sn.flags = 0x11223344; + sn.blocknum.b = 20; + sn.layout_version = FT_LAYOUT_VERSION; + sn.layout_version_original = FT_LAYOUT_VERSION; + sn.height = 0; + sn.n_children = nrows; + sn.set_dirty(); + sn.oldest_referenced_xid_known = TXNID_NONE; + + MALLOC_N(sn.n_children, sn.bp); + sn.pivotkeys.create_empty(); + for (int i = 0; i < sn.n_children; ++i) { + BP_STATE(&sn, i) = PT_AVAIL; + set_BLB(&sn, i, toku_create_empty_bn()); + } + for (uint32_t i = 0; i < nrows; ++i) { // one basement per row + char key[keylens], val[vallens]; + key[keylens - 1] = '\0'; + char c = 'a' + i; + memset(key, c, keylens - 1); + le_add_to_bn(BLB_DATA(&sn, i), + 0, + (char *)&key, + sizeof(key), + (char *)&val, + sizeof(val)); + if (i < nrows - 1) { + uint32_t keylen; + void *curr_key; + BLB_DATA(&sn, i)->fetch_key_and_len(0, &keylen, &curr_key); + DBT pivotkey; + sn.pivotkeys.insert_at(toku_fill_dbt(&pivotkey, curr_key, keylen), + i); + } + } + + FT_HANDLE XMALLOC(ft); + FT XCALLOC(ft_h); + toku_ft_init(ft_h, + make_blocknum(0), + ZERO_LSN, + TXNID_NONE, + 4 * 1024 * 1024, + 128 * 1024, + TOKU_DEFAULT_COMPRESSION_METHOD, + 16); + ft->ft = ft_h; + ft_h->blocktable.create(); + { + int r_truncate = ftruncate(fd, 0); + CKERR(r_truncate); + } + // Want to use block #20 + BLOCKNUM b = make_blocknum(0); + while (b.b < 20) { + ft_h->blocktable.allocate_blocknum(&b, ft_h); + } + invariant(b.b == 20); + + { + DISKOFF offset; + DISKOFF size; + ft_h->blocktable.realloc_on_disk(b, 100, &offset, ft_h, fd, false); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + + ft_h->blocktable.translate_blocknum_to_offset_size(b, &offset, &size); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + invariant(size == 100); + } + FTNODE_DISK_DATA src_ndd = NULL; + FTNODE_DISK_DATA dest_ndd = NULL; + + write_sn_to_disk(fd, ft, &sn, &src_ndd, do_clone); + + setup_dn(bft, fd, ft_h, &dn, &dest_ndd); + + invariant(dn->blocknum.b == 20); + + invariant(dn->layout_version == FT_LAYOUT_VERSION); + invariant(dn->layout_version_original == FT_LAYOUT_VERSION); + { + // Man, this is way too ugly. This entire test suite needs to be + // refactored. + // Create a dummy mempool and put the leaves there. Ugh. + test_key_le_pair *les = new test_key_le_pair[nrows]; + { + char key[keylens], val[vallens]; + key[keylens - 1] = '\0'; + for (uint32_t i = 0; i < nrows; ++i) { + char c = 'a' + i; + memset(key, c, keylens - 1); + les[i].init( + (char *)&key, sizeof(key), (char *)&val, sizeof(val)); + } + } + const uint32_t npartitions = dn->n_children; + uint32_t last_i = 0; + for (uint32_t bn = 0; bn < npartitions; ++bn) { + invariant(dest_ndd[bn].start > 0); + invariant(dest_ndd[bn].size > 0); + if (bn > 0) { + invariant(dest_ndd[bn].start >= + dest_ndd[bn - 1].start + dest_ndd[bn - 1].size); + } + invariant(BLB_DATA(dn, bn)->num_klpairs() > 0); + for (uint32_t i = 0; i < BLB_DATA(dn, bn)->num_klpairs(); i++) { + LEAFENTRY curr_le; + uint32_t curr_keylen; + void *curr_key; + BLB_DATA(dn, bn) + ->fetch_klpair(i, &curr_le, &curr_keylen, &curr_key); + invariant(leafentry_memsize(curr_le) == + leafentry_memsize(les[last_i].le)); + invariant(memcmp(curr_le, + les[last_i].le, + leafentry_memsize(curr_le)) == 0); + if (bn < npartitions - 1) { + invariant(strcmp((char *)dn->pivotkeys.get_pivot(bn).data, + les[last_i].keyp) <= 0); + } + // TODO for later, get a key comparison here as well + last_i++; + } + } + invariant(last_i == nrows); + delete[] les; + } + + toku_ftnode_free(&dn); + toku_destroy_ftnode_internals(&sn); + + ft_h->blocktable.block_free( + BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE, 100); + ft_h->blocktable.destroy(); + toku_free(ft_h->h); + toku_free(ft_h); + toku_free(ft); + toku_free(src_ndd); + toku_free(dest_ndd); + + r = close(fd); + invariant(r != -1); +} + +static void test_serialize_leaf_with_many_rows(enum ftnode_verify_type bft, + bool do_clone) { + int r; + struct ftnode sn, *dn; + const uint32_t nrows = 196 * 1024; + int fd = open(TOKU_TEST_FILENAME, + O_RDWR | O_CREAT | O_BINARY, + S_IRWXU | S_IRWXG | S_IRWXO); + invariant(fd >= 0); + + sn.max_msn_applied_to_node_on_disk.msn = 0; + sn.flags = 0x11223344; + sn.blocknum.b = 20; + sn.layout_version = FT_LAYOUT_VERSION; + sn.layout_version_original = FT_LAYOUT_VERSION; + sn.height = 0; + sn.n_children = 1; + sn.set_dirty(); + sn.oldest_referenced_xid_known = TXNID_NONE; + + XMALLOC_N(sn.n_children, sn.bp); + sn.pivotkeys.create_empty(); + for (int i = 0; i < sn.n_children; ++i) { + BP_STATE(&sn, i) = PT_AVAIL; + set_BLB(&sn, i, toku_create_empty_bn()); + } + size_t total_size = 0; + for (uint32_t i = 0; i < nrows; ++i) { + uint32_t key = i; + uint32_t val = i; + total_size += le_add_to_bn(BLB_DATA(&sn, 0), + i, + (char *)&key, + sizeof(key), + (char *)&val, + sizeof(val)); + } + + FT_HANDLE XMALLOC(ft); + FT XCALLOC(ft_h); + toku_ft_init(ft_h, + make_blocknum(0), + ZERO_LSN, + TXNID_NONE, + 4 * 1024 * 1024, + 128 * 1024, + TOKU_DEFAULT_COMPRESSION_METHOD, + 16); + ft->ft = ft_h; + + ft_h->blocktable.create(); + { + int r_truncate = ftruncate(fd, 0); + CKERR(r_truncate); + } + // Want to use block #20 + BLOCKNUM b = make_blocknum(0); + while (b.b < 20) { + ft_h->blocktable.allocate_blocknum(&b, ft_h); + } + invariant(b.b == 20); + + { + DISKOFF offset; + DISKOFF size; + ft_h->blocktable.realloc_on_disk(b, 100, &offset, ft_h, fd, false); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + + ft_h->blocktable.translate_blocknum_to_offset_size(b, &offset, &size); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + invariant(size == 100); + } + + FTNODE_DISK_DATA src_ndd = NULL; + FTNODE_DISK_DATA dest_ndd = NULL; + write_sn_to_disk(fd, ft, &sn, &src_ndd, do_clone); + + setup_dn(bft, fd, ft_h, &dn, &dest_ndd); + + invariant(dn->blocknum.b == 20); + + invariant(dn->layout_version == FT_LAYOUT_VERSION); + invariant(dn->layout_version_original == FT_LAYOUT_VERSION); + { + // Man, this is way too ugly. This entire test suite needs to be + // refactored. + // Create a dummy mempool and put the leaves there. Ugh. + test_key_le_pair *les = new test_key_le_pair[nrows]; + { + int key = 0, val = 0; + for (uint32_t i = 0; i < nrows; ++i, key++, val++) { + les[i].init( + (char *)&key, sizeof(key), (char *)&val, sizeof(val)); + } + } + const uint32_t npartitions = dn->n_children; + uint32_t last_i = 0; + for (uint32_t bn = 0; bn < npartitions; ++bn) { + invariant(dest_ndd[bn].start > 0); + invariant(dest_ndd[bn].size > 0); + if (bn > 0) { + invariant(dest_ndd[bn].start >= + dest_ndd[bn - 1].start + dest_ndd[bn - 1].size); + } + invariant(BLB_DATA(dn, bn)->num_klpairs() > 0); + for (uint32_t i = 0; i < BLB_DATA(dn, bn)->num_klpairs(); i++) { + LEAFENTRY curr_le; + uint32_t curr_keylen; + void *curr_key; + BLB_DATA(dn, bn) + ->fetch_klpair(i, &curr_le, &curr_keylen, &curr_key); + invariant(leafentry_memsize(curr_le) == + leafentry_memsize(les[last_i].le)); + invariant(memcmp(curr_le, + les[last_i].le, + leafentry_memsize(curr_le)) == 0); + if (bn < npartitions - 1) { + uint32_t *CAST_FROM_VOIDP(pivot, + dn->pivotkeys.get_pivot(bn).data); + void *tmp = les[last_i].keyp; + uint32_t *CAST_FROM_VOIDP(item, tmp); + invariant(*pivot >= *item); + } + // TODO for later, get a key comparison here as well + last_i++; + } + // don't check soft_copy_is_up_to_date or seqinsert + invariant(BLB_DATA(dn, bn)->get_disk_size() < + 128 * 1024); // BN_MAX_SIZE, apt to change + } + invariant(last_i == nrows); + delete[] les; + } + + toku_ftnode_free(&dn); + toku_destroy_ftnode_internals(&sn); + + ft_h->blocktable.block_free( + BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE, 100); + ft_h->blocktable.destroy(); + toku_free(ft_h->h); + toku_free(ft_h); + toku_free(ft); + toku_free(src_ndd); + toku_free(dest_ndd); + + r = close(fd); + invariant(r != -1); +} + +static void test_serialize_leaf_with_large_rows(enum ftnode_verify_type bft, + bool do_clone) { + int r; + struct ftnode sn, *dn; + const uint32_t nrows = 7; + const size_t key_size = 8; + const size_t val_size = 512 * 1024; + // invariant(val_size > BN_MAX_SIZE); // BN_MAX_SIZE isn't visible + int fd = open(TOKU_TEST_FILENAME, + O_RDWR | O_CREAT | O_BINARY, + S_IRWXU | S_IRWXG | S_IRWXO); + invariant(fd >= 0); + + sn.max_msn_applied_to_node_on_disk.msn = 0; + sn.flags = 0x11223344; + sn.blocknum.b = 20; + sn.layout_version = FT_LAYOUT_VERSION; + sn.layout_version_original = FT_LAYOUT_VERSION; + sn.height = 0; + sn.n_children = 1; + sn.set_dirty(); + sn.oldest_referenced_xid_known = TXNID_NONE; + + MALLOC_N(sn.n_children, sn.bp); + sn.pivotkeys.create_empty(); + for (int i = 0; i < sn.n_children; ++i) { + BP_STATE(&sn, i) = PT_AVAIL; + set_BLB(&sn, i, toku_create_empty_bn()); + } + for (uint32_t i = 0; i < nrows; ++i) { + char key[key_size], val[val_size]; + key[key_size - 1] = '\0'; + val[val_size - 1] = '\0'; + char c = 'a' + i; + memset(key, c, key_size - 1); + memset(val, c, val_size - 1); + le_add_to_bn(BLB_DATA(&sn, 0), i, key, 8, val, val_size); + } + + FT_HANDLE XMALLOC(ft); + FT XCALLOC(ft_h); + toku_ft_init(ft_h, + make_blocknum(0), + ZERO_LSN, + TXNID_NONE, + 4 * 1024 * 1024, + 128 * 1024, + TOKU_DEFAULT_COMPRESSION_METHOD, + 16); + ft->ft = ft_h; + + ft_h->blocktable.create(); + { + int r_truncate = ftruncate(fd, 0); + CKERR(r_truncate); + } + // Want to use block #20 + BLOCKNUM b = make_blocknum(0); + while (b.b < 20) { + ft_h->blocktable.allocate_blocknum(&b, ft_h); + } + invariant(b.b == 20); + + { + DISKOFF offset; + DISKOFF size; + ft_h->blocktable.realloc_on_disk(b, 100, &offset, ft_h, fd, false); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + + ft_h->blocktable.translate_blocknum_to_offset_size(b, &offset, &size); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + invariant(size == 100); + } + + FTNODE_DISK_DATA src_ndd = NULL; + FTNODE_DISK_DATA dest_ndd = NULL; + write_sn_to_disk(fd, ft, &sn, &src_ndd, do_clone); + + setup_dn(bft, fd, ft_h, &dn, &dest_ndd); + + invariant(dn->blocknum.b == 20); + + invariant(dn->layout_version == FT_LAYOUT_VERSION); + invariant(dn->layout_version_original == FT_LAYOUT_VERSION); + { + // Man, this is way too ugly. This entire test suite needs to be + // refactored. + // Create a dummy mempool and put the leaves there. Ugh. + test_key_le_pair *les = new test_key_le_pair[nrows]; + { + char key[key_size], val[val_size]; + key[key_size - 1] = '\0'; + val[val_size - 1] = '\0'; + for (uint32_t i = 0; i < nrows; ++i) { + char c = 'a' + i; + memset(key, c, key_size - 1); + memset(val, c, val_size - 1); + les[i].init(key, key_size, val, val_size); + } + } + const uint32_t npartitions = dn->n_children; + invariant(npartitions == nrows); + uint32_t last_i = 0; + for (uint32_t bn = 0; bn < npartitions; ++bn) { + invariant(dest_ndd[bn].start > 0); + invariant(dest_ndd[bn].size > 0); + if (bn > 0) { + invariant(dest_ndd[bn].start >= + dest_ndd[bn - 1].start + dest_ndd[bn - 1].size); + } + invariant(BLB_DATA(dn, bn)->num_klpairs() > 0); + for (uint32_t i = 0; i < BLB_DATA(dn, bn)->num_klpairs(); i++) { + LEAFENTRY curr_le; + uint32_t curr_keylen; + void *curr_key; + BLB_DATA(dn, bn) + ->fetch_klpair(i, &curr_le, &curr_keylen, &curr_key); + invariant(leafentry_memsize(curr_le) == + leafentry_memsize(les[last_i].le)); + invariant(memcmp(curr_le, + les[last_i].le, + leafentry_memsize(curr_le)) == 0); + if (bn < npartitions - 1) { + invariant(strcmp((char *)dn->pivotkeys.get_pivot(bn).data, + (char *)(les[last_i].keyp)) <= 0); + } + // TODO for later, get a key comparison here as well + last_i++; + } + // don't check soft_copy_is_up_to_date or seqinsert + } + invariant(last_i == 7); + delete[] les; + } + + toku_ftnode_free(&dn); + toku_destroy_ftnode_internals(&sn); + + ft_h->blocktable.block_free( + BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE, 100); + ft_h->blocktable.destroy(); + toku_free(ft_h->h); + toku_free(ft_h); + toku_free(ft); + toku_free(src_ndd); + toku_free(dest_ndd); + + r = close(fd); + invariant(r != -1); +} + +static void test_serialize_leaf_with_empty_basement_nodes( + enum ftnode_verify_type bft, + bool do_clone) { + struct ftnode sn, *dn; + + int fd = open(TOKU_TEST_FILENAME, + O_RDWR | O_CREAT | O_BINARY, + S_IRWXU | S_IRWXG | S_IRWXO); + invariant(fd >= 0); + + int r; + + sn.max_msn_applied_to_node_on_disk.msn = 0; + sn.flags = 0x11223344; + sn.blocknum.b = 20; + sn.layout_version = FT_LAYOUT_VERSION; + sn.layout_version_original = FT_LAYOUT_VERSION; + sn.height = 0; + sn.n_children = 7; + sn.set_dirty(); + sn.oldest_referenced_xid_known = TXNID_NONE; + MALLOC_N(sn.n_children, sn.bp); + DBT pivotkeys[6]; + toku_fill_dbt(&pivotkeys[0], "A", 2); + toku_fill_dbt(&pivotkeys[1], "a", 2); + toku_fill_dbt(&pivotkeys[2], "a", 2); + toku_fill_dbt(&pivotkeys[3], "b", 2); + toku_fill_dbt(&pivotkeys[4], "b", 2); + toku_fill_dbt(&pivotkeys[5], "x", 2); + sn.pivotkeys.create_from_dbts(pivotkeys, 6); + for (int i = 0; i < sn.n_children; ++i) { + BP_STATE(&sn, i) = PT_AVAIL; + set_BLB(&sn, i, toku_create_empty_bn()); + BLB_SEQINSERT(&sn, i) = 0; + } + le_add_to_bn(BLB_DATA(&sn, 1), 0, "a", 2, "aval", 5); + le_add_to_bn(BLB_DATA(&sn, 3), 0, "b", 2, "bval", 5); + le_add_to_bn(BLB_DATA(&sn, 5), 0, "x", 2, "xval", 5); + + FT_HANDLE XMALLOC(ft); + FT XCALLOC(ft_h); + toku_ft_init(ft_h, + make_blocknum(0), + ZERO_LSN, + TXNID_NONE, + 4 * 1024 * 1024, + 128 * 1024, + TOKU_DEFAULT_COMPRESSION_METHOD, + 16); + ft->ft = ft_h; + + ft_h->blocktable.create(); + { + int r_truncate = ftruncate(fd, 0); + CKERR(r_truncate); + } + // Want to use block #20 + BLOCKNUM b = make_blocknum(0); + while (b.b < 20) { + ft_h->blocktable.allocate_blocknum(&b, ft_h); + } + invariant(b.b == 20); + + { + DISKOFF offset; + DISKOFF size; + ft_h->blocktable.realloc_on_disk(b, 100, &offset, ft_h, fd, false); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + + ft_h->blocktable.translate_blocknum_to_offset_size(b, &offset, &size); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + invariant(size == 100); + } + FTNODE_DISK_DATA src_ndd = NULL; + FTNODE_DISK_DATA dest_ndd = NULL; + write_sn_to_disk(fd, ft, &sn, &src_ndd, do_clone); + + setup_dn(bft, fd, ft_h, &dn, &dest_ndd); + + invariant(dn->blocknum.b == 20); + + invariant(dn->layout_version == FT_LAYOUT_VERSION); + invariant(dn->layout_version_original == FT_LAYOUT_VERSION); + invariant(dn->layout_version_read_from_disk == FT_LAYOUT_VERSION); + invariant(dn->height == 0); + invariant(dn->n_children > 0); + { + test_key_le_pair elts[3]; + + // Man, this is way too ugly. This entire test suite needs to be + // refactored. + // Create a dummy mempool and put the leaves there. Ugh. + elts[0].init("a", "aval"); + elts[1].init("b", "bval"); + elts[2].init("x", "xval"); + const uint32_t npartitions = dn->n_children; + uint32_t last_i = 0; + for (uint32_t bn = 0; bn < npartitions; ++bn) { + invariant(dest_ndd[bn].start > 0); + invariant(dest_ndd[bn].size > 0); + if (bn > 0) { + invariant(dest_ndd[bn].start >= + dest_ndd[bn - 1].start + dest_ndd[bn - 1].size); + } + for (uint32_t i = 0; i < BLB_DATA(dn, bn)->num_klpairs(); i++) { + LEAFENTRY curr_le; + uint32_t curr_keylen; + void *curr_key; + BLB_DATA(dn, bn) + ->fetch_klpair(i, &curr_le, &curr_keylen, &curr_key); + invariant(leafentry_memsize(curr_le) == + leafentry_memsize(elts[last_i].le)); + invariant(memcmp(curr_le, + elts[last_i].le, + leafentry_memsize(curr_le)) == 0); + if (bn < npartitions - 1) { + invariant(strcmp((char *)dn->pivotkeys.get_pivot(bn).data, + (char *)(elts[last_i].keyp)) <= 0); + } + // TODO for later, get a key comparison here as well + last_i++; + } + } + invariant(last_i == 3); + } + + toku_ftnode_free(&dn); + toku_destroy_ftnode_internals(&sn); + + ft_h->blocktable.block_free( + BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE, 100); + ft_h->blocktable.destroy(); + toku_free(ft_h->h); + toku_free(ft_h); + toku_free(ft); + toku_free(src_ndd); + toku_free(dest_ndd); + + r = close(fd); + invariant(r != -1); +} + +static void test_serialize_leaf_with_multiple_empty_basement_nodes( + enum ftnode_verify_type bft, + bool do_clone) { + struct ftnode sn, *dn; + + int fd = open(TOKU_TEST_FILENAME, + O_RDWR | O_CREAT | O_BINARY, + S_IRWXU | S_IRWXG | S_IRWXO); + invariant(fd >= 0); + + int r; + + sn.max_msn_applied_to_node_on_disk.msn = 0; + sn.flags = 0x11223344; + sn.blocknum.b = 20; + sn.layout_version = FT_LAYOUT_VERSION; + sn.layout_version_original = FT_LAYOUT_VERSION; + sn.height = 0; + sn.n_children = 4; + sn.set_dirty(); + sn.oldest_referenced_xid_known = TXNID_NONE; + MALLOC_N(sn.n_children, sn.bp); + DBT pivotkeys[3]; + toku_fill_dbt(&pivotkeys[0], "A", 2); + toku_fill_dbt(&pivotkeys[1], "A", 2); + toku_fill_dbt(&pivotkeys[2], "A", 2); + sn.pivotkeys.create_from_dbts(pivotkeys, 3); + for (int i = 0; i < sn.n_children; ++i) { + BP_STATE(&sn, i) = PT_AVAIL; + set_BLB(&sn, i, toku_create_empty_bn()); + } + + FT_HANDLE XMALLOC(ft); + FT XCALLOC(ft_h); + toku_ft_init(ft_h, + make_blocknum(0), + ZERO_LSN, + TXNID_NONE, + 4 * 1024 * 1024, + 128 * 1024, + TOKU_DEFAULT_COMPRESSION_METHOD, + 16); + ft->ft = ft_h; + + ft_h->blocktable.create(); + { + int r_truncate = ftruncate(fd, 0); + CKERR(r_truncate); + } + // Want to use block #20 + BLOCKNUM b = make_blocknum(0); + while (b.b < 20) { + ft_h->blocktable.allocate_blocknum(&b, ft_h); + } + invariant(b.b == 20); + + { + DISKOFF offset; + DISKOFF size; + ft_h->blocktable.realloc_on_disk(b, 100, &offset, ft_h, fd, false); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + + ft_h->blocktable.translate_blocknum_to_offset_size(b, &offset, &size); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + invariant(size == 100); + } + + FTNODE_DISK_DATA src_ndd = NULL; + FTNODE_DISK_DATA dest_ndd = NULL; + write_sn_to_disk(fd, ft, &sn, &src_ndd, do_clone); + + setup_dn(bft, fd, ft_h, &dn, &dest_ndd); + + invariant(dn->blocknum.b == 20); + + invariant(dn->layout_version == FT_LAYOUT_VERSION); + invariant(dn->layout_version_original == FT_LAYOUT_VERSION); + invariant(dn->layout_version_read_from_disk == FT_LAYOUT_VERSION); + invariant(dn->height == 0); + invariant(dn->n_children == 1); + { + const uint32_t npartitions = dn->n_children; + for (uint32_t i = 0; i < npartitions; ++i) { + invariant(dest_ndd[i].start > 0); + invariant(dest_ndd[i].size > 0); + if (i > 0) { + invariant(dest_ndd[i].start >= + dest_ndd[i - 1].start + dest_ndd[i - 1].size); + } + invariant(BLB_DATA(dn, i)->num_klpairs() == 0); + } + } + + toku_ftnode_free(&dn); + toku_destroy_ftnode_internals(&sn); + + ft_h->blocktable.block_free( + BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE, 100); + ft_h->blocktable.destroy(); + toku_free(ft_h->h); + toku_free(ft_h); + toku_free(ft); + toku_free(src_ndd); + toku_free(dest_ndd); + + r = close(fd); + invariant(r != -1); +} + +static void test_serialize_nonleaf(enum ftnode_verify_type bft, bool do_clone) { + // struct ft_handle source_ft; + struct ftnode sn, *dn; + + int fd = open(TOKU_TEST_FILENAME, + O_RDWR | O_CREAT | O_BINARY, + S_IRWXU | S_IRWXG | S_IRWXO); + invariant(fd >= 0); + + int r; + + // source_ft.fd=fd; + sn.max_msn_applied_to_node_on_disk.msn = 0; + sn.flags = 0x11223344; + sn.blocknum.b = 20; + sn.layout_version = FT_LAYOUT_VERSION; + sn.layout_version_original = FT_LAYOUT_VERSION; + sn.height = 1; + sn.n_children = 2; + sn.set_dirty(); + sn.oldest_referenced_xid_known = TXNID_NONE; + MALLOC_N(2, sn.bp); + DBT pivotkey; + sn.pivotkeys.create_from_dbts(toku_fill_dbt(&pivotkey, "hello", 6), 1); + BP_BLOCKNUM(&sn, 0).b = 30; + BP_BLOCKNUM(&sn, 1).b = 35; + BP_STATE(&sn, 0) = PT_AVAIL; + BP_STATE(&sn, 1) = PT_AVAIL; + set_BNC(&sn, 0, toku_create_empty_nl()); + set_BNC(&sn, 1, toku_create_empty_nl()); + // Create XIDS + XIDS xids_0 = toku_xids_get_root_xids(); + XIDS xids_123; + XIDS xids_234; + r = toku_xids_create_child(xids_0, &xids_123, (TXNID)123); + CKERR(r); + r = toku_xids_create_child(xids_123, &xids_234, (TXNID)234); + CKERR(r); + + toku::comparator cmp; + cmp.create(string_key_cmp, nullptr); + + toku_bnc_insert_msg(BNC(&sn, 0), + "a", + 2, + "aval", + 5, + FT_NONE, + next_dummymsn(), + xids_0, + true, + cmp); + toku_bnc_insert_msg(BNC(&sn, 0), + "b", + 2, + "bval", + 5, + FT_NONE, + next_dummymsn(), + xids_123, + false, + cmp); + toku_bnc_insert_msg(BNC(&sn, 1), + "x", + 2, + "xval", + 5, + FT_NONE, + next_dummymsn(), + xids_234, + true, + cmp); + + // Cleanup: + toku_xids_destroy(&xids_0); + toku_xids_destroy(&xids_123); + toku_xids_destroy(&xids_234); + cmp.destroy(); + + FT_HANDLE XMALLOC(ft); + FT XCALLOC(ft_h); + toku_ft_init(ft_h, + make_blocknum(0), + ZERO_LSN, + TXNID_NONE, + 4 * 1024 * 1024, + 128 * 1024, + TOKU_DEFAULT_COMPRESSION_METHOD, + 16); + ft_h->cmp.create(string_key_cmp, nullptr); + ft->ft = ft_h; + + ft_h->blocktable.create(); + { + int r_truncate = ftruncate(fd, 0); + CKERR(r_truncate); + } + // Want to use block #20 + BLOCKNUM b = make_blocknum(0); + while (b.b < 20) { + ft_h->blocktable.allocate_blocknum(&b, ft_h); + } + invariant(b.b == 20); + + { + DISKOFF offset; + DISKOFF size; + ft_h->blocktable.realloc_on_disk(b, 100, &offset, ft_h, fd, false); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + + ft_h->blocktable.translate_blocknum_to_offset_size(b, &offset, &size); + invariant(offset == + (DISKOFF)BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE); + invariant(size == 100); + } + FTNODE_DISK_DATA src_ndd = NULL; + FTNODE_DISK_DATA dest_ndd = NULL; + write_sn_to_disk(fd, ft, &sn, &src_ndd, do_clone); + + setup_dn(bft, fd, ft_h, &dn, &dest_ndd); + + invariant(dn->blocknum.b == 20); + + invariant(dn->layout_version == FT_LAYOUT_VERSION); + invariant(dn->layout_version_original == FT_LAYOUT_VERSION); + invariant(dn->layout_version_read_from_disk == FT_LAYOUT_VERSION); + invariant(dn->height == 1); + invariant(dn->n_children == 2); + invariant(strcmp((char *)dn->pivotkeys.get_pivot(0).data, "hello") == 0); + invariant(dn->pivotkeys.get_pivot(0).size == 6); + invariant(BP_BLOCKNUM(dn, 0).b == 30); + invariant(BP_BLOCKNUM(dn, 1).b == 35); + + message_buffer *src_msg_buffer1 = &BNC(&sn, 0)->msg_buffer; + message_buffer *src_msg_buffer2 = &BNC(&sn, 1)->msg_buffer; + message_buffer *dest_msg_buffer1 = &BNC(dn, 0)->msg_buffer; + message_buffer *dest_msg_buffer2 = &BNC(dn, 1)->msg_buffer; + + invariant(src_msg_buffer1->equals(dest_msg_buffer1)); + invariant(src_msg_buffer2->equals(dest_msg_buffer2)); + + toku_ftnode_free(&dn); + toku_destroy_ftnode_internals(&sn); + + ft_h->blocktable.block_free( + BlockAllocator::BLOCK_ALLOCATOR_TOTAL_HEADER_RESERVE, 100); + ft_h->blocktable.destroy(); + ft_h->cmp.destroy(); + toku_free(ft_h->h); + toku_free(ft_h); + toku_free(ft); + toku_free(src_ndd); + toku_free(dest_ndd); + + r = close(fd); + invariant(r != -1); +} + +int test_main(int argc __attribute__((__unused__)), + const char *argv[] __attribute__((__unused__))) { + initialize_dummymsn(); + + test_serialize_nonleaf(read_none, false); + test_serialize_nonleaf(read_all, false); + test_serialize_nonleaf(read_compressed, false); + test_serialize_nonleaf(read_none, true); + test_serialize_nonleaf(read_all, true); + test_serialize_nonleaf(read_compressed, true); + + test_serialize_leaf_check_msn(read_none, false); + test_serialize_leaf_check_msn(read_all, false); + test_serialize_leaf_check_msn(read_compressed, false); + test_serialize_leaf_check_msn(read_none, true); + test_serialize_leaf_check_msn(read_all, true); + test_serialize_leaf_check_msn(read_compressed, true); + + test_serialize_leaf_with_multiple_empty_basement_nodes(read_none, false); + test_serialize_leaf_with_multiple_empty_basement_nodes(read_all, false); + test_serialize_leaf_with_multiple_empty_basement_nodes(read_compressed, + false); + test_serialize_leaf_with_multiple_empty_basement_nodes(read_none, true); + test_serialize_leaf_with_multiple_empty_basement_nodes(read_all, true); + test_serialize_leaf_with_multiple_empty_basement_nodes(read_compressed, + true); + + test_serialize_leaf_with_empty_basement_nodes(read_none, false); + test_serialize_leaf_with_empty_basement_nodes(read_all, false); + test_serialize_leaf_with_empty_basement_nodes(read_compressed, false); + test_serialize_leaf_with_empty_basement_nodes(read_none, true); + test_serialize_leaf_with_empty_basement_nodes(read_all, true); + test_serialize_leaf_with_empty_basement_nodes(read_compressed, true); + + test_serialize_leaf_with_large_rows(read_none, false); + test_serialize_leaf_with_large_rows(read_all, false); + test_serialize_leaf_with_large_rows(read_compressed, false); + test_serialize_leaf_with_large_rows(read_none, true); + test_serialize_leaf_with_large_rows(read_all, true); + test_serialize_leaf_with_large_rows(read_compressed, true); + + test_serialize_leaf_with_large_pivots(read_none, false); + test_serialize_leaf_with_large_pivots(read_all, false); + test_serialize_leaf_with_large_pivots(read_compressed, false); + test_serialize_leaf_with_large_pivots(read_none, true); + test_serialize_leaf_with_large_pivots(read_all, true); + test_serialize_leaf_with_large_pivots(read_compressed, true); + + test_serialize_leaf_with_many_rows(read_none, false); + test_serialize_leaf_with_many_rows(read_all, false); + test_serialize_leaf_with_many_rows(read_compressed, false); + test_serialize_leaf_with_many_rows(read_none, true); + test_serialize_leaf_with_many_rows(read_all, true); + test_serialize_leaf_with_many_rows(read_compressed, true); + + return 0; +} |