635 lines
15 KiB
C
635 lines
15 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Copyright (C) 2017 Oracle. All rights reserved.
|
|
*/
|
|
|
|
#include <linux/types.h>
|
|
#include "btrfs-tests.h"
|
|
#include "../ctree.h"
|
|
#include "../volumes.h"
|
|
#include "../disk-io.h"
|
|
#include "../block-group.h"
|
|
|
|
static void free_extent_map_tree(struct extent_map_tree *em_tree)
|
|
{
|
|
struct extent_map *em;
|
|
struct rb_node *node;
|
|
|
|
while (!RB_EMPTY_ROOT(&em_tree->map.rb_root)) {
|
|
node = rb_first_cached(&em_tree->map);
|
|
em = rb_entry(node, struct extent_map, rb_node);
|
|
remove_extent_mapping(em_tree, em);
|
|
|
|
#ifdef CONFIG_BTRFS_DEBUG
|
|
if (refcount_read(&em->refs) != 1) {
|
|
test_err(
|
|
"em leak: em (start 0x%llx len 0x%llx block_start 0x%llx block_len 0x%llx) refs %d",
|
|
em->start, em->len, em->block_start,
|
|
em->block_len, refcount_read(&em->refs));
|
|
|
|
refcount_set(&em->refs, 1);
|
|
}
|
|
#endif
|
|
free_extent_map(em);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Test scenario:
|
|
*
|
|
* Suppose that no extent map has been loaded into memory yet, there is a file
|
|
* extent [0, 16K), followed by another file extent [16K, 20K), two dio reads
|
|
* are entering btrfs_get_extent() concurrently, t1 is reading [8K, 16K), t2 is
|
|
* reading [0, 8K)
|
|
*
|
|
* t1 t2
|
|
* btrfs_get_extent() btrfs_get_extent()
|
|
* -> lookup_extent_mapping() ->lookup_extent_mapping()
|
|
* -> add_extent_mapping(0, 16K)
|
|
* -> return em
|
|
* ->add_extent_mapping(0, 16K)
|
|
* -> #handle -EEXIST
|
|
*/
|
|
static int test_case_1(struct btrfs_fs_info *fs_info,
|
|
struct extent_map_tree *em_tree)
|
|
{
|
|
struct extent_map *em;
|
|
u64 start = 0;
|
|
u64 len = SZ_8K;
|
|
int ret;
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
/* Add [0, 16K) */
|
|
em->start = 0;
|
|
em->len = SZ_16K;
|
|
em->block_start = 0;
|
|
em->block_len = SZ_16K;
|
|
write_lock(&em_tree->lock);
|
|
ret = add_extent_mapping(em_tree, em, 0);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret < 0) {
|
|
test_err("cannot add extent range [0, 16K)");
|
|
goto out;
|
|
}
|
|
free_extent_map(em);
|
|
|
|
/* Add [16K, 20K) following [0, 16K) */
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
em->start = SZ_16K;
|
|
em->len = SZ_4K;
|
|
em->block_start = SZ_32K; /* avoid merging */
|
|
em->block_len = SZ_4K;
|
|
write_lock(&em_tree->lock);
|
|
ret = add_extent_mapping(em_tree, em, 0);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret < 0) {
|
|
test_err("cannot add extent range [16K, 20K)");
|
|
goto out;
|
|
}
|
|
free_extent_map(em);
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
/* Add [0, 8K), should return [0, 16K) instead. */
|
|
em->start = start;
|
|
em->len = len;
|
|
em->block_start = start;
|
|
em->block_len = len;
|
|
write_lock(&em_tree->lock);
|
|
ret = btrfs_add_extent_mapping(fs_info, em_tree, &em, em->start, em->len);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret) {
|
|
test_err("case1 [%llu %llu]: ret %d", start, start + len, ret);
|
|
goto out;
|
|
}
|
|
if (em &&
|
|
(em->start != 0 || extent_map_end(em) != SZ_16K ||
|
|
em->block_start != 0 || em->block_len != SZ_16K)) {
|
|
test_err(
|
|
"case1 [%llu %llu]: ret %d return a wrong em (start %llu len %llu block_start %llu block_len %llu",
|
|
start, start + len, ret, em->start, em->len,
|
|
em->block_start, em->block_len);
|
|
ret = -EINVAL;
|
|
}
|
|
free_extent_map(em);
|
|
out:
|
|
free_extent_map_tree(em_tree);
|
|
|
|
return ret;
|
|
}
|
|
|
|
/*
|
|
* Test scenario:
|
|
*
|
|
* Reading the inline ending up with EEXIST, ie. read an inline
|
|
* extent and discard page cache and read it again.
|
|
*/
|
|
static int test_case_2(struct btrfs_fs_info *fs_info,
|
|
struct extent_map_tree *em_tree)
|
|
{
|
|
struct extent_map *em;
|
|
int ret;
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
/* Add [0, 1K) */
|
|
em->start = 0;
|
|
em->len = SZ_1K;
|
|
em->block_start = EXTENT_MAP_INLINE;
|
|
em->block_len = (u64)-1;
|
|
write_lock(&em_tree->lock);
|
|
ret = add_extent_mapping(em_tree, em, 0);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret < 0) {
|
|
test_err("cannot add extent range [0, 1K)");
|
|
goto out;
|
|
}
|
|
free_extent_map(em);
|
|
|
|
/* Add [4K, 8K) following [0, 1K) */
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
em->start = SZ_4K;
|
|
em->len = SZ_4K;
|
|
em->block_start = SZ_4K;
|
|
em->block_len = SZ_4K;
|
|
write_lock(&em_tree->lock);
|
|
ret = add_extent_mapping(em_tree, em, 0);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret < 0) {
|
|
test_err("cannot add extent range [4K, 8K)");
|
|
goto out;
|
|
}
|
|
free_extent_map(em);
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
/* Add [0, 1K) */
|
|
em->start = 0;
|
|
em->len = SZ_1K;
|
|
em->block_start = EXTENT_MAP_INLINE;
|
|
em->block_len = (u64)-1;
|
|
write_lock(&em_tree->lock);
|
|
ret = btrfs_add_extent_mapping(fs_info, em_tree, &em, em->start, em->len);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret) {
|
|
test_err("case2 [0 1K]: ret %d", ret);
|
|
goto out;
|
|
}
|
|
if (em &&
|
|
(em->start != 0 || extent_map_end(em) != SZ_1K ||
|
|
em->block_start != EXTENT_MAP_INLINE || em->block_len != (u64)-1)) {
|
|
test_err(
|
|
"case2 [0 1K]: ret %d return a wrong em (start %llu len %llu block_start %llu block_len %llu",
|
|
ret, em->start, em->len, em->block_start,
|
|
em->block_len);
|
|
ret = -EINVAL;
|
|
}
|
|
free_extent_map(em);
|
|
out:
|
|
free_extent_map_tree(em_tree);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int __test_case_3(struct btrfs_fs_info *fs_info,
|
|
struct extent_map_tree *em_tree, u64 start)
|
|
{
|
|
struct extent_map *em;
|
|
u64 len = SZ_4K;
|
|
int ret;
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
/* Add [4K, 8K) */
|
|
em->start = SZ_4K;
|
|
em->len = SZ_4K;
|
|
em->block_start = SZ_4K;
|
|
em->block_len = SZ_4K;
|
|
write_lock(&em_tree->lock);
|
|
ret = add_extent_mapping(em_tree, em, 0);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret < 0) {
|
|
test_err("cannot add extent range [4K, 8K)");
|
|
goto out;
|
|
}
|
|
free_extent_map(em);
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
/* Add [0, 16K) */
|
|
em->start = 0;
|
|
em->len = SZ_16K;
|
|
em->block_start = 0;
|
|
em->block_len = SZ_16K;
|
|
write_lock(&em_tree->lock);
|
|
ret = btrfs_add_extent_mapping(fs_info, em_tree, &em, start, len);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret) {
|
|
test_err("case3 [0x%llx 0x%llx): ret %d",
|
|
start, start + len, ret);
|
|
goto out;
|
|
}
|
|
/*
|
|
* Since bytes within em are contiguous, em->block_start is identical to
|
|
* em->start.
|
|
*/
|
|
if (em &&
|
|
(start < em->start || start + len > extent_map_end(em) ||
|
|
em->start != em->block_start || em->len != em->block_len)) {
|
|
test_err(
|
|
"case3 [0x%llx 0x%llx): ret %d em (start 0x%llx len 0x%llx block_start 0x%llx block_len 0x%llx)",
|
|
start, start + len, ret, em->start, em->len,
|
|
em->block_start, em->block_len);
|
|
ret = -EINVAL;
|
|
}
|
|
free_extent_map(em);
|
|
out:
|
|
free_extent_map_tree(em_tree);
|
|
|
|
return ret;
|
|
}
|
|
|
|
/*
|
|
* Test scenario:
|
|
*
|
|
* Suppose that no extent map has been loaded into memory yet.
|
|
* There is a file extent [0, 16K), two jobs are running concurrently
|
|
* against it, t1 is buffered writing to [4K, 8K) and t2 is doing dio
|
|
* read from [0, 4K) or [8K, 12K) or [12K, 16K).
|
|
*
|
|
* t1 goes ahead of t2 and adds em [4K, 8K) into tree.
|
|
*
|
|
* t1 t2
|
|
* cow_file_range() btrfs_get_extent()
|
|
* -> lookup_extent_mapping()
|
|
* -> add_extent_mapping()
|
|
* -> add_extent_mapping()
|
|
*/
|
|
static int test_case_3(struct btrfs_fs_info *fs_info,
|
|
struct extent_map_tree *em_tree)
|
|
{
|
|
int ret;
|
|
|
|
ret = __test_case_3(fs_info, em_tree, 0);
|
|
if (ret)
|
|
return ret;
|
|
ret = __test_case_3(fs_info, em_tree, SZ_8K);
|
|
if (ret)
|
|
return ret;
|
|
ret = __test_case_3(fs_info, em_tree, (12 * SZ_1K));
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int __test_case_4(struct btrfs_fs_info *fs_info,
|
|
struct extent_map_tree *em_tree, u64 start)
|
|
{
|
|
struct extent_map *em;
|
|
u64 len = SZ_4K;
|
|
int ret;
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
/* Add [0K, 8K) */
|
|
em->start = 0;
|
|
em->len = SZ_8K;
|
|
em->block_start = 0;
|
|
em->block_len = SZ_8K;
|
|
write_lock(&em_tree->lock);
|
|
ret = add_extent_mapping(em_tree, em, 0);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret < 0) {
|
|
test_err("cannot add extent range [0, 8K)");
|
|
goto out;
|
|
}
|
|
free_extent_map(em);
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
/* Add [8K, 32K) */
|
|
em->start = SZ_8K;
|
|
em->len = 24 * SZ_1K;
|
|
em->block_start = SZ_16K; /* avoid merging */
|
|
em->block_len = 24 * SZ_1K;
|
|
write_lock(&em_tree->lock);
|
|
ret = add_extent_mapping(em_tree, em, 0);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret < 0) {
|
|
test_err("cannot add extent range [8K, 32K)");
|
|
goto out;
|
|
}
|
|
free_extent_map(em);
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
/* Add [0K, 32K) */
|
|
em->start = 0;
|
|
em->len = SZ_32K;
|
|
em->block_start = 0;
|
|
em->block_len = SZ_32K;
|
|
write_lock(&em_tree->lock);
|
|
ret = btrfs_add_extent_mapping(fs_info, em_tree, &em, start, len);
|
|
write_unlock(&em_tree->lock);
|
|
if (ret) {
|
|
test_err("case4 [0x%llx 0x%llx): ret %d",
|
|
start, len, ret);
|
|
goto out;
|
|
}
|
|
if (em && (start < em->start || start + len > extent_map_end(em))) {
|
|
test_err(
|
|
"case4 [0x%llx 0x%llx): ret %d, added wrong em (start 0x%llx len 0x%llx block_start 0x%llx block_len 0x%llx)",
|
|
start, len, ret, em->start, em->len, em->block_start,
|
|
em->block_len);
|
|
ret = -EINVAL;
|
|
}
|
|
free_extent_map(em);
|
|
out:
|
|
free_extent_map_tree(em_tree);
|
|
|
|
return ret;
|
|
}
|
|
|
|
/*
|
|
* Test scenario:
|
|
*
|
|
* Suppose that no extent map has been loaded into memory yet.
|
|
* There is a file extent [0, 32K), two jobs are running concurrently
|
|
* against it, t1 is doing dio write to [8K, 32K) and t2 is doing dio
|
|
* read from [0, 4K) or [4K, 8K).
|
|
*
|
|
* t1 goes ahead of t2 and splits em [0, 32K) to em [0K, 8K) and [8K 32K).
|
|
*
|
|
* t1 t2
|
|
* btrfs_get_blocks_direct() btrfs_get_blocks_direct()
|
|
* -> btrfs_get_extent() -> btrfs_get_extent()
|
|
* -> lookup_extent_mapping()
|
|
* -> add_extent_mapping() -> lookup_extent_mapping()
|
|
* # load [0, 32K)
|
|
* -> btrfs_new_extent_direct()
|
|
* -> btrfs_drop_extent_cache()
|
|
* # split [0, 32K)
|
|
* -> add_extent_mapping()
|
|
* # add [8K, 32K)
|
|
* -> add_extent_mapping()
|
|
* # handle -EEXIST when adding
|
|
* # [0, 32K)
|
|
*/
|
|
static int test_case_4(struct btrfs_fs_info *fs_info,
|
|
struct extent_map_tree *em_tree)
|
|
{
|
|
int ret;
|
|
|
|
ret = __test_case_4(fs_info, em_tree, 0);
|
|
if (ret)
|
|
return ret;
|
|
ret = __test_case_4(fs_info, em_tree, SZ_4K);
|
|
|
|
return ret;
|
|
}
|
|
|
|
struct rmap_test_vector {
|
|
u64 raid_type;
|
|
u64 physical_start;
|
|
u64 data_stripe_size;
|
|
u64 num_data_stripes;
|
|
u64 num_stripes;
|
|
/* Assume we won't have more than 5 physical stripes */
|
|
u64 data_stripe_phys_start[5];
|
|
bool expected_mapped_addr;
|
|
/* Physical to logical addresses */
|
|
u64 mapped_logical[5];
|
|
};
|
|
|
|
static int test_rmap_block(struct btrfs_fs_info *fs_info,
|
|
struct rmap_test_vector *test)
|
|
{
|
|
struct extent_map *em;
|
|
struct map_lookup *map = NULL;
|
|
u64 *logical = NULL;
|
|
int i, out_ndaddrs, out_stripe_len;
|
|
int ret;
|
|
|
|
em = alloc_extent_map();
|
|
if (!em) {
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
map = kmalloc(map_lookup_size(test->num_stripes), GFP_KERNEL);
|
|
if (!map) {
|
|
kfree(em);
|
|
test_std_err(TEST_ALLOC_EXTENT_MAP);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
set_bit(EXTENT_FLAG_FS_MAPPING, &em->flags);
|
|
/* Start at 4GiB logical address */
|
|
em->start = SZ_4G;
|
|
em->len = test->data_stripe_size * test->num_data_stripes;
|
|
em->block_len = em->len;
|
|
em->orig_block_len = test->data_stripe_size;
|
|
em->map_lookup = map;
|
|
|
|
map->num_stripes = test->num_stripes;
|
|
map->stripe_len = BTRFS_STRIPE_LEN;
|
|
map->type = test->raid_type;
|
|
|
|
for (i = 0; i < map->num_stripes; i++) {
|
|
struct btrfs_device *dev = btrfs_alloc_dummy_device(fs_info);
|
|
|
|
if (IS_ERR(dev)) {
|
|
test_err("cannot allocate device");
|
|
ret = PTR_ERR(dev);
|
|
goto out;
|
|
}
|
|
map->stripes[i].dev = dev;
|
|
map->stripes[i].physical = test->data_stripe_phys_start[i];
|
|
}
|
|
|
|
write_lock(&fs_info->mapping_tree.lock);
|
|
ret = add_extent_mapping(&fs_info->mapping_tree, em, 0);
|
|
write_unlock(&fs_info->mapping_tree.lock);
|
|
if (ret) {
|
|
test_err("error adding block group mapping to mapping tree");
|
|
goto out_free;
|
|
}
|
|
|
|
ret = btrfs_rmap_block(fs_info, em->start, NULL, btrfs_sb_offset(1),
|
|
&logical, &out_ndaddrs, &out_stripe_len);
|
|
if (ret || (out_ndaddrs == 0 && test->expected_mapped_addr)) {
|
|
test_err("didn't rmap anything but expected %d",
|
|
test->expected_mapped_addr);
|
|
goto out;
|
|
}
|
|
|
|
if (out_stripe_len != BTRFS_STRIPE_LEN) {
|
|
test_err("calculated stripe length doesn't match");
|
|
goto out;
|
|
}
|
|
|
|
if (out_ndaddrs != test->expected_mapped_addr) {
|
|
for (i = 0; i < out_ndaddrs; i++)
|
|
test_msg("mapped %llu", logical[i]);
|
|
test_err("unexpected number of mapped addresses: %d", out_ndaddrs);
|
|
goto out;
|
|
}
|
|
|
|
for (i = 0; i < out_ndaddrs; i++) {
|
|
if (logical[i] != test->mapped_logical[i]) {
|
|
test_err("unexpected logical address mapped");
|
|
goto out;
|
|
}
|
|
}
|
|
|
|
ret = 0;
|
|
out:
|
|
write_lock(&fs_info->mapping_tree.lock);
|
|
remove_extent_mapping(&fs_info->mapping_tree, em);
|
|
write_unlock(&fs_info->mapping_tree.lock);
|
|
/* For us */
|
|
free_extent_map(em);
|
|
out_free:
|
|
/* For the tree */
|
|
free_extent_map(em);
|
|
kfree(logical);
|
|
return ret;
|
|
}
|
|
|
|
int btrfs_test_extent_map(void)
|
|
{
|
|
struct btrfs_fs_info *fs_info = NULL;
|
|
struct extent_map_tree *em_tree;
|
|
int ret = 0, i;
|
|
struct rmap_test_vector rmap_tests[] = {
|
|
{
|
|
/*
|
|
* Test a chunk with 2 data stripes one of which
|
|
* interesects the physical address of the super block
|
|
* is correctly recognised.
|
|
*/
|
|
.raid_type = BTRFS_BLOCK_GROUP_RAID1,
|
|
.physical_start = SZ_64M - SZ_4M,
|
|
.data_stripe_size = SZ_256M,
|
|
.num_data_stripes = 2,
|
|
.num_stripes = 2,
|
|
.data_stripe_phys_start =
|
|
{SZ_64M - SZ_4M, SZ_64M - SZ_4M + SZ_256M},
|
|
.expected_mapped_addr = true,
|
|
.mapped_logical= {SZ_4G + SZ_4M}
|
|
},
|
|
{
|
|
/*
|
|
* Test that out-of-range physical addresses are
|
|
* ignored
|
|
*/
|
|
|
|
/* SINGLE chunk type */
|
|
.raid_type = 0,
|
|
.physical_start = SZ_4G,
|
|
.data_stripe_size = SZ_256M,
|
|
.num_data_stripes = 1,
|
|
.num_stripes = 1,
|
|
.data_stripe_phys_start = {SZ_256M},
|
|
.expected_mapped_addr = false,
|
|
.mapped_logical = {0}
|
|
}
|
|
};
|
|
|
|
test_msg("running extent_map tests");
|
|
|
|
/*
|
|
* Note: the fs_info is not set up completely, we only need
|
|
* fs_info::fsid for the tracepoint.
|
|
*/
|
|
fs_info = btrfs_alloc_dummy_fs_info(PAGE_SIZE, PAGE_SIZE);
|
|
if (!fs_info) {
|
|
test_std_err(TEST_ALLOC_FS_INFO);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
em_tree = kzalloc(sizeof(*em_tree), GFP_KERNEL);
|
|
if (!em_tree) {
|
|
ret = -ENOMEM;
|
|
goto out;
|
|
}
|
|
|
|
extent_map_tree_init(em_tree);
|
|
|
|
ret = test_case_1(fs_info, em_tree);
|
|
if (ret)
|
|
goto out;
|
|
ret = test_case_2(fs_info, em_tree);
|
|
if (ret)
|
|
goto out;
|
|
ret = test_case_3(fs_info, em_tree);
|
|
if (ret)
|
|
goto out;
|
|
ret = test_case_4(fs_info, em_tree);
|
|
|
|
test_msg("running rmap tests");
|
|
for (i = 0; i < ARRAY_SIZE(rmap_tests); i++) {
|
|
ret = test_rmap_block(fs_info, &rmap_tests[i]);
|
|
if (ret)
|
|
goto out;
|
|
}
|
|
|
|
out:
|
|
kfree(em_tree);
|
|
btrfs_free_dummy_fs_info(fs_info);
|
|
|
|
return ret;
|
|
}
|