Skip to content

Commit

Permalink
DAOS-14352 object: recover migrate with correct epoch (#13547)
Browse files Browse the repository at this point in the history
During migration, it should choose the minimum epoch from
rebuild stable epoch and EC aggregation boundary to make
sure correct data is being fetched during recovery.

Add tests to verify the process.

Signed-off-by: Di Wang <[email protected]>
  • Loading branch information
wangdi committed Feb 7, 2024
1 parent edcca6b commit e91143c
Show file tree
Hide file tree
Showing 2 changed files with 46 additions and 15 deletions.
12 changes: 6 additions & 6 deletions src/object/srv_obj_migrate.c
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
/**
* (C) Copyright 2019-2023 Intel Corporation.
* (C) Copyright 2019-2024 Intel Corporation.
*
* SPDX-License-Identifier: BSD-2-Clause-Patent
*/
Expand Down Expand Up @@ -1040,10 +1040,10 @@ migrate_fetch_update_parity(struct migrate_one *mrone, daos_handle_t oh,
/* If the epoch is higher than EC aggregate boundary, then
* it should use stable epoch to fetch the data, since
* the data could be aggregated independently on parity
* and data shard, so using stable epoch could make sure
* the consistency view during rebuild. And also EC aggregation
* should already aggregate the parity, so there should not
* be any partial update on the parity as well.
* and data shard, so it should select the minimum epoch
* between stable epoch and boundary epoch as the recovery
* epoch to make sure parity data rebuilt will not be interfered
* by the newer update.
*
* Otherwise there might be partial update on this rebuilding
* shard, so let's use the epoch from the parity shard to fetch
Expand All @@ -1054,7 +1054,7 @@ migrate_fetch_update_parity(struct migrate_one *mrone, daos_handle_t oh,
*/
if (ds_cont->sc_ec_agg_eph_boundary >
mrone->mo_iods_update_ephs_from_parity[i][j])
fetch_eph = mrone->mo_epoch;
fetch_eph = min(ds_cont->sc_ec_agg_eph_boundary, mrone->mo_epoch);
else
fetch_eph = mrone->mo_iods_update_ephs_from_parity[i][j];

Expand Down
49 changes: 40 additions & 9 deletions src/tests/suite/daos_rebuild_ec.c
Original file line number Diff line number Diff line change
Expand Up @@ -1254,23 +1254,28 @@ rebuild_ec_multiple_failure_tgts(void **state)
}

static void
rebuild_ec_parity_overwrite_fail_parity(void **state)
rebuild_ec_parity_overwrite_fail_parity_internal(void **state, int *kill_shards, int nr,
bool aggregation)
{
test_arg_t *arg = *state;
daos_obj_id_t oid;
struct ioreq req;
char *data;
char *verify_data;
daos_recx_t recx;
d_rank_t data_ranks[2];
d_rank_t data_ranks[4];
d_rank_t parity_rank;
uint64_t dkey_hash;
int shard_idx;
int stripe_size = 4 * CELL_SIZE;
int i;

if (!test_runable(arg, 8))
return;

if (svc_nreplicas < 5)
return;

oid = daos_test_oid_gen(arg->coh, OC_EC_4P2G1, 0, 0, arg->myrank);
ioreq_init(&req, arg->coh, oid, DAOS_IOD_ARRAY, arg);
data = (char *)malloc(stripe_size);
Expand All @@ -1282,6 +1287,9 @@ rebuild_ec_parity_overwrite_fail_parity(void **state)
insert_recxs("d_key", "a_key", 1, DAOS_TX_NONE, &recx, 1,
data, stripe_size, &req);

if (aggregation)
trigger_and_wait_ec_aggreation(arg, &oid, 1, "d_key", "a_key", 0,
0, DAOS_FORCE_EC_AGG);
make_buffer(data, 'b', 1000);
memcpy(verify_data, data, stripe_size);
recx.rx_idx = 0;
Expand All @@ -1297,20 +1305,20 @@ rebuild_ec_parity_overwrite_fail_parity(void **state)
rebuild_single_pool_rank(arg, parity_rank, true);

/* fail data shard */
shard_idx = (dkey_hash % 6 + 0) % 6;
data_ranks[0] = get_rank_by_oid_shard(arg, oid, shard_idx);
shard_idx = (dkey_hash % 6 + 1) % 6;
data_ranks[1] = get_rank_by_oid_shard(arg, oid, shard_idx);
for (i = 0; i < nr; i++) {
shard_idx = (dkey_hash % 6 + kill_shards[i]) % 6;
data_ranks[i] = get_rank_by_oid_shard(arg, oid, shard_idx);
}

rebuild_pools_ranks(&arg, 1, data_ranks, 2, true);
rebuild_pools_ranks(&arg, 1, data_ranks, nr, true);
recx.rx_idx = 0; /* full stripe */
recx.rx_nr = stripe_size;
lookup_recxs("d_key", "a_key", 1, DAOS_TX_NONE, &recx, 1,
data, stripe_size, &req);

assert_memory_equal(data, verify_data, stripe_size);

reintegrate_pools_ranks(&arg, 1, data_ranks, 2, true);
reintegrate_pools_ranks(&arg, 1, data_ranks, nr, true);
reintegrate_pools_ranks(&arg, 1, &parity_rank, 1, true);

lookup_recxs("d_key", "a_key", 1, DAOS_TX_NONE, &recx, 1,
Expand All @@ -1324,6 +1332,26 @@ rebuild_ec_parity_overwrite_fail_parity(void **state)
free(verify_data);
}

static void
rebuild_ec_overwrite_fail_parity_data(void **state)
{
int kill_shards[2];

kill_shards[0] = 0;
kill_shards[1] = 1;
rebuild_ec_parity_overwrite_fail_parity_internal(state, kill_shards, 2, false);
}

static void
rebuild_ec_overwrite_fail_parity_data_with_parity(void **state)
{
int kill_shards[2];

kill_shards[0] = 1;
kill_shards[1] = 2;
rebuild_ec_parity_overwrite_fail_parity_internal(state, kill_shards, 2, true);
}

/** create a new pool/container for each test */
static const struct CMUnitTest rebuild_tests[] = {
{"REBUILD0: rebuild partial update with data tgt fail",
Expand Down Expand Up @@ -1457,7 +1485,10 @@ static const struct CMUnitTest rebuild_tests[] = {
rebuild_ec_multiple_failure_tgts, rebuild_ec_8nodes_setup,
test_teardown},
{"REBUILD46: fail parity shard and data shards after overwrite",
rebuild_ec_parity_overwrite_fail_parity, rebuild_ec_8nodes_setup,
rebuild_ec_overwrite_fail_parity_data, rebuild_ec_8nodes_setup,
test_teardown},
{"REBUILD46: fail parity shard and data shards after overwrite with aggregation",
rebuild_ec_overwrite_fail_parity_data_with_parity, rebuild_ec_8nodes_setup,
test_teardown},
};

Expand Down

0 comments on commit e91143c

Please sign in to comment.