diff options
-rw-r--r-- | tests/basic/afr/resolve.t | 49 | ||||
-rw-r--r-- | tests/include.rc | 2 | ||||
-rw-r--r-- | xlators/cluster/afr/src/afr-common.c | 28 | ||||
-rw-r--r-- | xlators/cluster/afr/src/afr.h | 1 | ||||
-rw-r--r-- | xlators/protocol/client/src/client-rpc-fops.c | 2 |
5 files changed, 71 insertions, 11 deletions
diff --git a/tests/basic/afr/resolve.t b/tests/basic/afr/resolve.t new file mode 100644 index 00000000000..7dd432996f6 --- /dev/null +++ b/tests/basic/afr/resolve.t @@ -0,0 +1,49 @@ +#!/bin/bash + +. $(dirname $0)/../../include.rc +. $(dirname $0)/../../volume.rc + +#Check that operations succeed after changing the disk of the brick while +#a brick is down +cleanup; + +TEST glusterd +TEST pidof glusterd +TEST $CLI volume create $V0 replica 2 $H0:$B0/${V0}{0,1} +TEST $CLI volume set $V0 cluster.self-heal-daemon off +TEST $CLI volume start $V0 +TEST glusterfs --volfile-id=/$V0 --volfile-server=$H0 $M0 +TEST glusterfs --volfile-id=/$V0 --volfile-server=$H0 $M1 +TEST cd $M0 +TEST mkdir -p a/b/c/d/e +TEST cd a/b/c/d/e +echo abc > g + +#Simulate disk replacement +TEST kill_brick $V0 $H0 $B0/${V0}0 +rm -rf $B0/${V0}0/.glusterfs $B0/${V0}0/a + +TEST $CLI volume start $V0 force +EXPECT_WITHIN $CHILD_UP_TIMEOUT "1" afr_child_up_status $V0 0 +#Test that the lookup returns ENOENT instead of ESTALE +#If lookup returns ESTALE this command will fail with ESTALE +TEST touch f + +#Test that ESTALE is ignored when there is a good copy +EXPECT abc cat g + +#Simulate file changing only one mount +#create the file on first mount +echo ghi > $M0/b + +#re-create the file on other mount while one of the bricks is down. +TEST kill_brick $V0 $H0 $B0/${V0}0 +TEST rm -f $M1/b +echo jkl > $M1/b +#Clear the extended attributes on the directory to create a scenario where +#gfid-mismatch happened. This should result in EIO +TEST setfattr -x trusted.afr.$V0-client-0 $B0/${V0}1 +TEST $CLI volume start $V0 force +EXPECT_WITHIN $CHILD_UP_TIMEOUT "1" afr_child_up_status $V0 0 +TEST ! cat $M0/b +cleanup diff --git a/tests/include.rc b/tests/include.rc index 40dd8ac96b9..3017de9e653 100644 --- a/tests/include.rc +++ b/tests/include.rc @@ -7,7 +7,7 @@ B0=${B0:=/d/backends}; # top level of brick directories H0=${H0:=`hostname --fqdn`}; # hostname DEBUG=${DEBUG:=0} # turn on debugging? statedumpdir=`gluster --print-statedumpdir`; # Default directory for statedump - +CHILD_UP_TIMEOUT=60 CLI="gluster --mode=script"; mkdir -p $B0; diff --git a/xlators/cluster/afr/src/afr-common.c b/xlators/cluster/afr/src/afr-common.c index c4e57625220..2f9913152d4 100644 --- a/xlators/cluster/afr/src/afr-common.c +++ b/xlators/cluster/afr/src/afr-common.c @@ -2321,18 +2321,18 @@ afr_lookup_done (call_frame_t *frame, xlator_t *this) * others in that they must be given higher priority while * returning to the user. * - * The hierarchy is ESTALE > EIO > ENOENT > others + * The hierarchy is EIO > ENOENT > ESTALE > others */ int32_t afr_most_important_error(int32_t old_errno, int32_t new_errno, gf_boolean_t eio) { - if (old_errno == ESTALE || new_errno == ESTALE) - return ESTALE; if (eio && (old_errno == EIO || new_errno == EIO)) return EIO; if (old_errno == ENOENT || new_errno == ENOENT) return ENOENT; + if (old_errno == ESTALE || new_errno == ESTALE) + return ESTALE; return new_errno; } @@ -2361,8 +2361,19 @@ afr_resultant_errno_get (int32_t *children, } static void -afr_lookup_handle_error (afr_local_t *local, int32_t op_ret, int32_t op_errno) +afr_lookup_handle_error (afr_local_t *local, int32_t op_ret, int32_t op_errno, + dict_t *xattr) { + if (local->cont.lookup.needs_fresh_lookup) + return; + + if (xattr && dict_get (xattr, "gfid-changed")) { + local->op_ret = -1; + local->op_errno = ESTALE; + local->cont.lookup.needs_fresh_lookup = _gf_true; + return; + } + if ((local->loc.name == NULL) && (op_errno == ESTALE)) op_errno = ENOENT; @@ -2371,10 +2382,6 @@ afr_lookup_handle_error (afr_local_t *local, int32_t op_ret, int32_t op_errno) local->op_errno = afr_most_important_error(local->op_errno, op_errno, _gf_false); - - if (local->op_errno == ESTALE) { - local->op_ret = -1; - } } static void @@ -2491,7 +2498,7 @@ afr_lookup_handle_success (afr_local_t *local, xlator_t *this, int32_t child_ind afr_private_t *priv = this->private; if (local->success_count == 0) { - if (local->op_errno != ESTALE) { + if (!local->cont.lookup.needs_fresh_lookup) { local->op_ret = op_ret; local->op_errno = 0; } @@ -2528,7 +2535,8 @@ afr_lookup_cbk (call_frame_t *frame, void *cookie, local = frame->local; if (op_ret == -1) { - afr_lookup_handle_error (local, op_ret, op_errno); + afr_lookup_handle_error (local, op_ret, op_errno, + xattr); goto unlock; } afr_lookup_handle_success (local, this, child_index, op_ret, diff --git a/xlators/cluster/afr/src/afr.h b/xlators/cluster/afr/src/afr.h index 9abb48694a2..af57d8b0eff 100644 --- a/xlators/cluster/afr/src/afr.h +++ b/xlators/cluster/afr/src/afr.h @@ -550,6 +550,7 @@ typedef struct _afr_local { int32_t **pending_matrix; gf_boolean_t fresh_lookup; gf_boolean_t possible_spb; + gf_boolean_t needs_fresh_lookup; } lookup; struct { diff --git a/xlators/protocol/client/src/client-rpc-fops.c b/xlators/protocol/client/src/client-rpc-fops.c index 38bc7b6238f..3bd1206e4d0 100644 --- a/xlators/protocol/client/src/client-rpc-fops.c +++ b/xlators/protocol/client/src/client-rpc-fops.c @@ -2755,6 +2755,8 @@ client3_3_lookup_cbk (struct rpc_req *req, struct iovec *iov, int count, "gfid changed for %s", local->loc.path); rsp.op_ret = -1; op_errno = ESTALE; + if (xdata) + ret = dict_set_int32 (xdata, "gfid-changed", 1); goto out; } |