diff options
| author | Dan Lambright <dlambrig@redhat.com> | 2015-11-01 10:22:00 -0500 | 
|---|---|---|
| committer | Dan Lambright <dlambrig@redhat.com> | 2015-11-07 13:44:38 -0800 | 
| commit | 5b989f034d522ffe8c311481b7ef2064358cb06f (patch) | |
| tree | 9fd1feba9c3a71b361c66240ff13c79f17f4de88 | |
| parent | f3b555e029e6531d914fb67e098929ffe03d161b (diff) | |
cluster/tier correct promotion cycle calculation
This is a backport of 12480
The tier translator should only choose candidate files for promotion
from the most recent cycle, not a multiple of the most recent cycles.
Otherwise user observed behavior can be inconsistent. Remove related
test in tier.t that is subject to race condition.
> Change-Id: I9ad1523cac00f904097ce468efa6ddd515857024
> BUG: 1275524
> Signed-off-by: root <root@rhs-cli-15.gdev.lab.eng.bos.redhat.com>
> Signed-off-by: Dan Lambright <dlambrig@redhat.com>
> Reviewed-on: http://review.gluster.org/12480
> Reviewed-by: Joseph Fernandes
> Tested-by: Gluster Build System <jenkins@build.gluster.com>
Signed-off-by: Dan Lambright <dlambrig@redhat.com>
Signed-off-by: Dan Lambright <dlambrig@redhat.com>
Conflicts:
	tests/basic/tier/tier.t
	xlators/cluster/dht/src/tier.c
Change-Id: Ic4587bf1b5d26ba377a12a4ce8e329362988a33b
BUG: 1275483
Reviewed-on: http://review.gluster.org/12536
Tested-by: NetBSD Build System <jenkins@build.gluster.org>
Reviewed-by: Dan Lambright <dlambrig@redhat.com>
Tested-by: Dan Lambright <dlambrig@redhat.com>
| -rw-r--r-- | tests/basic/tier/legacy-many.t | 19 | ||||
| -rwxr-xr-x | tests/basic/tier/tier.t | 38 | ||||
| -rw-r--r-- | tests/tier.rc | 13 | ||||
| -rw-r--r-- | xlators/cluster/dht/src/tier.c | 12 | 
4 files changed, 53 insertions, 29 deletions
diff --git a/tests/basic/tier/legacy-many.t b/tests/basic/tier/legacy-many.t index 2c7ff3e5407..6e1147aec2d 100644 --- a/tests/basic/tier/legacy-many.t +++ b/tests/basic/tier/legacy-many.t @@ -9,13 +9,12 @@ LAST_BRICK=3  CACHE_BRICK_FIRST=4  CACHE_BRICK_LAST=5  DEMOTE_TIMEOUT=12 -PROMOTE_TIMEOUT=5 +PROMOTE_TIMEOUT=12  MIGRATION_TIMEOUT=10  DEMOTE_FREQ=60 -PROMOTE_FREQ=4 +PROMOTE_FREQ=10  TEST_DIR="test_files" -NUM_FILES=20 - +NUM_FILES=15  function read_all {      for file in * @@ -49,19 +48,25 @@ wait  TEST $CLI volume attach-tier $V0 replica 2 $H0:$B0/${V0}$CACHE_BRICK_FIRST $H0:$B0/${V0}$CACHE_BRICK_LAST  TEST $CLI volume rebalance $V0 tier status +  TEST $CLI volume set $V0 cluster.tier-demote-frequency $DEMOTE_FREQ  TEST $CLI volume set $V0 cluster.tier-promote-frequency $PROMOTE_FREQ  TEST $CLI volume set $V0 cluster.read-freq-threshold 0  TEST $CLI volume set $V0 cluster.write-freq-threshold 0 +# wait a little for lookup heal to finish +sleep 10 +  # Read "legacy" files  drop_cache $M0 -cd ${TEST_DIR} + +sleep_until_mid_cycle $DEMOTE_FREQ +  TEST read_all  # Test to make sure files were promoted as expected -sleep $DEMOTE_TIMEOUT -EXPECT_WITHIN $DEMOTE_TIMEOUT "0" check_counters $NUM_FILES 0 +sleep $PROMOTE_TIMEOUT +EXPECT_WITHIN $PROMOTE_TIMEOUT "0" check_counters $NUM_FILES 0  cd;  cleanup diff --git a/tests/basic/tier/tier.t b/tests/basic/tier/tier.t index 5bb2dc95164..a197d6eb127 100755 --- a/tests/basic/tier/tier.t +++ b/tests/basic/tier/tier.t @@ -11,22 +11,14 @@ DEMOTE_TIMEOUT=12  PROMOTE_TIMEOUT=5  MIGRATION_TIMEOUT=10  DEMOTE_FREQ=4 -PROMOTE_FREQ=4 - - -# Timing adjustment to avoid spurious errors with first instances of  file_on_fast_tier -function sleep_first_cycle { -    startTime=$(date +%s) -    mod=$(( ( $startTime % $DEMOTE_FREQ ) + 1 )) -    sleep $mod -} +PROMOTE_FREQ=12  function file_on_slow_tier {      found=0      for i in `seq 0 $LAST_BRICK`; do -        test -e $B0/${V0}${i}/$1 && found=1 && break; +        test -e "$B0/${V0}${i}/$1" && found=1 && break;      done      if [ "$found" == "1" ] @@ -56,7 +48,7 @@ function file_on_fast_tier {      found=0      for j in `seq $CACHE_BRICK_FIRST $CACHE_BRICK_LAST`; do -        test -e $B0/${V0}${j}/$1 && found=1 && break; +        test -e "$B0/${V0}${j}/$1" && found=1 && break;      done @@ -120,10 +112,14 @@ TEST ! $CLI volume set $V0 cluster.tier-max-files -3  TEST ! $CLI volume set $V0 cluster.watermark-low 90  # stop the volume and restart it. The rebalance daemon should restart. +cd /tmp +umount $M0  TEST $CLI volume stop $V0  TEST $CLI volume start $V0 +TEST $GFS --volfile-id=/$V0 --volfile-server=$H0 $M0; +cd $M0 -sleep_first_cycle +sleep_first_cycle $DEMOTE_FREQ  $CLI volume tier $V0 status  #Tier options expect non-negative value @@ -158,9 +154,12 @@ uuidgen > /tmp/d1/data2.txt  md5data2=$(fingerprint /tmp/d1/data2.txt)  cp /tmp/d1/data2.txt ./d1/data2.txt -uuidgen > /tmp/d1/data3.txt -md5data3=$(fingerprint /tmp/d1/data3.txt) -mv /tmp/d1/data3.txt ./d1/data3.txt +#File with spaces and special characters. +SPACE_FILE="file with spaces & $peci@l ch@r@cter$ @!@$%^$#@^^*&%$#$%.txt" + +uuidgen > "/tmp/d1/$SPACE_FILE" +md5space=$(fingerprint "/tmp/d1/$SPACE_FILE") +mv "/tmp/d1/$SPACE_FILE" "./d1/$SPACE_FILE"  # Check auto-demotion on write new.  sleep $DEMOTE_TIMEOUT @@ -169,11 +168,12 @@ sleep $DEMOTE_TIMEOUT  UUID=$(uuidgen)  echo $UUID >> /tmp/d1/data2.txt  md5data2=$(fingerprint /tmp/d1/data2.txt) -echo $UUID >> ./d1/data2.txt -# Check promotion on read to slow tier +sleep_until_mid_cycle $DEMOTE_FREQ  drop_cache $M0 -cat d1/data3.txt + +echo $UUID >> ./d1/data2.txt +cat "./d1/$SPACE_FILE"  sleep $PROMOTE_TIMEOUT  sleep $DEMOTE_FREQ @@ -185,7 +185,7 @@ TEST glusterd  EXPECT "0" file_on_slow_tier d1/data.txt $md5data  EXPECT "0" file_on_slow_tier d1/data2.txt $md5data2 -EXPECT "0" file_on_slow_tier d1/data3.txt $md5data3 +EXPECT "0" file_on_slow_tier "./d1/$SPACE_FILE" $md5space  TEST $CLI volume tier $V0 detach start diff --git a/tests/tier.rc b/tests/tier.rc index 3fa6af6a40f..4fd24de0659 100644 --- a/tests/tier.rc +++ b/tests/tier.rc @@ -99,3 +99,16 @@ function confirm_vol_stopped {      fi  } + +function sleep_first_cycle { +    startTime=$(date +%s) +    mod=$(( ( $startTime % $1 ) + 1 )) +    sleep $mod +} + +function sleep_until_mid_cycle { +    startTime=$(date +%s) +    mod=$(( ( $startTime % $1 ) + 1 )) +    mod=$(( $mod + $1 / 2 )) +    sleep $mod +} diff --git a/xlators/cluster/dht/src/tier.c b/xlators/cluster/dht/src/tier.c index 31d5e8b627e..618b82d18ee 100644 --- a/xlators/cluster/dht/src/tier.c +++ b/xlators/cluster/dht/src/tier.c @@ -31,7 +31,6 @@ static void *libhandle;  static gfdb_methods_t gfdb_methods;  #define DB_QUERY_RECORD_SIZE 4096 -#define  PROMOTION_CYCLE_CNT 4  static int @@ -1067,7 +1066,14 @@ tier_build_migration_qfile (demotion_args_t *args,                  goto out;          }          time_in_past.tv_sec = current_time.tv_sec - time_in_past.tv_sec; -        time_in_past.tv_usec = current_time.tv_usec - time_in_past.tv_usec; + +        /* The migration daemon may run a varrying numberof usec after the sleep */ +        /* call triggers. A file may be registered in CTR some number of usec X */ +        /* after the daemon started and missed in the subsequent cycle if the */ +        /* daemon starts Y usec after the period in seconds where Y>X. Normalize */ +        /* away this problem by always setting usec to 0. */ +        time_in_past.tv_usec = 0; +          gfdb_brick_dict_info.time_stamp = &time_in_past;          gfdb_brick_dict_info._gfdb_promote = is_promotion;          gfdb_brick_dict_info._query_cbk_args = query_cbk_args; @@ -1482,7 +1488,7 @@ tier_start (xlator_t *this, gf_defrag_info_t *defrag)                          promotion_args.this = this;                          promotion_args.brick_list = &bricklist_cold;                          promotion_args.defrag = defrag; -                        promotion_args.freq_time = freq_promote *  PROMOTION_CYCLE_CNT; +                        promotion_args.freq_time = freq_promote;                          ret_promotion = pthread_create (&promote_thread,                                                  NULL, &tier_promote,                                                  &promotion_args);  | 
