Skip to content

Commit

Permalink
Fix flaky RemoteIndexRecoveryIT testRerouteRecovery test #9580 (#11918)
Browse files Browse the repository at this point in the history
Signed-off-by: Ashish Singh <ssashish@amazon.com>
  • Loading branch information
ashking94 authored Jan 31, 2024
1 parent 2f8d267 commit c6cebc7
Show file tree
Hide file tree
Showing 3 changed files with 35 additions and 8 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -523,12 +523,12 @@ public void testRerouteRecovery() throws Exception {

logger.info("--> waiting for recovery to start both on source and target");
final Index index = resolveIndex(INDEX_NAME);
assertBusy(() -> {
assertBusyWithFixedSleepTime(() -> {
IndicesService indicesService = internalCluster().getInstance(IndicesService.class, nodeA);
assertThat(indicesService.indexServiceSafe(index).getShard(0).recoveryStats().currentAsSource(), equalTo(1));
indicesService = internalCluster().getInstance(IndicesService.class, nodeB);
assertThat(indicesService.indexServiceSafe(index).getShard(0).recoveryStats().currentAsTarget(), equalTo(1));
});
}, TimeValue.timeValueSeconds(10), TimeValue.timeValueMillis(500));

logger.info("--> request recoveries");
RecoveryResponse response = client().admin().indices().prepareRecoveries(INDEX_NAME).execute().actionGet();
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -157,10 +157,4 @@ public void testDisconnectsDuringRecovery() {
public void testReplicaRecovery() {

}

@AwaitsFix(bugUrl = "https://github.com/opensearch-project/OpenSearch/issues/9580")
public void testRerouteRecovery() {

}

}
Original file line number Diff line number Diff line change
Expand Up @@ -83,6 +83,7 @@
import org.opensearch.common.settings.Settings;
import org.opensearch.common.time.DateUtils;
import org.opensearch.common.time.FormatNames;
import org.opensearch.common.unit.TimeValue;
import org.opensearch.common.util.MockBigArrays;
import org.opensearch.common.util.MockPageCacheRecycler;
import org.opensearch.common.util.concurrent.ThreadContext;
Expand Down Expand Up @@ -1095,6 +1096,38 @@ public static void assertBusy(CheckedRunnable<Exception> codeBlock, long maxWait
}
}

/**
* Runs the code block for the provided max wait time and sleeping for fixed sleep time, waiting for no assertions to trip.
*/
public static void assertBusyWithFixedSleepTime(CheckedRunnable<Exception> codeBlock, TimeValue maxWaitTime, TimeValue sleepTime)
throws Exception {
long maxTimeInMillis = maxWaitTime.millis();
long sleepTimeInMillis = sleepTime.millis();
if (sleepTimeInMillis > maxTimeInMillis) {
throw new IllegalArgumentException("sleepTime is more than the maxWaitTime");
}
long sum = 0;
List<AssertionError> failures = new ArrayList<>();
while (sum <= maxTimeInMillis) {
try {
codeBlock.run();
return;
} catch (AssertionError e) {
failures.add(e);
}
sum += sleepTimeInMillis;
Thread.sleep(sleepTimeInMillis);
}
try {
codeBlock.run();
} catch (AssertionError e) {
for (AssertionError failure : failures) {
e.addSuppressed(failure);
}
throw e;
}
}

/**
* Periodically execute the supplied function until it returns true, or a timeout
* is reached. This version uses a timeout of 10 seconds. If at all possible,
Expand Down

0 comments on commit c6cebc7

Please sign in to comment.