Skip to content

Commit

Permalink
rate-limiter: fix clock skew if enabling auto-tuned. (#401)
Browse files Browse the repository at this point in the history
close tikv/tikv#17995

Signed-off-by: lucasliang <[email protected]>
  • Loading branch information
LykxSassinator authored Jan 16, 2025
1 parent e255444 commit f65a78f
Show file tree
Hide file tree
Showing 2 changed files with 43 additions and 10 deletions.
39 changes: 29 additions & 10 deletions utilities/rate_limiters/write_amp_based_rate_limiter.cc
Original file line number Diff line number Diff line change
Expand Up @@ -195,7 +195,11 @@ void WriteAmpBasedRateLimiter::Request(int64_t bytes, const Env::IOPriority pri,
if (leader_ == nullptr && IsFrontOfOneQueue(&r)) {
leader_ = &r;
int64_t delta = next_refill_us_ - NowMicrosMonotonic(env_);
delta = delta > 0 ? delta : 0;
// Clamp delta between 0 and refill_period_us_:
// (1) set negative values to 0
// (2) cap maximum wait time to refill_period_us_ to prevent excessive
// delays that could occur due to clock skew.
delta = delta > 0 ? std::min(delta, refill_period_us_) : 0;
if (delta == 0) {
timedout = true;
} else {
Expand Down Expand Up @@ -359,20 +363,35 @@ Status WriteAmpBasedRateLimiter::Tune() {
// lower bound for write amplification estimation
const int kRatioLower = 10;
const int kPercentDeltaMax = 6;
const auto millis_per_tune = 1000 * secs_per_tune_;
// Define the max limit of tick duration limits to handle clock skew.
const auto max_tune_tick_duration_limit =
std::chrono::microseconds(secs_per_tune_ * 1000 * 1000) * 7 /
4; // 1.75x multiplier

std::chrono::microseconds prev_tuned_time = tuned_time_;
const std::chrono::microseconds prev_tuned_time = tuned_time_;
tuned_time_ = std::chrono::microseconds(NowMicrosMonotonic(env_));
auto duration = tuned_time_ - prev_tuned_time;
auto duration_ms =
std::chrono::duration_cast<std::chrono::milliseconds>(duration).count();
// Validate tuning interval to detect system anomalies:
// (1) tuned_time_ < prev_tuned_time: Clock moved backwards (clock skew)
// (2) Interval > max_tune_tick_duration_limit: System stall or severe clock
// skew
if (tuned_time_ <= prev_tuned_time ||
tuned_time_ >= prev_tuned_time + max_tune_tick_duration_limit) {
// Fall back to max rate limiter for safety if duration is invalid or
// exceeds max limit.
SetActualBytesPerSecond(max_bytes_per_sec_.load(std::memory_order_relaxed));
return Status::Aborted();
}
auto duration_ms = std::chrono::duration_cast<std::chrono::milliseconds>(
tuned_time_ - prev_tuned_time)
.count();

int64_t prev_bytes_per_sec = GetBytesPerSecond();

// This function can be called less frequent than we anticipate when
// compaction rate is low. Loop through the actual time slice to correct
// the estimation.
auto millis_per_tune = 1000 * secs_per_tune_;
for (uint32_t i = 0; i < duration_ms / millis_per_tune; i++) {
auto sampling_count = duration_ms / millis_per_tune;
for (uint32_t i = 0; i < sampling_count; i++) {
bytes_sampler_.AddSample(duration_bytes_through_ * 1000 / duration_ms);
highpri_bytes_sampler_.AddSample(duration_highpri_bytes_through_ * 1000 /
duration_ms);
Expand Down Expand Up @@ -441,8 +460,8 @@ void WriteAmpBasedRateLimiter::PaceUp(bool critical) {
}

RateLimiter* NewWriteAmpBasedRateLimiter(
int64_t rate_bytes_per_sec, int64_t refill_period_us /* = 100 * 1000 */,
int32_t fairness /* = 10 */,
int64_t rate_bytes_per_sec /* = 10GiB */,
int64_t refill_period_us /* = 100 * 1000 */, int32_t fairness /* = 10 */,
RateLimiter::Mode mode /* = RateLimiter::Mode::kWritesOnly */,
bool auto_tuned /* = false */, int tune_per_sec /* = 1 */,
size_t smooth_window_size /* = 300 */,
Expand Down
14 changes: 14 additions & 0 deletions utilities/rate_limiters/write_amp_based_rate_limiter_test.cc
Original file line number Diff line number Diff line change
Expand Up @@ -79,6 +79,20 @@ TEST_F(WriteAmpBasedRateLimiterTest, AutoTune) {
limiter.Request(1000 /* bytes */, Env::IO_LOW, nullptr /* stats */,
RateLimiter::OpType::kWrite);
ASSERT_EQ(10485760, limiter.GetBytesPerSecond());
// If there exists clock skew issues, the next Tune()
// should be skipped and use the max_rate_bytes_per_sec
// as the next limit.
thread_env->SleepForMicroseconds(2000 * 1000);
limiter.Request(1000 /* bytes */, Env::IO_LOW, nullptr /* stats */,
RateLimiter::OpType::kWrite);
ASSERT_EQ(10000, limiter.GetBytesPerSecond());
// After recovering, the auto-tune works normally.
for (auto i = 1; i <= 3; i++) {
thread_env->SleepForMicroseconds(1000 * 1000);
limiter.Request(1000 /* bytes */, Env::IO_LOW, nullptr /* stats */,
RateLimiter::OpType::kWrite);
ASSERT_EQ(10485760, limiter.GetBytesPerSecond());
}
// TODO: add more logic for auto-tune
}

Expand Down

0 comments on commit f65a78f

Please sign in to comment.