Modify the calculation formula of max_concurrency

0410cbcf · TousakaRin · 9d5ca591 · 0410cbcf · 0410cbcf · 0410cbcf
Commit 0410cbcf authored Aug 13, 2018 by TousakaRin
Showing with 85 additions and 49 deletions

auto_concurrency_limiter.cpp src/brpc/policy/auto_concurrency_limiter.cpp +77 -44

auto_concurrency_limiter.h src/brpc/policy/auto_concurrency_limiter.h +7 -4

server.cpp src/brpc/server.cpp +1 -1

No files found.
--- a/src/brpc/policy/auto_concurrency_limiter.cpp
+++ b/src/brpc/policy/auto_concurrency_limiter.cpp
@@ -22,40 +22,51 @@
 namespace brpc {
 namespace policy {
-DEFINE_int32(auto_cl_peak_qps_window_size, 30, "");
+DEFINE_int32(auto_cl_peak_qps_window_size, 50, 
+             "The number of samples windows used for peak-qps calculations.");
 DEFINE_int32(auto_cl_sampling_interval_us, 100, 
-    "Interval for sampling request in auto concurrency limiter");
+             "Interval for sampling request in auto concurrency limiter");
 DEFINE_int32(auto_cl_sample_window_size_ms, 1000,
-    "Sample window size for update max concurrency in grandient "
+             "Sample window size for update max concurrency in grandient "
-    "concurrency limiter");
+             "concurrency limiter");
 DEFINE_int32(auto_cl_min_sample_count, 100,
-    "Minimum sample count for update max concurrency");
+             "Minimum sample count for update max concurrency");
-DEFINE_double(auto_cl_adjust_smooth, 0.9,
+DEFINE_int32(auto_cl_max_sample_count, 500,
-    "Smooth coefficient for adjust the max concurrency, the value is 0-1,"
+             "Maximum sample count for update max concurrency");
-    "the larger the value, the smaller the amount of each change");
 DEFINE_int32(auto_cl_initial_max_concurrency, 40,
-    "Initial max concurrency for grandient concurrency limiter");
+             "Initial max concurrency for grandient concurrency limiter");
-DEFINE_bool(auto_cl_enable_error_punish, true,
+DEFINE_int32(auto_cl_reset_interval_ms, 50000, 
-    "Whether to consider failed requests when calculating maximum concurrency");
+             "Interval for remeasurement of noload_latency. The period of "
+             "remeasurement of noload_latency will halve max_concurrency.");
+DEFINE_int32(auto_cl_reset_duration_ms, 2000, 
+             "The duration of the remeasurement of noload_latency.");
+DEFINE_int32(auto_cl_min_concurrency, 40, "Minimum value of max_concurrency");
+DEFINE_double(auto_cl_adjust_smooth, 0.9,
+              "Smooth coefficient for adjust the max concurrency, the value "
+              "is 0-1, the larger the value, the smaller the amount of each "
+              "change");
 DEFINE_double(auto_cl_fail_punish_ratio, 1.0,
-    "Use the failed requests to punish normal requests. The larger the "
+              "Use the failed requests to punish normal requests. The larger "
-    "configuration item, the more aggressive the penalty strategy.");
+              "the configuration item, the more aggressive the penalty strategy.");
-DEFINE_int32(auto_cl_min_reserved_concurrency, 10, "");
+DEFINE_double(auto_cl_overload_threshold, 0.40, 
-DEFINE_int32(auto_cl_reset_count, 30, 
+              "Expected ratio of latency fluctuations");
-    "The service's latency will be re-measured every `reset_count' windows.");
-DEFINE_double(auto_cl_latency_fluctuate_rate, 0.4, "");
+DEFINE_bool(auto_cl_enable_error_punish, true,
+            "Whether to consider failed requests when calculating maximum concurrency");
 static int32_t cast_max_concurrency(void* arg) {
    return *(int32_t*) arg;
 }
 AutoConcurrencyLimiter::AutoConcurrencyLimiter()
-    : _reset_count(NextResetCount())
+    : _reset_start_ms(NextResetTime())
+    , _reset_end_ms(0)
    , _min_latency_us(-1)
-    , _smooth(FLAGS_auto_cl_adjust_smooth)
    , _ema_peak_qps(-1)
-    , _rest_noload_count(0)
    , _qps_bq(FLAGS_auto_cl_peak_qps_window_size)
+    , _smooth(FLAGS_auto_cl_adjust_smooth)
+    , _overload_threshold(FLAGS_auto_cl_overload_threshold)
    , _max_concurrency_bvar(cast_max_concurrency, &_max_concurrency)
    , _last_sampling_time_us(0)
    , _total_succ_req(0)
@@ -110,15 +121,17 @@ void AutoConcurrencyLimiter::OnResponded(int error_code, int64_t latency_us) {
            if (max_concurrency != 0) {
                LOG(INFO) 
                    << "MaxConcurrency updated by auto limiter,"
-                    << "current_max_concurrency:" << max_concurrency; 
+                    << "current_max_concurrency:" << max_concurrency << " " << _min_latency_us;
            }
        }
    }
 }
-int AutoConcurrencyLimiter::NextResetCount() {
+int64_t AutoConcurrencyLimiter::NextResetTime() {
-    int max_reset_count = FLAGS_auto_cl_reset_count;
+    int64_t reset_start_ms = butil::gettimeofday_ms() + 
-    return butil::fast_rand_less_than(max_reset_count / 2) + max_reset_count / 2;
+        FLAGS_auto_cl_reset_interval_ms / 2 +
+        butil::fast_rand_less_than(FLAGS_auto_cl_reset_interval_ms / 2);
+    return reset_start_ms;
 }
 int32_t AutoConcurrencyLimiter::AddSample(int error_code, 
@@ -138,10 +151,12 @@ int32_t AutoConcurrencyLimiter::AddSample(int error_code,
        _sw.total_succ_us += latency_us;
    }
-    if (sampling_time_us - _sw.start_time_us < 
+    if (_sw.succ_count + _sw.failed_count < 
-            FLAGS_auto_cl_sample_window_size_ms * 1000 ||
+            FLAGS_auto_cl_min_sample_count ||
-        _sw.succ_count + _sw.failed_count <
+        (sampling_time_us - _sw.start_time_us < 
-            FLAGS_auto_cl_min_sample_count) {
+            FLAGS_auto_cl_sample_window_size_ms &&
+         _sw.succ_count + _sw.failed_count <
+            FLAGS_auto_cl_max_sample_count)) {
        return 0;
    }
@@ -176,7 +191,7 @@ void AutoConcurrencyLimiter::UpdateMinLatency(int64_t latency_us) {
 }
 void AutoConcurrencyLimiter::UpdateQps(int32_t succ_count, 
-                                           int64_t sampling_time_us) {
+                                       int64_t sampling_time_us) {
    double qps = 1000000.0 * succ_count / (sampling_time_us - _sw.start_time_us);
    _qps_bq.elim_push(qps);
    double peak_qps = *(_qps_bq.bottom());
@@ -184,7 +199,12 @@ void AutoConcurrencyLimiter::UpdateQps(int32_t succ_count,
    for (size_t i = 0; i < _qps_bq.size(); ++i) {
        peak_qps = std::max(*(_qps_bq.bottom(i)), peak_qps);
    }
-    _ema_peak_qps = _ema_peak_qps * _smooth + peak_qps * (1 - _smooth);
+    if (peak_qps >= _ema_peak_qps) {
+        _ema_peak_qps = peak_qps;
+    } else {
+        _ema_peak_qps = _ema_peak_qps * _smooth + peak_qps * (1 - _smooth);
+    }
 }
 int32_t AutoConcurrencyLimiter::UpdateMaxConcurrency(int64_t sampling_time_us) {
@@ -197,30 +217,43 @@ int32_t AutoConcurrencyLimiter::UpdateMaxConcurrency(int64_t sampling_time_us) {
    UpdateMinLatency(avg_latency);
    UpdateQps(total_succ_req, sampling_time_us);
-    if (_rest_noload_count > 0) {
+    if (_reset_end_ms > sampling_time_us / 1000) {
-        --_rest_noload_count;
        return 0;
    }
    int next_max_concurrency = 0;
-    if (--_reset_count == 0) {
+    if (_reset_start_ms <= sampling_time_us / 1000) {
        _min_latency_us = -1;
-        _reset_count = NextResetCount();
+        _reset_start_ms = NextResetTime();
-        _rest_noload_count = std::ceil(
+        _reset_end_ms = sampling_time_us/1000 + FLAGS_auto_cl_reset_duration_ms;
-            double(avg_latency) / FLAGS_auto_cl_sample_window_size_ms / 1000);
        next_max_concurrency = _max_concurrency / 2;
    } else {
-        int32_t noload_concurrency = _ema_peak_qps * _min_latency_us / 1000000.0;
+        int32_t noload_concurrency = std::ceil(_min_latency_us * _ema_peak_qps / 1000000);
-        if (avg_latency > (1 + FLAGS_auto_cl_latency_fluctuate_rate) * _min_latency_us) {
+        if (avg_latency < (1.0 + _overload_threshold) * _min_latency_us) {
-            next_max_concurrency = noload_concurrency;
+//            LOG(INFO) << "<<<" << _min_latency_us << " " << avg_latency << " " << _ema_peak_qps << " " << noload_concurrency;
+            next_max_concurrency = std::ceil(noload_concurrency * (2.0 + _overload_threshold - double(avg_latency) / _min_latency_us));
        } else {
-            next_max_concurrency = 
+//            LOG(INFO) << ">>>" << _min_latency_us << " " << avg_latency << " " << _ema_peak_qps << " " << noload_concurrency;
-                std::ceil(_ema_peak_qps * ((2 + FLAGS_auto_cl_latency_fluctuate_rate) * _min_latency_us - avg_latency) / 1000000.0 );
+            next_max_concurrency = noload_concurrency;
-            if (avg_latency <= (1 + FLAGS_auto_cl_latency_fluctuate_rate) * _min_latency_us) {
-                next_max_concurrency = std::max(next_max_concurrency, noload_concurrency + FLAGS_auto_cl_min_reserved_concurrency);
-            }
        }
+//        if (avg_latency > (1.0 + _overload_threshold) * _min_latency_us) {
+//            next_max_concurrency = noload_concurrency;
+// //           LOG(INFO) << " >>> " << next_max_concurrency << " " << _min_latency_us / 1000;
+//        } else if (avg_latency < (1.0 + _noload_threshold) * _min_latency_us) {
+//            next_max_concurrency = 
+//                noload_concurrency * (1.0 + _overload_threshold); 
+//  //         LOG(INFO) << " <<< " << next_max_concurrency << " " << _min_latency_us / 1000;
+//        } else {
+//            next_max_concurrency = 
+//                noload_concurrency * (2.0 + _overload_threshold - 
+//                double(avg_latency) / _min_latency_us);
+//   //         LOG(INFO) << " --- " << next_max_concurrency << " " << _min_latency_us / 1000;
+//        }
    }
+    next_max_concurrency = 
+        std::max(next_max_concurrency, FLAGS_auto_cl_min_concurrency);
    if (next_max_concurrency != _max_concurrency) {
        _max_concurrency = next_max_concurrency;

--- a/src/brpc/policy/auto_concurrency_limiter.h
+++ b/src/brpc/policy/auto_concurrency_limiter.h
@@ -51,7 +51,7 @@ private:
    };
    int32_t AddSample(int error_code, int64_t latency_us, int64_t sampling_time_us);
-    int NextResetCount();
+    int64_t NextResetTime();
    // The following methods are not thread safe and can only be called 
    // in AppSample()
@@ -62,12 +62,15 @@ private:
    double peak_qps();
    SampleWindow _sw;
-    int _reset_count;
+    int64_t _reset_start_ms;
+    int64_t _reset_end_ms;
    int64_t _min_latency_us;
-    const double _smooth;
    double _ema_peak_qps;
-    int _rest_noload_count;
    butil::BoundedQueue<double> _qps_bq;
+    const double _smooth;
+    const double _overload_threshold;
    butil::Mutex _sw_mutex;
    bvar::PassiveStatus<int32_t> _max_concurrency_bvar;
    butil::atomic<int64_t> BAIDU_CACHELINE_ALIGNMENT _last_sampling_time_us;

--- a/src/brpc/server.cpp
+++ b/src/brpc/server.cpp
@@ -876,7 +876,7 @@ int Server::StartInternal(const butil::ip_t& ip,
        static_cast<int>(_options.max_concurrency) != 0) {
        _cl = ConcurrencyLimiter::CreateConcurrencyLimiterOrDie(
            _options.max_concurrency);
-        _cl->Expose("Global_Concurrency_Limiter");
+        _cl->Expose("Server_Concurrency_Limiter");
    } else {
        if (_cl) {
            _cl->Destroy();