couchbase
diff --git a/‎engines/ep/CMakeLists.txt‎
Lines changed: 13 additions & 0 deletions b/‎engines/ep/CMakeLists.txt‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎engines/ep/configuration.json‎
Lines changed: 64 additions & 4 deletions b/‎engines/ep/configuration.json‎
Lines changed: 64 additions & 4 deletions
diff --git a/‎engines/ep/src/defragmenter.cc‎
Lines changed: 122 additions & 12 deletions b/‎engines/ep/src/defragmenter.cc‎
Lines changed: 122 additions & 12 deletions
@@ -92,6 +92,9 @@ add_executable(gencode tools/gencode.cc)
 kv_enable_pch(gencode)
 add_executable(genconfig tools/genconfig.cc)
 kv_enable_pch(genconfig)
+
+add_executable(pid_runner tools/pid_runner.cc $<TARGET_OBJECTS:ep_objs>)
+
 if (WIN32)
     # windows need getopt
     target_link_libraries(gencode PRIVATE platform)
@@ -128,6 +131,15 @@ target_link_libraries(kvstore_gen PRIVATE
         ${LIBEVENT_LIBRARIES}
 )
 
+# pid_runner is an executable, so nothing consumes its link interface: use
+# the PRIVATE keyword signature, matching the other target_link_libraries
+# calls in this file.
+target_link_libraries(pid_runner PRIVATE
+        ep-engine_collections
+        mcd_executor
+        mcbp
+        mcd_time
+        mcd_tracing
+        xattr
+        ${EP_STORAGE_LIBS})
+
 ADD_CUSTOM_COMMAND(OUTPUT ${CMAKE_CURRENT_BINARY_DIR}/src/stats-info.c
                           ${CMAKE_CURRENT_BINARY_DIR}/src/stats-info.h
                   COMMAND
@@ -350,6 +362,7 @@ ADD_LIBRARY(ep_objs OBJECT
             src/mutation_log_entry.cc
             src/paging_visitor.cc
             src/persistence_callback.cc
+            src/pid_controller.cc
             src/pre_link_document_context.cc
             src/pre_link_document_context.h
             src/progress_tracker.cc
 
@@ -315,10 +315,9 @@
         "dcp_noop_mandatory_for_v5_features": {
             "default": "true",
             "descr": "Forces clients to enable noop for v5 features",
-	    "dynamic": true,
+            "dynamic": true,
             "type": "bool"
         },
-
         "defragmenter_enabled": {
             "default": "true",
             "descr": "True if defragmenter task is enabled",
@@ -328,7 +327,7 @@
         "defragmenter_interval": {
             "default": "10.0",
             "descr": "How often defragmenter task should be run (in seconds).",
-	    "dynamic": true,
+            "dynamic": true,
             "type": "float"
         },
         "defragmenter_age_threshold": {
@@ -346,14 +345,75 @@
         "defragmenter_chunk_duration": {
             "default": "20",
             "descr": "Maximum time (in ms) defragmentation task will run for before being paused (and resumed at the next defragmenter_interval).",
-	    "dynamic": true,
+            "dynamic": true,
             "type": "size_t",
             "validator": {
                 "range": {
                     "min": 1
                 }
             }
         },
+        "defragmenter_mode" : {
+            "default": "auto_pid",
+            "descr": "Determines how the defragmenter controls its sleep interval. When static, defragmenter_interval is used. When auto_linear, scale the sleep time using the scored fragmentation when it falls between defragmenter_auto_lower_threshold and defragmenter_auto_upper_threshold. When auto_pid, use a PID controller to compute reductions in the sleep interval when scored fragmentation is above defragmenter_auto_lower_threshold.",
+            "dynamic": false,
+            "type": "std::string",
+            "validator": {
+                "enum": [
+                    "static",
+                    "auto_linear",
+                    "auto_pid"
+                ]
+            }
+        },
+        "defragmenter_auto_lower_threshold" : {
+            "default": "0.07",
+            "descr": "When mode is not static and scored fragmentation is above this value, a sleep time between defragmenter_auto_min_sleep and defragmenter_auto_max_sleep will be used",
+            "dynamic": false,
+            "type": "float"
+        },
+        "defragmenter_auto_upper_threshold" : {
+            "default": "0.25",
+            "descr": "When mode is auto_linear and scored fragmentation is above this value, the defragmenter will use defragmenter_auto_min_sleep",
+            "dynamic": false,
+            "type": "float"
+        },
+        "defragmenter_auto_max_sleep" : {
+            "default": "10.0",
+            "descr": "The maximum sleep (in seconds) that the auto controller can set",
+            "dynamic": false,
+            "type": "float"
+        },
+        "defragmenter_auto_min_sleep" : {
+            "default": "0.0",
+            "descr": "The minimum sleep (in seconds) that the auto controller can set",
+            "dynamic": false,
+            "type": "float"
+        },
+        "defragmenter_auto_pid_p" : {
+            "default": "0.3",
+            "descr": "The p term for the PID controller",
+            "dynamic": false,
+            "type": "float"
+        },
+        "defragmenter_auto_pid_i" : {
+            "default": "0.0000197",
+            "descr": "The i term for the PID controller",
+            "dynamic": false,
+            "type": "float"
+        },
+        "defragmenter_auto_pid_d" : {
+            "default": "0.0",
+            "descr": "The d term for the PID controller",
+            "dynamic": false,
+            "type": "float"
+        },
+        "defragmenter_auto_pid_dt" : {
+            "default": "30000",
+            "descr": "The dt (interval) term for the PID controller. Value represents milliseconds",
+            "dynamic": false,
+            "type": "size_t"
+        },
         "durability_timeout_task_interval": {
             "default": "25",
             "descr": "Interval (in ms) between subsequent runs of the DurabilityTimeoutTask",
 
@@ -25,22 +25,40 @@ DefragmenterTask::DefragmenterTask(EventuallyPersistentEngine* e,
                                    EPStats& stats_)
     : GlobalTask(e, TaskId::DefragmenterTask, 0, false),
       stats(stats_),
-      epstore_position(engine->getKVBucket()->startPosition()) {
+      epstore_position(engine->getKVBucket()->startPosition()),
+      pid(engine->getConfiguration().getDefragmenterAutoLowerThreshold(),
+          engine->getConfiguration().getDefragmenterAutoPidP(),
+          engine->getConfiguration().getDefragmenterAutoPidI(),
+          engine->getConfiguration().getDefragmenterAutoPidD(),
+          std::chrono::milliseconds{
+                  engine->getConfiguration().getDefragmenterAutoPidDt()}) {
 }
 
 bool DefragmenterTask::run() {
     TRACE_EVENT0("ep-engine/task", "DefragmenterTask");
+    std::chrono::duration<double> sleepTime; // seconds; assigned on both branches below
     if (engine->getConfiguration().isDefragmenterEnabled()) {
-        defrag();
+        sleepTime = defrag(); // defrag() also reports how long to sleep afterwards
+    } else { // disabled: keep waking at the static defragmenter_interval
+        sleepTime = std::chrono::duration<double>{
+                engine->getConfiguration().getDefragmenterInterval()};
     }
-    snooze(getSleepTime());
+    snooze(sleepTime.count()); // snooze() takes the sleep as a plain number of seconds
     if (engine->getEpStats().isShutdown) {
         return false;
     }
     return true;
 }
 
-void DefragmenterTask::defrag() {
+std::chrono::duration<double> DefragmenterTask::defrag() {
+    auto currentFragStats = cb::ArenaMalloc::getFragmentationStats(
+            engine->getArenaMallocClient());
+
+    auto sleepAndRun = calculateSleepTimeAndRunState(currentFragStats);
+    if (!sleepAndRun.runDefragger) {
+        return sleepAndRun.sleepTime;
+    }
+
     // Get our pause/resume visitor. If we didn't finish the previous pass,
     // then resume from where we last were, otherwise create a new visitor
     // starting from the beginning.
@@ -61,11 +79,9 @@ void DefragmenterTask::defrag() {
             ss << " resuming from " << epstore_position << ", ";
             ss << prAdapter->getHashtablePosition() << ".";
         }
-        auto fragStats = cb::ArenaMalloc::getFragmentationStats(
-                engine->getArenaMallocClient());
         ss << " Using chunk_duration=" << getChunkDuration().count() << " ms."
            << " mem_used=" << stats.getEstimatedTotalMemoryUsed() << ", "
-           << fragStats;
+           << currentFragStats;
         EP_LOG_DEBUG("{}", ss.str());
     }
 
@@ -119,20 +135,22 @@ void DefragmenterTask::defrag() {
         std::chrono::microseconds duration =
                 std::chrono::duration_cast<std::chrono::microseconds>(end -
                                                                       start);
-        auto fragStats = cb::ArenaMalloc::getFragmentationStats(
-                engine->getArenaMallocClient());
+
         ss << " Took " << duration.count() << " us."
            << " moved " << visitor.getDefragCount() << "/"
            << visitor.getVisitedCount() << " visited documents."
            << " mem_used=" << stats.getEstimatedTotalMemoryUsed() << ", "
-           << fragStats << ". Sleeping for " << getSleepTime() << " seconds.";
+           << cb::ArenaMalloc::getFragmentationStats(
+                      engine->getArenaMallocClient())
+           << ". Sleeping for " << sleepAndRun.sleepTime.count() << " seconds.";
         EP_LOG_DEBUG("{}", ss.str());
     }
 
     // Delete(reset) visitor if it finished.
     if (completed) {
         prAdapter.reset();
     }
+    return sleepAndRun.sleepTime;
 }
 
 void DefragmenterTask::stop() {
@@ -154,8 +172,17 @@ std::chrono::microseconds DefragmenterTask::maxExpectedDuration() const {
     return getChunkDuration() * 10;
 }
 
-double DefragmenterTask::getSleepTime() const {
-    return engine->getConfiguration().getDefragmenterInterval();
+/**
+ * Select the sleep-time policy named by the defragmenter_mode setting.
+ *
+ * @param fragStats fragmentation statistics handed to the auto policies
+ * @return the sleep time and whether the defragmenter should run. Any mode
+ *         other than "auto_linear" / "auto_pid" sleeps for
+ *         defragmenter_interval and always runs.
+ */
+DefragmenterTask::SleepTimeAndRunState
+DefragmenterTask::calculateSleepTimeAndRunState(
+        const cb::FragmentationStats& fragStats) {
+    const auto& config = engine->getConfiguration();
+    const auto mode = config.getDefragmenterMode();
+
+    if (mode == "auto_linear") {
+        return calculateSleepLinear(fragStats);
+    }
+    if (mode == "auto_pid") {
+        return calculateSleepPID(fragStats);
+    }
+
+    // Fixed interval: always run the defragmenter.
+    const std::chrono::duration<double> fixedSleep{
+            config.getDefragmenterInterval()};
+    return {fixedSleep, true};
 }
 
 size_t DefragmenterTask::getAgeThreshold() const {
@@ -197,3 +224,86 @@ std::chrono::milliseconds DefragmenterTask::getChunkDuration() const {
 DefragmentVisitor& DefragmenterTask::getDefragVisitor() {
     return dynamic_cast<DefragmentVisitor&>(prAdapter->getHTVisitor());
 }
+
+/**
+ * Weight the fragmentation ratio by how much of the low watermark is
+ * resident, so that the same ratio scores lower when little memory is in use.
+ *
+ * @param fragStats fragmentation statistics to score
+ * @return fragmentationRatio * (min(resident, low_wat) / low_wat), or 0 when
+ *         the low watermark is 0
+ */
+float DefragmenterTask::getScoredFragmentation(
+        const cb::FragmentationStats& fragStats) const {
+    const auto lowWater = stats.mem_low_wat.load();
+    if (lowWater == 0) {
+        // With a zero low watermark the weighting below is 0/0 (NaN). A NaN
+        // score fails every threshold comparison in the sleep calculations,
+        // so report "no scored fragmentation" instead.
+        return 0.0f;
+    }
+
+    // Cap the resident bytes at the low watermark so the weight is at most 1.
+    const auto resident = fragStats.getResidentBytes();
+    const auto rss = resident > lowWater ? lowWater : resident;
+    return fragStats.getFragmentationRatio() *
+           (static_cast<double>(rss) / static_cast<double>(lowWater));
+}
+
+/**
+ * Compute the sleep time for defragmenter_mode=auto_linear.
+ *
+ * The scored fragmentation is mapped linearly onto the configured sleep
+ * range: at defragmenter_auto_lower_threshold the sleep is
+ * defragmenter_auto_max_sleep, shrinking towards defragmenter_auto_min_sleep
+ * as the score approaches defragmenter_auto_upper_threshold.
+ *
+ * @param fragStats fragmentation statistics sampled for this run
+ * @return the sleep time (seconds) and whether the defragmenter should run;
+ *         it is only skipped when the score is below the lower threshold
+ */
+DefragmenterTask::SleepTimeAndRunState DefragmenterTask::calculateSleepLinear(
+        const cb::FragmentationStats& fragStats) {
+    const auto score = getScoredFragmentation(fragStats);
+
+    const auto& conf = engine->getConfiguration();
+    const auto maxSleep = conf.getDefragmenterAutoMaxSleep();
+    const auto minSleep = conf.getDefragmenterAutoMinSleep();
+    const auto lower = conf.getDefragmenterAutoLowerThreshold();
+    const auto upper = conf.getDefragmenterAutoUpperThreshold();
+
+    // Fragmentation is acceptable: sleep as long as allowed and skip the run.
+    if (score < lower) {
+        return {std::chrono::duration<double>{maxSleep}, false};
+    }
+
+    // lower <= score < upper: reduce the sleep in proportion to how far the
+    // score has moved through the [lower, upper) range. A score exactly at
+    // 'lower' therefore yields maxSleep (previously it fell through to the
+    // minSleep branch). Reaching here implies upper > lower, so the division
+    // is safe.
+    if (score < upper) {
+        const double fraction = (static_cast<double>(score) - lower) /
+                                (static_cast<double>(upper) - lower);
+        const double reduction =
+                (static_cast<double>(maxSleep) - minSleep) * fraction;
+        return {std::chrono::duration<double>{maxSleep - reduction}, true};
+    }
+
+    // At or beyond the upper threshold: run as often as allowed.
+    return {std::chrono::duration<double>{minSleep}, true};
+}
+
+/**
+ * Compute the sleep time for defragmenter_mode=auto_pid.
+ *
+ * While the scored fragmentation is at or above
+ * defragmenter_auto_lower_threshold, the PID controller's output is added to
+ * defragmenter_auto_max_sleep and the result is kept within
+ * [defragmenter_auto_min_sleep, defragmenter_auto_max_sleep].
+ *
+ * @param fragStats fragmentation statistics sampled for this run
+ * @return the sleep time (seconds) and whether the defragmenter should run;
+ *         it is skipped (and the PID reset) when the score is below the
+ *         lower threshold
+ */
+DefragmenterTask::SleepTimeAndRunState DefragmenterTask::calculateSleepPID(
+        const cb::FragmentationStats& fragStats) {
+    auto score = getScoredFragmentation(fragStats);
+    const auto& conf = engine->getConfiguration();
+    auto maxSleep = conf.getDefragmenterAutoMaxSleep();
+    auto minSleep = conf.getDefragmenterAutoMinSleep();
+
+    // If fragmentation goes below our set-point (SP), we can't continue to
+    // use the PID. In more general usage a PID would "speed up/slow down" to
+    // reach the SP, but we cannot force fragmentation up; we are simply happy
+    // that it is below the SP. So reset, and begin ramping again the next
+    // time the score goes over the SP.
+    if (score < conf.getDefragmenterAutoLowerThreshold()) {
+        // Reset the PID ready for the next time fragmentation increases
+        pid.reset();
+        return {std::chrono::duration<double>{maxSleep}, false};
+    }
+
+    // At or above the set-point, use the PID to calculate a correction. This
+    // is expected to be zero or negative.
+    // NOTE(review): a non-zero D term could presumably make it positive -
+    // confirm against the PID controller implementation.
+    auto correction = stepPid(score);
+
+    // Add the correction to the maximum to produce a sleep time
+    auto rv = maxSleep + correction;
+
+    // Keep the result inside the configured [minSleep, maxSleep] range
+    if (rv < minSleep) {
+        rv = minSleep;
+    } else if (rv > maxSleep) {
+        rv = maxSleep;
+    }
+
+    return {std::chrono::duration<double>{rv}, true};
+}
+
+/**
+ * Advance the PID controller by one step.
+ *
+ * @param pv the process variable passed to the controller
+ * @return the controller's output for this step
+ */
+float DefragmenterTask::stepPid(float pv) {
+    const auto correction = pid.step(pv);
+    return correction;
+}