Merge pull request #188 from RedisLabs/fix.mem_increase

filipecosta90 · web-flow · commit e6cd4ce0defc · 2022-08-02T23:21:28.000+01:00
Fixed memory usage increasing over time, caused by storing a latency histogram in every per-second stats record
diff --git a/run_stats.cpp b/run_stats.cpp
@@ -117,6 +117,7 @@ run_stats::run_stats(benchmark_config *config) :
 {
     memset(&m_start_time, 0, sizeof(m_start_time));
     memset(&m_end_time, 0, sizeof(m_end_time));
+    quantiles_list = config->print_percentiles.quantile_list;
 
     if (config->arbitrary_commands->is_defined()) {
         setup_arbitrary_commands(config->arbitrary_commands->size());
@@ -127,6 +128,7 @@ void run_stats::setup_arbitrary_commands(size_t n_arbitrary_commands) {
     m_totals.setup_arbitrary_commands(n_arbitrary_commands);
     m_cur_stats.setup_arbitrary_commands(n_arbitrary_commands);
     m_ar_commands_latency_histograms.resize(n_arbitrary_commands);
+    inst_m_ar_commands_latency_histograms.resize(n_arbitrary_commands);
 }
 
 void run_stats::set_start_time(struct timeval* start_time)
@@ -155,6 +157,16 @@ void run_stats::roll_cur_stats(struct timeval* ts)
 {
     const unsigned int sec = ts_diff(m_start_time, *ts) / 1000000;
     if (sec > m_cur_stats.m_second) {
+        m_cur_stats.m_get_cmd.summarize_quantiles(inst_m_get_latency_histogram,quantiles_list);
+        m_cur_stats.m_set_cmd.summarize_quantiles(inst_m_set_latency_histogram,quantiles_list);
+        m_cur_stats.m_wait_cmd.summarize_quantiles(inst_m_wait_latency_histogram,quantiles_list);
+        for (unsigned int i=0; i<m_cur_stats.m_ar_commands.size(); i++) {
+            m_cur_stats.m_ar_commands[i].summarize_quantiles(inst_m_ar_commands_latency_histograms[i],quantiles_list);
+        hdr_reset(inst_m_ar_commands_latency_histograms[i]);
+        }
+        hdr_reset(inst_m_get_latency_histogram);
+        hdr_reset(inst_m_set_latency_histogram);
+        hdr_reset(inst_m_wait_latency_histogram);
         m_stats.push_back(m_cur_stats);
         m_cur_stats.reset(sec);
     }
@@ -166,7 +178,7 @@ void run_stats::update_get_op(struct timeval* ts, unsigned int bytes, unsigned i
     m_cur_stats.m_get_cmd.update_op(bytes, latency, hits, misses);
     m_totals.update_op(bytes, latency);
     hdr_record_value(m_get_latency_histogram,latency);
-
+    hdr_record_value(inst_m_get_latency_histogram,latency);
 }
 
 void run_stats::update_set_op(struct timeval* ts, unsigned int bytes, unsigned int latency)
@@ -176,6 +188,7 @@ void run_stats::update_set_op(struct timeval* ts, unsigned int bytes, unsigned i
     m_cur_stats.m_set_cmd.update_op(bytes, latency);
     m_totals.update_op(bytes, latency);
     hdr_record_value(m_set_latency_histogram,latency);
+    hdr_record_value(inst_m_set_latency_histogram,latency);
 }
 
 void run_stats::update_moved_get_op(struct timeval* ts, unsigned int bytes, unsigned int latency)
@@ -185,6 +198,7 @@ void run_stats::update_moved_get_op(struct timeval* ts, unsigned int bytes, unsi
     m_cur_stats.m_get_cmd.update_moved_op(bytes, latency);
     m_totals.update_op(bytes, latency);
     hdr_record_value(m_get_latency_histogram,latency);
+    hdr_record_value(inst_m_get_latency_histogram,latency);
 }
 
 void run_stats::update_moved_set_op(struct timeval* ts, unsigned int bytes, unsigned int latency)
@@ -194,6 +208,7 @@ void run_stats::update_moved_set_op(struct timeval* ts, unsigned int bytes, unsi
     m_cur_stats.m_set_cmd.update_moved_op(bytes, latency);
     m_totals.update_op(bytes, latency);
     hdr_record_value(m_set_latency_histogram,latency);
+    hdr_record_value(inst_m_set_latency_histogram,latency);
 }
 
 void run_stats::update_ask_get_op(struct timeval* ts, unsigned int bytes, unsigned int latency)
@@ -203,6 +218,7 @@ void run_stats::update_ask_get_op(struct timeval* ts, unsigned int bytes, unsign
     m_cur_stats.m_get_cmd.update_ask_op(bytes, latency);
     m_totals.update_op(bytes, latency);
     hdr_record_value(m_get_latency_histogram,latency);
+    hdr_record_value(inst_m_get_latency_histogram,latency);
 }
 
 void run_stats::update_ask_set_op(struct timeval* ts, unsigned int bytes, unsigned int latency)
@@ -212,6 +228,7 @@ void run_stats::update_ask_set_op(struct timeval* ts, unsigned int bytes, unsign
     m_cur_stats.m_set_cmd.update_ask_op(bytes, latency);
     m_totals.update_op(bytes, latency);
     hdr_record_value(m_set_latency_histogram,latency);
+    hdr_record_value(inst_m_set_latency_histogram,latency);
 }
 
 void run_stats::update_wait_op(struct timeval *ts, unsigned int latency)
@@ -221,6 +238,7 @@ void run_stats::update_wait_op(struct timeval *ts, unsigned int latency)
     m_cur_stats.m_wait_cmd.update_op(0, latency);
     m_totals.update_op(0, latency);
     hdr_record_value(m_wait_latency_histogram,latency);
+    hdr_record_value(inst_m_wait_latency_histogram,latency);
 }
 
 void run_stats::update_arbitrary_op(struct timeval *ts, unsigned int bytes,
@@ -231,7 +249,9 @@ void run_stats::update_arbitrary_op(struct timeval *ts, unsigned int bytes,
     m_totals.update_op(bytes, latency);
 
     struct hdr_histogram* hist = m_ar_commands_latency_histograms.at(request_index);
+    struct hdr_histogram* inst_hist = inst_m_ar_commands_latency_histograms.at(request_index);
     hdr_record_value(hist,latency);
+    hdr_record_value(inst_hist,latency);
 }
 
 unsigned int run_stats::get_duration(void)
@@ -828,22 +848,23 @@ void result_print_to_json(json_handler * jsonhandler, const char * type, double
             char timestamp_str[16];
             one_sec_cmd_stats cmd_stats = timeserie_stats[i];
             const unsigned int timestamp = timestamps[i];
-            const bool sec_has_samples = hdr_total_count(cmd_stats.latency_histogram)>0;
-            const double sec_avg_latency = sec_has_samples ? hdr_mean(cmd_stats.latency_histogram)/ (double) LATENCY_HDR_RESULTS_MULTIPLIER : 0.0;
-            const double sec_min_latency = has_samples ? hdr_min(cmd_stats.latency_histogram)/ (double) LATENCY_HDR_RESULTS_MULTIPLIER : 0.0;
-            const double sec_max_latency = has_samples ? hdr_max(cmd_stats.latency_histogram)/ (double) LATENCY_HDR_RESULTS_MULTIPLIER : 0.0;
+            const bool sec_has_samples = cmd_stats.m_ops > 0;
             snprintf(timestamp_str,sizeof(timestamp_str)-1,"%d", timestamp);
             jsonhandler->open_nesting(timestamp_str);
-            jsonhandler->write_obj("Count","%lld", hdr_total_count(cmd_stats.latency_histogram));
-            jsonhandler->write_obj("Average Latency","%.2f", sec_avg_latency);
-            jsonhandler->write_obj("Min Latency","%.2f", sec_min_latency);
-            jsonhandler->write_obj("Max Latency","%.2f", sec_max_latency);
-            for (std::size_t i = 0; i < quantile_list.size(); i++){
-                const float quantile = quantile_list[i];
-                char quantile_header[8];
-                snprintf(quantile_header,sizeof(quantile_header)-1,"p%.2f", quantile);
-                const double value = hdr_value_at_percentile(cmd_stats.latency_histogram, quantile )/ (double) LATENCY_HDR_RESULTS_MULTIPLIER;
-                jsonhandler->write_obj((char *)quantile_header,"%.2f", value);
+            jsonhandler->write_obj("Count","%lld", cmd_stats.m_ops);
+            if (sec_has_samples){
+                jsonhandler->write_obj("Average Latency","%.3f", cmd_stats.m_avg_latency);
+                jsonhandler->write_obj("Min Latency","%.3f", cmd_stats.m_min_latency);
+                jsonhandler->write_obj("Max Latency","%.3f", cmd_stats.m_max_latency);
+                for (std::size_t i = 0; i < quantile_list.size(); i++){
+                    if (i < cmd_stats.summarized_quantile_values.size()){
+                        const float quantile = quantile_list[i];
+                        char quantile_header[8];
+                        snprintf(quantile_header,sizeof(quantile_header)-1,"p%.2f", quantile);
+                        const double value = cmd_stats.summarized_quantile_values[i];
+                        jsonhandler->write_obj((char *)quantile_header,"%.3f", value);
+                    }
+                }
             }
             jsonhandler->close_nesting();
         }
@@ -1103,7 +1124,7 @@ void run_stats::print_kb_sec_column(output_table &table) {
     table.add_column(column);
 }
 
-void run_stats::print_json(json_handler *jsonhandler, arbitrary_command_list& command_list, bool cluster_mode, std::vector<float> quantile_list) {
+void run_stats::print_json(json_handler *jsonhandler, arbitrary_command_list& command_list, bool cluster_mode) {
     if (jsonhandler != NULL){ // Added for double verification in case someone accidently send NULL.
         jsonhandler->open_nesting("Runtime");
         const unsigned long long start_time_ms = (m_start_time.tv_sec * 1000000 + m_start_time.tv_usec)/1000;
@@ -1133,7 +1154,7 @@ void run_stats::print_json(json_handler *jsonhandler, arbitrary_command_list& co
                                  cluster_mode ? m_totals.m_ar_commands[i].m_moved_sec : -1,
                                  cluster_mode ? m_totals.m_ar_commands[i].m_ask_sec : -1,
                                  m_totals.m_ar_commands[i].m_bytes_sec,
-                                 quantile_list,
+                                 quantiles_list,
                                  arbitrary_command_latency_histogram,
                                  timestamps,
                                  arbitrary_command_stats
@@ -1149,7 +1170,7 @@ void run_stats::print_json(json_handler *jsonhandler, arbitrary_command_list& co
                              cluster_mode ? m_totals.m_set_cmd.m_moved_sec : -1,
                              cluster_mode ? m_totals.m_set_cmd.m_ask_sec : -1,
                              m_totals.m_set_cmd.m_bytes_sec,
-                             quantile_list,
+                             quantiles_list,
                              m_set_latency_histogram,
                              timestamps,
                              set_stats
@@ -1160,7 +1181,7 @@ void run_stats::print_json(json_handler *jsonhandler, arbitrary_command_list& co
                              cluster_mode ? m_totals.m_get_cmd.m_moved_sec : -1,
                              cluster_mode ? m_totals.m_get_cmd.m_ask_sec : -1,
                              m_totals.m_get_cmd.m_bytes_sec,
-                             quantile_list,
+                             quantiles_list,
                              m_get_latency_histogram,
                              timestamps,
                              get_stats
@@ -1171,7 +1192,7 @@ void run_stats::print_json(json_handler *jsonhandler, arbitrary_command_list& co
                              cluster_mode ? 0.0 : -1,
                              cluster_mode ? 0.0 : -1,
                              0.0,
-                             quantile_list,
+                             quantiles_list,
                              m_wait_latency_histogram,
                              timestamps,
                              wait_stats
@@ -1184,7 +1205,7 @@ void run_stats::print_json(json_handler *jsonhandler, arbitrary_command_list& co
                          cluster_mode ? m_totals.m_moved_sec : -1,
                          cluster_mode ? m_totals.m_ask_sec : -1,
                          m_totals.m_bytes_sec,
-                         quantile_list,
+                         quantiles_list,
                          m_totals.latency_histogram,
                          timestamps,
                          total_stats
@@ -1327,7 +1348,7 @@ void run_stats::print(FILE *out, benchmark_config *config,
             jsonhandler->open_nesting("UNKNOWN STATS");
         }
 
-        print_json(jsonhandler, *config->arbitrary_commands, config->cluster_mode, config->print_percentiles.quantile_list);
+        print_json(jsonhandler, *config->arbitrary_commands, config->cluster_mode);
     }
 
     if (!config->hide_histogram) {
diff --git a/run_stats.h b/run_stats.h
@@ -97,6 +97,7 @@ class run_stats {
     totals m_totals;
 
     std::list<one_second_stats> m_stats;
+    std::vector<float> quantiles_list;
 
     // current second stats ( appended to m_stats and reset every second )
     one_second_stats m_cur_stats;
@@ -106,6 +107,12 @@ class run_stats {
     safe_hdr_histogram m_wait_latency_histogram;
     std::vector<safe_hdr_histogram> m_ar_commands_latency_histograms;
 
+    // instantaneous command histograms ( hold the current second only; summarized into m_cur_stats and reset in roll_cur_stats )
+    safe_hdr_histogram inst_m_get_latency_histogram;
+    safe_hdr_histogram inst_m_set_latency_histogram;
+    safe_hdr_histogram inst_m_wait_latency_histogram;
+    std::vector<safe_hdr_histogram> inst_m_ar_commands_latency_histograms;
+
     void roll_cur_stats(struct timeval* ts);
 
 public:
@@ -167,7 +174,7 @@ class run_stats {
     void print_avg_latency_column(output_table &table);
     void print_quantile_latency_column(output_table &table, double quantile, char* label);
     void print_kb_sec_column(output_table &table);
-    void print_json(json_handler *jsonhandler, arbitrary_command_list& command_list, bool cluster_mode, std::vector<float> quantile_list);
+    void print_json(json_handler *jsonhandler, arbitrary_command_list& command_list, bool cluster_mode);
     void print_histogram(FILE *out, json_handler* jsonhandler, arbitrary_command_list& command_list);
     void print(FILE *file, benchmark_config *config,
                const char* header = NULL, json_handler* jsonhandler = NULL);
diff --git a/run_stats_types.cpp b/run_stats_types.cpp
@@ -33,7 +33,10 @@ one_sec_cmd_stats::one_sec_cmd_stats() :
     m_misses(0),
     m_moved(0),
     m_ask(0),
-    m_total_latency(0) {
+    m_total_latency(0),
+    m_avg_latency(0.0),
+    m_min_latency(0.0),
+    m_max_latency(0.0) {
 }
 
 
@@ -45,7 +48,10 @@ void one_sec_cmd_stats::reset() {
     m_moved = 0;
     m_ask = 0;
     m_total_latency = 0;
-    hdr_reset(latency_histogram); 
+    m_avg_latency = 0;
+    m_max_latency = 0;
+    m_min_latency = 0;
+    summarized_quantile_values.clear();
 }
 
 void one_sec_cmd_stats::merge(const one_sec_cmd_stats& other) {
@@ -56,14 +62,27 @@ void one_sec_cmd_stats::merge(const one_sec_cmd_stats& other) {
     m_moved += other.m_moved;
     m_ask += other.m_ask;
     m_total_latency += other.m_total_latency;
-    hdr_add(latency_histogram,other.latency_histogram);
+    m_avg_latency = (double) m_total_latency / (double) m_ops / (double) LATENCY_HDR_RESULTS_MULTIPLIER;
+    m_max_latency = other.m_max_latency > m_max_latency ? other.m_max_latency : m_max_latency;
+    m_min_latency = other.m_min_latency < m_min_latency ? other.m_min_latency : m_min_latency;
+}
+
+void one_sec_cmd_stats::summarize_quantiles(safe_hdr_histogram histogram, std::vector<float> quantiles) {
+    const bool has_samples = m_ops>0;
+    for (std::size_t i = 0; i < quantiles.size(); i++){
+        const float quantile = quantiles[i];
+        const double value = hdr_value_at_percentile(histogram, quantile)/ (double) LATENCY_HDR_RESULTS_MULTIPLIER;
+        summarized_quantile_values.push_back(value);
+    }
+    m_avg_latency = has_samples ? hdr_mean(histogram)/ (double) LATENCY_HDR_RESULTS_MULTIPLIER : 0.0;
+    m_max_latency = has_samples ? hdr_max(histogram)/ (double) LATENCY_HDR_RESULTS_MULTIPLIER : 0.0;
+    m_min_latency = has_samples ? hdr_min(histogram)/ (double) LATENCY_HDR_RESULTS_MULTIPLIER : 0.0;
 }
 
 void one_sec_cmd_stats::update_op(unsigned int bytes, unsigned int latency) {
     m_bytes += bytes;
     m_ops++;
     m_total_latency += latency;
-    hdr_record_value(latency_histogram,latency);
 }
 
 void one_sec_cmd_stats::update_op(unsigned int bytes, unsigned int latency,
@@ -148,7 +167,6 @@ void one_second_stats::setup_arbitrary_commands(size_t n_arbitrary_commands) {
     m_ar_commands.setup(n_arbitrary_commands);
 }
 
-
 void one_second_stats::reset(unsigned int second) {
     m_second = second;
     m_get_cmd.reset();
diff --git a/run_stats_types.h b/run_stats_types.h
@@ -82,10 +82,14 @@ class one_sec_cmd_stats {
     unsigned int m_moved;
     unsigned int m_ask;
     unsigned long long int m_total_latency;
-    safe_hdr_histogram latency_histogram;
+    std::vector<double> summarized_quantile_values;
+    double m_avg_latency;
+    double m_min_latency;
+    double m_max_latency;
     one_sec_cmd_stats();
     void reset();
     void merge(const one_sec_cmd_stats& other);
+    void summarize_quantiles(safe_hdr_histogram histogram, std::vector<float> quantiles);
     void update_op(unsigned int bytes, unsigned int latency);
     void update_op(unsigned int bytes, unsigned int latency, unsigned int hits, unsigned int misses);
     void update_moved_op(unsigned int bytes, unsigned int latency);