During changes to kfree_rcu() code, we often check the amount of free memory. As an alternative to checking this manually, this commit adds a measurement in the test itself. It measures four times during the test for available memory, digitally filters these measurements to produce a running average with a weight of 0.5, and compares this digitally filtered value with the amount of available memory at the beginning of the test. We apply the digital filter only once we are more than 25% into the test. At the 25% mark, we just read available memory and don't apply any filtering. This prevents the first sample from skewing the results as we would not consider memory readings that were before memory was allocated. A sample run shows something like: Total time taken by all kfree'ers: 6369738407 ns, loops: 10000, batches: 764, memory footprint: 216MB Signed-off-by: Joel Fernandes (Google) <joel@xxxxxxxxxxxxxxxxx> --- v1->v2: Minor corrections v1->v3: Use long long to prevent 32-bit system's overflow Handle case where some threads start later than others. Start measuring only once 25% into the test. Slightly more accurate. Cc: bristot@xxxxxxxxxx Cc: frextrite@xxxxxxxxx Cc: madhuparnabhowmik04@xxxxxxxxx Cc: urezki@xxxxxxxxx Signed-off-by: Joel Fernandes (Google) <joel@xxxxxxxxxxxxxxxxx> kernel/rcu/rcuperf.c | 23 +++++++++++++++++++++-- 1 file changed, 21 insertions(+), 2 deletions(-) diff --git a/kernel/rcu/rcuperf.c b/kernel/rcu/rcuperf.c index da94b89cd531..67e0f804ea97 100644 --- a/kernel/rcu/rcuperf.c +++ b/kernel/rcu/rcuperf.c @@ -12,6 +12,7 @@ #include <linux/types.h> #include <linux/kernel.h> #include <linux/init.h> +#include <linux/mm.h> #include <linux/module.h> #include <linux/kthread.h> #include <linux/err.h> @@ -604,6 +605,8 @@ struct kfree_obj { struct rcu_head rh; }; +long long mem_begin; + static int kfree_perf_thread(void *arg) { @@ -611,6 +614,7 @@ kfree_perf_thread(void *arg) long me = (long)arg; struct kfree_obj *alloc_ptr; u64 start_time, end_time; + long long mem_during = si_mem_available(); VERBOSE_PERFOUT_STRING("kfree_perf_thread task started"); set_cpus_allowed_ptr(current, cpumask_of(me % nr_cpu_ids)); @@ -626,6 +630,15 @@ kfree_perf_thread(void *arg) } do { + // Moving average of memory availability measurements. + // Start measuring only from when we are at least 25% into the test. + if (loop && kfree_loops > 3 && (loop % (kfree_loops / 4) == 0)) { + if (loop == (kfree_loops / 4)) + mem_during = si_mem_available(); + else + mem_during = (mem_during + si_mem_available()) / 2; + } + for (i = 0; i < kfree_alloc_num; i++) { alloc_ptr = kmalloc(sizeof(struct kfree_obj), GFP_KERNEL); if (!alloc_ptr) @@ -645,9 +658,13 @@ kfree_perf_thread(void *arg) else b_rcu_gp_test_finished = cur_ops->get_gp_seq(); - pr_alert("Total time taken by all kfree'ers: %llu ns, loops: %d, batches: %ld\n", + // The "memory footprint" field represents how much in-flight + // memory is allocated during the test and waiting to be freed. + pr_alert("Total time taken by all kfree'ers: %llu ns, loops: %d, batches: %ld, memory footprint: %lldMB\n", (unsigned long long)(end_time - start_time), kfree_loops, - rcuperf_seq_diff(b_rcu_gp_test_finished, b_rcu_gp_test_started)); + rcuperf_seq_diff(b_rcu_gp_test_finished, b_rcu_gp_test_started), + (mem_begin - mem_during) >> (20 - PAGE_SHIFT)); + if (shutdown) { smp_mb(); /* Assign before wake. */ wake_up(&shutdown_wq); @@ -719,6 +736,8 @@ kfree_perf_init(void) goto unwind; } + mem_begin = si_mem_available(); + for (i = 0; i < kfree_nrealthreads; i++) { firsterr = torture_create_kthread(kfree_perf_thread, (void *)i, kfree_reader_tasks[i]); -- 2.24.1.735.g03f4e72817-goog