There are two approaches when changing the size of the ring buffer page: 1. Destroying all pages and allocating new pages with the new size. 2. Allocating new pages, copying the content of the old pages before destroying them. The first approach is easier, it is selected in the proposed implementation. Changing the ring buffer page size is supposed to not happen frequently. Usually, that size should be set only once, when the buffer is not in use yet and is supposed to be empty. Signed-off-by: Tzvetomir Stoyanov (VMware) <tz.stoyanov@xxxxxxxxx> --- kernel/trace/ring_buffer.c | 95 ++++++++++++++++++++++++++++++++++---- 1 file changed, 86 insertions(+), 9 deletions(-) diff --git a/kernel/trace/ring_buffer.c b/kernel/trace/ring_buffer.c index 9aa245795c3d..39be9b1cf6e0 100644 --- a/kernel/trace/ring_buffer.c +++ b/kernel/trace/ring_buffer.c @@ -368,6 +368,7 @@ static inline int test_time_stamp(u64 delta) /* Max payload is buffer page size - header (8bytes) */ #define BUF_MAX_DATA_SIZE(B) ((B)->page_size - (sizeof(u32) * 2)) +#define BUF_SYS_PAGE_COUNT(B) (((B)->page_size + BUF_PAGE_HDR_SIZE) / PAGE_SIZE) struct rb_irq_work { struct irq_work work; @@ -1521,6 +1522,7 @@ static int __rb_allocate_pages(struct ring_buffer_per_cpu *cpu_buffer, struct buffer_page *bpage, *tmp; bool user_thread = current->mm != NULL; gfp_t mflags; + int psize; long i; /* @@ -1552,6 +1554,12 @@ static int __rb_allocate_pages(struct ring_buffer_per_cpu *cpu_buffer, */ if (user_thread) set_current_oom_origin(); + + /* Buffer page size must be at least one system page */ + psize = BUF_SYS_PAGE_COUNT(cpu_buffer->buffer) - 1; + if (psize < 0) + psize = 0; + for (i = 0; i < nr_pages; i++) { struct page *page; @@ -1564,7 +1572,7 @@ static int __rb_allocate_pages(struct ring_buffer_per_cpu *cpu_buffer, list_add(&bpage->list, pages); - page = alloc_pages_node(cpu_to_node(cpu_buffer->cpu), mflags, 0); + page = alloc_pages_node(cpu_to_node(cpu_buffer->cpu), mflags, psize); if (!page) goto free_pages; bpage->page = page_address(page); @@ -1620,6 +1628,7 @@ rb_allocate_cpu_buffer(struct trace_buffer *buffer, long nr_pages, int cpu) struct ring_buffer_per_cpu *cpu_buffer; struct buffer_page *bpage; struct page *page; + int psize; int ret; cpu_buffer = kzalloc_node(ALIGN(sizeof(*cpu_buffer), cache_line_size()), @@ -1646,7 +1655,13 @@ rb_allocate_cpu_buffer(struct trace_buffer *buffer, long nr_pages, int cpu) rb_check_bpage(cpu_buffer, bpage); cpu_buffer->reader_page = bpage; - page = alloc_pages_node(cpu_to_node(cpu), GFP_KERNEL, 0); + + /* Buffer page size must be at least one system page */ + psize = BUF_SYS_PAGE_COUNT(cpu_buffer->buffer) - 1; + if (psize < 0) + psize = 0; + + page = alloc_pages_node(cpu_to_node(cpu), GFP_KERNEL, psize); if (!page) goto fail_free_reader; bpage->page = page_address(page); @@ -5412,6 +5427,7 @@ void *ring_buffer_alloc_read_page(struct trace_buffer *buffer, int cpu) struct buffer_data_page *bpage = NULL; unsigned long flags; struct page *page; + int psize; if (!cpumask_test_cpu(cpu, buffer->cpumask)) return ERR_PTR(-ENODEV); @@ -5431,8 +5447,13 @@ void *ring_buffer_alloc_read_page(struct trace_buffer *buffer, int cpu) if (bpage) goto out; + /* Buffer page size must be at least one system page */ + psize = BUF_SYS_PAGE_COUNT(cpu_buffer->buffer) - 1; + if (psize < 0) + psize = 0; + page = alloc_pages_node(cpu_to_node(cpu), - GFP_KERNEL | __GFP_NORETRY, 0); + GFP_KERNEL | __GFP_NORETRY, psize); if (!page) return ERR_PTR(-ENOMEM); @@ -5693,10 +5714,70 @@ int ring_buffer_page_size_get(struct trace_buffer *buffer) if (!buffer) return -EINVAL; - return (buffer->page_size + BUF_PAGE_HDR_SIZE) / PAGE_SIZE; + return BUF_SYS_PAGE_COUNT(buffer); } EXPORT_SYMBOL_GPL(ring_buffer_page_size_get); +static int page_size_set(struct trace_buffer *buffer, int size) +{ + struct ring_buffer_per_cpu *cpu_buffer; + int old_size = buffer->page_size; + int nr_pages; + int ret = 0; + int err; + int cpu; + + if (buffer->page_size == size) + return 0; + + /* prevent another thread from changing buffer sizes */ + mutex_lock(&buffer->mutex); + atomic_inc(&buffer->record_disabled); + + /* Make sure all commits have finished */ + synchronize_rcu(); + + buffer->page_size = size; + + for_each_buffer_cpu(buffer, cpu) { + + if (!cpumask_test_cpu(cpu, buffer->cpumask)) + continue; + + nr_pages = buffer->buffers[cpu]->nr_pages; + rb_free_cpu_buffer(buffer->buffers[cpu]); + buffer->buffers[cpu] = rb_allocate_cpu_buffer(buffer, nr_pages, cpu); + } + + atomic_dec(&buffer->record_disabled); + mutex_unlock(&buffer->mutex); + + return 0; + +out_err: + buffer->page_size = old_size; + + for_each_buffer_cpu(buffer, cpu) { + struct buffer_page *bpage, *tmp; + + cpu_buffer = buffer->buffers[cpu]; + + if (list_empty(&cpu_buffer->new_pages)) + continue; + + list_for_each_entry_safe(bpage, tmp, &cpu_buffer->new_pages, list) { + list_del_init(&bpage->list); + free_buffer_page(bpage); + } + atomic_dec(&cpu_buffer->record_disabled); + atomic_dec(&cpu_buffer->resize_disabled); + } + + mutex_unlock(&buffer->mutex); + + return err; +} + /** * ring_buffer_page_size_set - set the size of ring buffer page. * @buffer: The ring_buffer to set the new page size. @@ -5720,11 +5801,7 @@ int ring_buffer_page_size_set(struct trace_buffer *buffer, int pcount) if (psize <= BUF_PAGE_HDR_SIZE) return -EINVAL; - buffer->page_size = psize - BUF_PAGE_HDR_SIZE; - - /* Todo: reset the buffer with the new page size */ - - return 0; + return page_size_set(buffer, psize - BUF_PAGE_HDR_SIZE); } EXPORT_SYMBOL_GPL(ring_buffer_page_size_set); -- 2.31.1