mirror of
https://git.kernel.org/pub/scm/linux/kernel/git/next/linux-next.git
synced 2025-01-01 10:42:11 +00:00
tracing: Update subbuffer with kilobytes not page order
Using page order for deciding what the size of the ring buffer sub buffers are is exposing a bit too much of the implementation. Although the sub buffers are only allocated in orders of pages, allow the user to specify the minimum size of each sub-buffer via kilobytes like they can with the buffer size itself. If the user specifies 3 via: echo 3 > buffer_subbuf_size_kb Then the sub-buffer size will round up to 4kb (on a 4kb page size system). If they specify: echo 6 > buffer_subbuf_size_kb The sub-buffer size will become 8kb. and so on. Link: https://lore.kernel.org/linux-trace-kernel/20231219185631.809766769@goodmis.org Cc: Masami Hiramatsu <mhiramat@kernel.org> Cc: Mark Rutland <mark.rutland@arm.com> Cc: Mathieu Desnoyers <mathieu.desnoyers@efficios.com> Cc: Andrew Morton <akpm@linux-foundation.org> Cc: Tzvetomir Stoyanov <tz.stoyanov@gmail.com> Cc: Vincent Donnefort <vdonnefort@google.com> Cc: Kent Overstreet <kent.overstreet@gmail.com> Signed-off-by: Steven Rostedt (Google) <rostedt@goodmis.org>
This commit is contained in:
parent
1acce70374
commit
2f84b39f48
@ -203,32 +203,26 @@ of ftrace. Here is a list of some of the key files:
|
|||||||
|
|
||||||
This displays the total combined size of all the trace buffers.
|
This displays the total combined size of all the trace buffers.
|
||||||
|
|
||||||
buffer_subbuf_order:
|
buffer_subbuf_size_kb:
|
||||||
|
|
||||||
This sets or displays the sub buffer page size order. The ring buffer
|
This sets or displays the sub buffer size. The ring buffer is broken up
|
||||||
is broken up into several same size "sub buffers". An event can not be
|
into several same size "sub buffers". An event can not be bigger than
|
||||||
bigger than the size of the sub buffer. Normally, the sub buffer is
|
the size of the sub buffer. Normally, the sub buffer is the size of the
|
||||||
the size of the architecture's page (4K on x86). The sub buffer also
|
architecture's page (4K on x86). The sub buffer also contains meta data
|
||||||
contains meta data at the start which also limits the size of an event.
|
at the start which also limits the size of an event. That means when
|
||||||
That means when the sub buffer is a page size, no event can be larger
|
the sub buffer is a page size, no event can be larger than the page
|
||||||
than the page size minus the sub buffer meta data.
|
size minus the sub buffer meta data.
|
||||||
|
|
||||||
The buffer_subbuf_order allows the user to change the size of the sub
|
Note, the buffer_subbuf_size_kb is a way for the user to specify the
|
||||||
buffer. As the sub buffer is a set of pages by the power of 2, thus
|
minimum size of the subbuffer. The kernel may make it bigger due to the
|
||||||
the sub buffer total size is defined by the order:
|
implementation details, or simply fail the operation if the kernel can
|
||||||
|
not handle the request.
|
||||||
|
|
||||||
order size
|
Changing the sub buffer size allows for events to be larger than the
|
||||||
---- ----
|
page size.
|
||||||
0 PAGE_SIZE
|
|
||||||
1 PAGE_SIZE * 2
|
|
||||||
2 PAGE_SIZE * 4
|
|
||||||
3 PAGE_SIZE * 8
|
|
||||||
|
|
||||||
Changing the order will change the sub buffer size allowing for events
|
Note: When changing the sub-buffer size, tracing is stopped and any
|
||||||
to be larger than the page size.
|
data in the ring buffer and the snapshot buffer will be discarded.
|
||||||
|
|
||||||
Note: When changing the order, tracing is stopped and any data in the
|
|
||||||
ring buffer and the snapshot buffer will be discarded.
|
|
||||||
|
|
||||||
free_buffer:
|
free_buffer:
|
||||||
|
|
||||||
|
@ -9384,42 +9384,54 @@ static const struct file_operations buffer_percent_fops = {
|
|||||||
};
|
};
|
||||||
|
|
||||||
static ssize_t
|
static ssize_t
|
||||||
buffer_order_read(struct file *filp, char __user *ubuf, size_t cnt, loff_t *ppos)
|
buffer_subbuf_size_read(struct file *filp, char __user *ubuf, size_t cnt, loff_t *ppos)
|
||||||
{
|
{
|
||||||
struct trace_array *tr = filp->private_data;
|
struct trace_array *tr = filp->private_data;
|
||||||
|
size_t size;
|
||||||
char buf[64];
|
char buf[64];
|
||||||
|
int order;
|
||||||
int r;
|
int r;
|
||||||
|
|
||||||
r = sprintf(buf, "%d\n", ring_buffer_subbuf_order_get(tr->array_buffer.buffer));
|
order = ring_buffer_subbuf_order_get(tr->array_buffer.buffer);
|
||||||
|
size = (PAGE_SIZE << order) / 1024;
|
||||||
|
|
||||||
|
r = sprintf(buf, "%zd\n", size);
|
||||||
|
|
||||||
return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
||||||
}
|
}
|
||||||
|
|
||||||
static ssize_t
|
static ssize_t
|
||||||
buffer_order_write(struct file *filp, const char __user *ubuf,
|
buffer_subbuf_size_write(struct file *filp, const char __user *ubuf,
|
||||||
size_t cnt, loff_t *ppos)
|
size_t cnt, loff_t *ppos)
|
||||||
{
|
{
|
||||||
struct trace_array *tr = filp->private_data;
|
struct trace_array *tr = filp->private_data;
|
||||||
unsigned long val;
|
unsigned long val;
|
||||||
int old_order;
|
int old_order;
|
||||||
|
int order;
|
||||||
|
int pages;
|
||||||
int ret;
|
int ret;
|
||||||
|
|
||||||
ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
|
ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
|
||||||
if (ret)
|
if (ret)
|
||||||
return ret;
|
return ret;
|
||||||
|
|
||||||
|
val *= 1024; /* value passed in is in KB */
|
||||||
|
|
||||||
|
pages = DIV_ROUND_UP(val, PAGE_SIZE);
|
||||||
|
order = fls(pages - 1);
|
||||||
|
|
||||||
/* limit between 1 and 128 system pages */
|
/* limit between 1 and 128 system pages */
|
||||||
if (val < 0 || val > 7)
|
if (order < 0 || order > 7)
|
||||||
return -EINVAL;
|
return -EINVAL;
|
||||||
|
|
||||||
/* Do not allow tracing while changing the order of the ring buffer */
|
/* Do not allow tracing while changing the order of the ring buffer */
|
||||||
tracing_stop_tr(tr);
|
tracing_stop_tr(tr);
|
||||||
|
|
||||||
old_order = ring_buffer_subbuf_order_get(tr->array_buffer.buffer);
|
old_order = ring_buffer_subbuf_order_get(tr->array_buffer.buffer);
|
||||||
if (old_order == val)
|
if (old_order == order)
|
||||||
goto out;
|
goto out;
|
||||||
|
|
||||||
ret = ring_buffer_subbuf_order_set(tr->array_buffer.buffer, val);
|
ret = ring_buffer_subbuf_order_set(tr->array_buffer.buffer, order);
|
||||||
if (ret)
|
if (ret)
|
||||||
goto out;
|
goto out;
|
||||||
|
|
||||||
@ -9428,7 +9440,7 @@ buffer_order_write(struct file *filp, const char __user *ubuf,
|
|||||||
if (!tr->allocated_snapshot)
|
if (!tr->allocated_snapshot)
|
||||||
goto out_max;
|
goto out_max;
|
||||||
|
|
||||||
ret = ring_buffer_subbuf_order_set(tr->max_buffer.buffer, val);
|
ret = ring_buffer_subbuf_order_set(tr->max_buffer.buffer, order);
|
||||||
if (ret) {
|
if (ret) {
|
||||||
/* Put back the old order */
|
/* Put back the old order */
|
||||||
cnt = ring_buffer_subbuf_order_set(tr->array_buffer.buffer, old_order);
|
cnt = ring_buffer_subbuf_order_set(tr->array_buffer.buffer, old_order);
|
||||||
@ -9460,10 +9472,10 @@ buffer_order_write(struct file *filp, const char __user *ubuf,
|
|||||||
return cnt;
|
return cnt;
|
||||||
}
|
}
|
||||||
|
|
||||||
static const struct file_operations buffer_order_fops = {
|
static const struct file_operations buffer_subbuf_size_fops = {
|
||||||
.open = tracing_open_generic_tr,
|
.open = tracing_open_generic_tr,
|
||||||
.read = buffer_order_read,
|
.read = buffer_subbuf_size_read,
|
||||||
.write = buffer_order_write,
|
.write = buffer_subbuf_size_write,
|
||||||
.release = tracing_release_generic_tr,
|
.release = tracing_release_generic_tr,
|
||||||
.llseek = default_llseek,
|
.llseek = default_llseek,
|
||||||
};
|
};
|
||||||
@ -9934,8 +9946,8 @@ init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer)
|
|||||||
trace_create_file("buffer_percent", TRACE_MODE_WRITE, d_tracer,
|
trace_create_file("buffer_percent", TRACE_MODE_WRITE, d_tracer,
|
||||||
tr, &buffer_percent_fops);
|
tr, &buffer_percent_fops);
|
||||||
|
|
||||||
trace_create_file("buffer_subbuf_order", TRACE_MODE_WRITE, d_tracer,
|
trace_create_file("buffer_subbuf_size_kb", TRACE_MODE_WRITE, d_tracer,
|
||||||
tr, &buffer_order_fops);
|
tr, &buffer_subbuf_size_fops);
|
||||||
|
|
||||||
create_trace_options_dir(tr);
|
create_trace_options_dir(tr);
|
||||||
|
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
#!/bin/sh
|
#!/bin/sh
|
||||||
# SPDX-License-Identifier: GPL-2.0
|
# SPDX-License-Identifier: GPL-2.0
|
||||||
# description: Change the ringbuffer sub-buffer order
|
# description: Change the ringbuffer sub-buffer size
|
||||||
# requires: buffer_subbuf_order
|
# requires: buffer_subbuf_size_kb
|
||||||
# flags: instance
|
# flags: instance
|
||||||
|
|
||||||
get_buffer_data_size() {
|
get_buffer_data_size() {
|
||||||
@ -52,8 +52,8 @@ write_buffer() {
|
|||||||
}
|
}
|
||||||
|
|
||||||
test_buffer() {
|
test_buffer() {
|
||||||
orde=$1
|
size_kb=$1
|
||||||
page_size=$((4096<<order))
|
page_size=$((size_kb*1024))
|
||||||
|
|
||||||
size=`get_buffer_data_size`
|
size=`get_buffer_data_size`
|
||||||
|
|
||||||
@ -82,14 +82,14 @@ test_buffer() {
|
|||||||
fi
|
fi
|
||||||
}
|
}
|
||||||
|
|
||||||
ORIG=`cat buffer_subbuf_order`
|
ORIG=`cat buffer_subbuf_size_kb`
|
||||||
|
|
||||||
# Could test bigger orders than 3, but then creating the string
|
# Could test bigger sizes than 32K, but then creating the string
|
||||||
# to write into the ring buffer takes too long
|
# to write into the ring buffer takes too long
|
||||||
for a in 0 1 2 3 ; do
|
for a in 4 8 16 32 ; do
|
||||||
echo $a > buffer_subbuf_order
|
echo $a > buffer_subbuf_size_kb
|
||||||
test_buffer $a
|
test_buffer $a
|
||||||
done
|
done
|
||||||
|
|
||||||
echo $ORIG > buffer_subbuf_order
|
echo $ORIG > buffer_subbuf_size_kb
|
||||||
|
|
Loading…
Reference in New Issue
Block a user