Commit 13791c80 authored by John Ogness's avatar John Ogness Committed by Petr Mladek

printk: avoid prb_first_valid_seq() where possible

If message sizes average larger than expected (more than 32
characters), the data_ring will wrap before the desc_ring. Once the
data_ring wraps, it will start invalidating descriptors. These
invalid descriptors hang around until they are eventually recycled
when the desc_ring wraps. Readers do not care about invalid
descriptors, but they still need to iterate past them. If the
average message size is much larger than 32 characters, then there
will be many invalid descriptors preceding the valid descriptors.

The function prb_first_valid_seq() always begins at the oldest
descriptor and searches for the first valid descriptor. This can
be rather expensive for the above scenario. And, in fact, because
of its heavy usage in /dev/kmsg, there have been reports of long
delays and even RCU stalls.

For code that does not need to search from the oldest record,
replace prb_first_valid_seq() usage with prb_read_valid_*()
functions, which provide a start sequence number to search from.

Fixes: 896fbe20 ("printk: use the lockless ringbuffer")
Reported-by: default avatarkernel test robot <oliver.sang@intel.com>
Reported-by: default avatarJ. Avila <elavila@google.com>
Signed-off-by: default avatarJohn Ogness <john.ogness@linutronix.de>
Reviewed-by: default avatarPetr Mladek <pmladek@suse.com>
Signed-off-by: default avatarPetr Mladek <pmladek@suse.com>
Link: https://lore.kernel.org/r/20210211173152.1629-1-john.ogness@linutronix.de
parent 9bc284ca
...@@ -736,9 +736,9 @@ static ssize_t devkmsg_read(struct file *file, char __user *buf, ...@@ -736,9 +736,9 @@ static ssize_t devkmsg_read(struct file *file, char __user *buf,
logbuf_lock_irq(); logbuf_lock_irq();
} }
if (user->seq < prb_first_valid_seq(prb)) { if (r->info->seq != user->seq) {
/* our last seen message is gone, return error and reset */ /* our last seen message is gone, return error and reset */
user->seq = prb_first_valid_seq(prb); user->seq = r->info->seq;
ret = -EPIPE; ret = -EPIPE;
logbuf_unlock_irq(); logbuf_unlock_irq();
goto out; goto out;
...@@ -813,6 +813,7 @@ static loff_t devkmsg_llseek(struct file *file, loff_t offset, int whence) ...@@ -813,6 +813,7 @@ static loff_t devkmsg_llseek(struct file *file, loff_t offset, int whence)
static __poll_t devkmsg_poll(struct file *file, poll_table *wait) static __poll_t devkmsg_poll(struct file *file, poll_table *wait)
{ {
struct devkmsg_user *user = file->private_data; struct devkmsg_user *user = file->private_data;
struct printk_info info;
__poll_t ret = 0; __poll_t ret = 0;
if (!user) if (!user)
...@@ -821,9 +822,9 @@ static __poll_t devkmsg_poll(struct file *file, poll_table *wait) ...@@ -821,9 +822,9 @@ static __poll_t devkmsg_poll(struct file *file, poll_table *wait)
poll_wait(file, &log_wait, wait); poll_wait(file, &log_wait, wait);
logbuf_lock_irq(); logbuf_lock_irq();
if (prb_read_valid(prb, user->seq, NULL)) { if (prb_read_valid_info(prb, user->seq, &info, NULL)) {
/* return error when data has vanished underneath us */ /* return error when data has vanished underneath us */
if (user->seq < prb_first_valid_seq(prb)) if (info.seq != user->seq)
ret = EPOLLIN|EPOLLRDNORM|EPOLLERR|EPOLLPRI; ret = EPOLLIN|EPOLLRDNORM|EPOLLERR|EPOLLPRI;
else else
ret = EPOLLIN|EPOLLRDNORM; ret = EPOLLIN|EPOLLRDNORM;
...@@ -1560,6 +1561,7 @@ static void syslog_clear(void) ...@@ -1560,6 +1561,7 @@ static void syslog_clear(void)
int do_syslog(int type, char __user *buf, int len, int source) int do_syslog(int type, char __user *buf, int len, int source)
{ {
struct printk_info info;
bool clear = false; bool clear = false;
static int saved_console_loglevel = LOGLEVEL_DEFAULT; static int saved_console_loglevel = LOGLEVEL_DEFAULT;
int error; int error;
...@@ -1630,9 +1632,14 @@ int do_syslog(int type, char __user *buf, int len, int source) ...@@ -1630,9 +1632,14 @@ int do_syslog(int type, char __user *buf, int len, int source)
/* Number of chars in the log buffer */ /* Number of chars in the log buffer */
case SYSLOG_ACTION_SIZE_UNREAD: case SYSLOG_ACTION_SIZE_UNREAD:
logbuf_lock_irq(); logbuf_lock_irq();
if (syslog_seq < prb_first_valid_seq(prb)) { if (!prb_read_valid_info(prb, syslog_seq, &info, NULL)) {
/* No unread messages. */
logbuf_unlock_irq();
return 0;
}
if (info.seq != syslog_seq) {
/* messages are gone, move to first one */ /* messages are gone, move to first one */
syslog_seq = prb_first_valid_seq(prb); syslog_seq = info.seq;
syslog_partial = 0; syslog_partial = 0;
} }
if (source == SYSLOG_FROM_PROC) { if (source == SYSLOG_FROM_PROC) {
...@@ -1644,7 +1651,6 @@ int do_syslog(int type, char __user *buf, int len, int source) ...@@ -1644,7 +1651,6 @@ int do_syslog(int type, char __user *buf, int len, int source)
error = prb_next_seq(prb) - syslog_seq; error = prb_next_seq(prb) - syslog_seq;
} else { } else {
bool time = syslog_partial ? syslog_time : printk_time; bool time = syslog_partial ? syslog_time : printk_time;
struct printk_info info;
unsigned int line_count; unsigned int line_count;
u64 seq; u64 seq;
...@@ -3425,9 +3431,11 @@ bool kmsg_dump_get_buffer(struct kmsg_dumper *dumper, bool syslog, ...@@ -3425,9 +3431,11 @@ bool kmsg_dump_get_buffer(struct kmsg_dumper *dumper, bool syslog,
goto out; goto out;
logbuf_lock_irqsave(flags); logbuf_lock_irqsave(flags);
if (dumper->cur_seq < prb_first_valid_seq(prb)) { if (prb_read_valid_info(prb, dumper->cur_seq, &info, NULL)) {
if (info.seq != dumper->cur_seq) {
/* messages are gone, move to first available one */ /* messages are gone, move to first available one */
dumper->cur_seq = prb_first_valid_seq(prb); dumper->cur_seq = info.seq;
}
} }
/* last entry */ /* last entry */
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment