Commit eca20409, authored by Damien Le Moal, committed by Martin K. Petersen

scsi: block: ioprio: Clean up interface definition

The I/O priority user interface defines the 16-bit ioprio values as the
combination of the upper 3 bits for an I/O priority class and the lower
13 bits as priority data. However, the kernel only uses the lower 3 bits of
the priority data to define priority levels for the RT and BE priority
classes. The data part of an ioprio value is completely ignored for the
IDLE and NONE classes. This is enforced by checks done in
ioprio_check_cap(), which is called for all paths that allow defining an
I/O priority for I/Os: the per-context ioprio_set() system call, aio
interface and io_uring interface.

Clarify this fact in the uapi ioprio.h header file and introduce the
IOPRIO_LEVEL_MASK and IOPRIO_PRIO_LEVEL() macros for users to define
and get priority levels in an ioprio value. The coarser macro
IOPRIO_PRIO_DATA() is retained for backward compatibility with old
applications already using it. There is no functional change introduced
with this.

In-kernel users of the IOPRIO_PRIO_DATA() macro which are explicitly
handling I/O priority data as a priority level are modified to use the new
IOPRIO_PRIO_LEVEL() macro without any functional change. Since f2fs is the
only user of this macro not explicitly using that value as a priority
level, it is left unchanged.

Signed-off-by: Damien Le Moal <dlemoal@kernel.org>
Reviewed-by: Hannes Reinecke <hare@suse.de>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Niklas Cassel <niklas.cassel@wdc.com>
Link: https://lore.kernel.org/r/20230511011356.227789-2-nks@flawful.org
Signed-off-by: Martin K. Petersen <martin.petersen@oracle.com>
parent ac9a7868
...@@ -5524,16 +5524,16 @@ bfq_set_next_ioprio_data(struct bfq_queue *bfqq, struct bfq_io_cq *bic) ...@@ -5524,16 +5524,16 @@ bfq_set_next_ioprio_data(struct bfq_queue *bfqq, struct bfq_io_cq *bic)
bfqq->new_ioprio_class = task_nice_ioclass(tsk); bfqq->new_ioprio_class = task_nice_ioclass(tsk);
break; break;
case IOPRIO_CLASS_RT: case IOPRIO_CLASS_RT:
bfqq->new_ioprio = IOPRIO_PRIO_DATA(bic->ioprio); bfqq->new_ioprio = IOPRIO_PRIO_LEVEL(bic->ioprio);
bfqq->new_ioprio_class = IOPRIO_CLASS_RT; bfqq->new_ioprio_class = IOPRIO_CLASS_RT;
break; break;
case IOPRIO_CLASS_BE: case IOPRIO_CLASS_BE:
bfqq->new_ioprio = IOPRIO_PRIO_DATA(bic->ioprio); bfqq->new_ioprio = IOPRIO_PRIO_LEVEL(bic->ioprio);
bfqq->new_ioprio_class = IOPRIO_CLASS_BE; bfqq->new_ioprio_class = IOPRIO_CLASS_BE;
break; break;
case IOPRIO_CLASS_IDLE: case IOPRIO_CLASS_IDLE:
bfqq->new_ioprio_class = IOPRIO_CLASS_IDLE; bfqq->new_ioprio_class = IOPRIO_CLASS_IDLE;
bfqq->new_ioprio = 7; bfqq->new_ioprio = IOPRIO_NR_LEVELS - 1;
break; break;
} }
...@@ -5830,7 +5830,7 @@ static struct bfq_queue *bfq_get_queue(struct bfq_data *bfqd, ...@@ -5830,7 +5830,7 @@ static struct bfq_queue *bfq_get_queue(struct bfq_data *bfqd,
struct bfq_io_cq *bic, struct bfq_io_cq *bic,
bool respawn) bool respawn)
{ {
const int ioprio = IOPRIO_PRIO_DATA(bic->ioprio); const int ioprio = IOPRIO_PRIO_LEVEL(bic->ioprio);
const int ioprio_class = IOPRIO_PRIO_CLASS(bic->ioprio); const int ioprio_class = IOPRIO_PRIO_CLASS(bic->ioprio);
struct bfq_queue **async_bfqq = NULL; struct bfq_queue **async_bfqq = NULL;
struct bfq_queue *bfqq; struct bfq_queue *bfqq;
......
...@@ -33,7 +33,7 @@ ...@@ -33,7 +33,7 @@
int ioprio_check_cap(int ioprio) int ioprio_check_cap(int ioprio)
{ {
int class = IOPRIO_PRIO_CLASS(ioprio); int class = IOPRIO_PRIO_CLASS(ioprio);
int data = IOPRIO_PRIO_DATA(ioprio); int level = IOPRIO_PRIO_LEVEL(ioprio);
switch (class) { switch (class) {
case IOPRIO_CLASS_RT: case IOPRIO_CLASS_RT:
...@@ -49,13 +49,13 @@ int ioprio_check_cap(int ioprio) ...@@ -49,13 +49,13 @@ int ioprio_check_cap(int ioprio)
fallthrough; fallthrough;
/* rt has prio field too */ /* rt has prio field too */
case IOPRIO_CLASS_BE: case IOPRIO_CLASS_BE:
if (data >= IOPRIO_NR_LEVELS || data < 0) if (level >= IOPRIO_NR_LEVELS)
return -EINVAL; return -EINVAL;
break; break;
case IOPRIO_CLASS_IDLE: case IOPRIO_CLASS_IDLE:
break; break;
case IOPRIO_CLASS_NONE: case IOPRIO_CLASS_NONE:
if (data) if (level)
return -EINVAL; return -EINVAL;
break; break;
default: default:
......
...@@ -17,7 +17,7 @@ ...@@ -17,7 +17,7 @@
((data) & IOPRIO_PRIO_MASK)) ((data) & IOPRIO_PRIO_MASK))
/* /*
* These are the io priority groups as implemented by the BFQ and mq-deadline * These are the io priority classes as implemented by the BFQ and mq-deadline
* schedulers. RT is the realtime class, it always gets premium service. For * schedulers. RT is the realtime class, it always gets premium service. For
* ATA disks supporting NCQ IO priority, RT class IOs will be processed using * ATA disks supporting NCQ IO priority, RT class IOs will be processed using
* high priority NCQ commands. BE is the best-effort scheduling class, the * high priority NCQ commands. BE is the best-effort scheduling class, the
...@@ -32,11 +32,20 @@ enum { ...@@ -32,11 +32,20 @@ enum {
}; };
/* /*
* The RT and BE priority classes both support up to 8 priority levels. * The RT and BE priority classes both support up to 8 priority levels that
* can be specified using the lower 3-bits of the priority data.
*/ */
#define IOPRIO_NR_LEVELS 8 #define IOPRIO_LEVEL_NR_BITS 3
#define IOPRIO_BE_NR IOPRIO_NR_LEVELS #define IOPRIO_NR_LEVELS (1 << IOPRIO_LEVEL_NR_BITS)
#define IOPRIO_LEVEL_MASK (IOPRIO_NR_LEVELS - 1)
#define IOPRIO_PRIO_LEVEL(ioprio) ((ioprio) & IOPRIO_LEVEL_MASK)
#define IOPRIO_BE_NR IOPRIO_NR_LEVELS
/*
* Possible values for the "which" argument of the ioprio_get() and
* ioprio_set() system calls (see "man ioprio_set").
*/
enum { enum {
IOPRIO_WHO_PROCESS = 1, IOPRIO_WHO_PROCESS = 1,
IOPRIO_WHO_PGRP, IOPRIO_WHO_PGRP,
...@@ -44,7 +53,7 @@ enum { ...@@ -44,7 +53,7 @@ enum {
}; };
/* /*
* Fallback BE priority level. * Fallback BE class priority level.
*/ */
#define IOPRIO_NORM 4 #define IOPRIO_NORM 4
#define IOPRIO_BE_NORM IOPRIO_NORM #define IOPRIO_BE_NORM IOPRIO_NORM
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment