Commit f70a4792 authored by Jens Axboe's avatar Jens Axboe

Merge tag 'nvme-6.8-2023-12-21' of git://git.infradead.org/nvme into for-6.8/block

Pull NVMe updates from Keith:

"nvme updates for Linux 6.8

 - nvme fabrics spec updates (Guixin, Max)
 - nvme target udpates (Guixin, Evan)
 - nvme attribute refactoring (Daniel)
 - nvme-fc numa fix (Keith)"

* tag 'nvme-6.8-2023-12-21' of git://git.infradead.org/nvme:
  nvme-fc: set numa_node after nvme_init_ctrl
  nvme-fabrics: don't check discovery ioccsz/iorcsz
  nvmet: configfs: use ctrl->instance to track passthru subsystems
  nvme: repack struct nvme_ns_head
  nvme: add csi, ms and nuse to sysfs
  nvme: rename ns attribute group
  nvme: refactor ns info setup function
  nvme: refactor ns info helpers
  nvme: move ns id info to struct nvme_ns_head
  nvmet: remove cntlid_min and cntlid_max check in nvmet_alloc_ctrl
  nvmet: allow identical cntlid_min and cntlid_max settings
  nvme-fabrics: check ioccsz and iorcsz
  nvme: introduce nvme_check_ctrl_fabric_info helper
parents 5165799f 5d51dc8d
...@@ -20,6 +20,7 @@ ...@@ -20,6 +20,7 @@
#include <linux/ptrace.h> #include <linux/ptrace.h>
#include <linux/nvme_ioctl.h> #include <linux/nvme_ioctl.h>
#include <linux/pm_qos.h> #include <linux/pm_qos.h>
#include <linux/ratelimit.h>
#include <asm/unaligned.h> #include <asm/unaligned.h>
#include "nvme.h" #include "nvme.h"
...@@ -312,12 +313,12 @@ static void nvme_log_error(struct request *req) ...@@ -312,12 +313,12 @@ static void nvme_log_error(struct request *req)
struct nvme_request *nr = nvme_req(req); struct nvme_request *nr = nvme_req(req);
if (ns) { if (ns) {
pr_err_ratelimited("%s: %s(0x%x) @ LBA %llu, %llu blocks, %s (sct 0x%x / sc 0x%x) %s%s\n", pr_err_ratelimited("%s: %s(0x%x) @ LBA %llu, %u blocks, %s (sct 0x%x / sc 0x%x) %s%s\n",
ns->disk ? ns->disk->disk_name : "?", ns->disk ? ns->disk->disk_name : "?",
nvme_get_opcode_str(nr->cmd->common.opcode), nvme_get_opcode_str(nr->cmd->common.opcode),
nr->cmd->common.opcode, nr->cmd->common.opcode,
(unsigned long long)nvme_sect_to_lba(ns, blk_rq_pos(req)), nvme_sect_to_lba(ns->head, blk_rq_pos(req)),
(unsigned long long)blk_rq_bytes(req) >> ns->lba_shift, blk_rq_bytes(req) >> ns->head->lba_shift,
nvme_get_error_status_str(nr->status), nvme_get_error_status_str(nr->status),
nr->status >> 8 & 7, /* Status Code Type */ nr->status >> 8 & 7, /* Status Code Type */
nr->status & 0xff, /* Status Code */ nr->status & 0xff, /* Status Code */
...@@ -372,9 +373,12 @@ static inline enum nvme_disposition nvme_decide_disposition(struct request *req) ...@@ -372,9 +373,12 @@ static inline enum nvme_disposition nvme_decide_disposition(struct request *req)
static inline void nvme_end_req_zoned(struct request *req) static inline void nvme_end_req_zoned(struct request *req)
{ {
if (IS_ENABLED(CONFIG_BLK_DEV_ZONED) && if (IS_ENABLED(CONFIG_BLK_DEV_ZONED) &&
req_op(req) == REQ_OP_ZONE_APPEND) req_op(req) == REQ_OP_ZONE_APPEND) {
req->__sector = nvme_lba_to_sect(req->q->queuedata, struct nvme_ns *ns = req->q->queuedata;
req->__sector = nvme_lba_to_sect(ns->head,
le64_to_cpu(nvme_req(req)->result.u64)); le64_to_cpu(nvme_req(req)->result.u64));
}
} }
static inline void nvme_end_req(struct request *req) static inline void nvme_end_req(struct request *req)
...@@ -791,8 +795,8 @@ static blk_status_t nvme_setup_discard(struct nvme_ns *ns, struct request *req, ...@@ -791,8 +795,8 @@ static blk_status_t nvme_setup_discard(struct nvme_ns *ns, struct request *req,
} }
if (queue_max_discard_segments(req->q) == 1) { if (queue_max_discard_segments(req->q) == 1) {
u64 slba = nvme_sect_to_lba(ns, blk_rq_pos(req)); u64 slba = nvme_sect_to_lba(ns->head, blk_rq_pos(req));
u32 nlb = blk_rq_sectors(req) >> (ns->lba_shift - 9); u32 nlb = blk_rq_sectors(req) >> (ns->head->lba_shift - 9);
range[0].cattr = cpu_to_le32(0); range[0].cattr = cpu_to_le32(0);
range[0].nlb = cpu_to_le32(nlb); range[0].nlb = cpu_to_le32(nlb);
...@@ -800,8 +804,9 @@ static blk_status_t nvme_setup_discard(struct nvme_ns *ns, struct request *req, ...@@ -800,8 +804,9 @@ static blk_status_t nvme_setup_discard(struct nvme_ns *ns, struct request *req,
n = 1; n = 1;
} else { } else {
__rq_for_each_bio(bio, req) { __rq_for_each_bio(bio, req) {
u64 slba = nvme_sect_to_lba(ns, bio->bi_iter.bi_sector); u64 slba = nvme_sect_to_lba(ns->head,
u32 nlb = bio->bi_iter.bi_size >> ns->lba_shift; bio->bi_iter.bi_sector);
u32 nlb = bio->bi_iter.bi_size >> ns->head->lba_shift;
if (n < segments) { if (n < segments) {
range[n].cattr = cpu_to_le32(0); range[n].cattr = cpu_to_le32(0);
...@@ -839,7 +844,7 @@ static void nvme_set_ref_tag(struct nvme_ns *ns, struct nvme_command *cmnd, ...@@ -839,7 +844,7 @@ static void nvme_set_ref_tag(struct nvme_ns *ns, struct nvme_command *cmnd,
u64 ref48; u64 ref48;
/* both rw and write zeroes share the same reftag format */ /* both rw and write zeroes share the same reftag format */
switch (ns->guard_type) { switch (ns->head->guard_type) {
case NVME_NVM_NS_16B_GUARD: case NVME_NVM_NS_16B_GUARD:
cmnd->rw.reftag = cpu_to_le32(t10_pi_ref_tag(req)); cmnd->rw.reftag = cpu_to_le32(t10_pi_ref_tag(req));
break; break;
...@@ -867,17 +872,18 @@ static inline blk_status_t nvme_setup_write_zeroes(struct nvme_ns *ns, ...@@ -867,17 +872,18 @@ static inline blk_status_t nvme_setup_write_zeroes(struct nvme_ns *ns,
cmnd->write_zeroes.opcode = nvme_cmd_write_zeroes; cmnd->write_zeroes.opcode = nvme_cmd_write_zeroes;
cmnd->write_zeroes.nsid = cpu_to_le32(ns->head->ns_id); cmnd->write_zeroes.nsid = cpu_to_le32(ns->head->ns_id);
cmnd->write_zeroes.slba = cmnd->write_zeroes.slba =
cpu_to_le64(nvme_sect_to_lba(ns, blk_rq_pos(req))); cpu_to_le64(nvme_sect_to_lba(ns->head, blk_rq_pos(req)));
cmnd->write_zeroes.length = cmnd->write_zeroes.length =
cpu_to_le16((blk_rq_bytes(req) >> ns->lba_shift) - 1); cpu_to_le16((blk_rq_bytes(req) >> ns->head->lba_shift) - 1);
if (!(req->cmd_flags & REQ_NOUNMAP) && (ns->features & NVME_NS_DEAC)) if (!(req->cmd_flags & REQ_NOUNMAP) &&
(ns->head->features & NVME_NS_DEAC))
cmnd->write_zeroes.control |= cpu_to_le16(NVME_WZ_DEAC); cmnd->write_zeroes.control |= cpu_to_le16(NVME_WZ_DEAC);
if (nvme_ns_has_pi(ns)) { if (nvme_ns_has_pi(ns->head)) {
cmnd->write_zeroes.control |= cpu_to_le16(NVME_RW_PRINFO_PRACT); cmnd->write_zeroes.control |= cpu_to_le16(NVME_RW_PRINFO_PRACT);
switch (ns->pi_type) { switch (ns->head->pi_type) {
case NVME_NS_DPS_PI_TYPE1: case NVME_NS_DPS_PI_TYPE1:
case NVME_NS_DPS_PI_TYPE2: case NVME_NS_DPS_PI_TYPE2:
nvme_set_ref_tag(ns, cmnd, req); nvme_set_ref_tag(ns, cmnd, req);
...@@ -909,13 +915,15 @@ static inline blk_status_t nvme_setup_rw(struct nvme_ns *ns, ...@@ -909,13 +915,15 @@ static inline blk_status_t nvme_setup_rw(struct nvme_ns *ns,
cmnd->rw.cdw2 = 0; cmnd->rw.cdw2 = 0;
cmnd->rw.cdw3 = 0; cmnd->rw.cdw3 = 0;
cmnd->rw.metadata = 0; cmnd->rw.metadata = 0;
cmnd->rw.slba = cpu_to_le64(nvme_sect_to_lba(ns, blk_rq_pos(req))); cmnd->rw.slba =
cmnd->rw.length = cpu_to_le16((blk_rq_bytes(req) >> ns->lba_shift) - 1); cpu_to_le64(nvme_sect_to_lba(ns->head, blk_rq_pos(req)));
cmnd->rw.length =
cpu_to_le16((blk_rq_bytes(req) >> ns->head->lba_shift) - 1);
cmnd->rw.reftag = 0; cmnd->rw.reftag = 0;
cmnd->rw.apptag = 0; cmnd->rw.apptag = 0;
cmnd->rw.appmask = 0; cmnd->rw.appmask = 0;
if (ns->ms) { if (ns->head->ms) {
/* /*
* If formated with metadata, the block layer always provides a * If formated with metadata, the block layer always provides a
* metadata buffer if CONFIG_BLK_DEV_INTEGRITY is enabled. Else * metadata buffer if CONFIG_BLK_DEV_INTEGRITY is enabled. Else
...@@ -923,12 +931,12 @@ static inline blk_status_t nvme_setup_rw(struct nvme_ns *ns, ...@@ -923,12 +931,12 @@ static inline blk_status_t nvme_setup_rw(struct nvme_ns *ns,
* namespace capacity to zero to prevent any I/O. * namespace capacity to zero to prevent any I/O.
*/ */
if (!blk_integrity_rq(req)) { if (!blk_integrity_rq(req)) {
if (WARN_ON_ONCE(!nvme_ns_has_pi(ns))) if (WARN_ON_ONCE(!nvme_ns_has_pi(ns->head)))
return BLK_STS_NOTSUPP; return BLK_STS_NOTSUPP;
control |= NVME_RW_PRINFO_PRACT; control |= NVME_RW_PRINFO_PRACT;
} }
switch (ns->pi_type) { switch (ns->head->pi_type) {
case NVME_NS_DPS_PI_TYPE3: case NVME_NS_DPS_PI_TYPE3:
control |= NVME_RW_PRINFO_PRCHK_GUARD; control |= NVME_RW_PRINFO_PRCHK_GUARD;
break; break;
...@@ -1442,7 +1450,7 @@ static int nvme_identify_ns_descs(struct nvme_ctrl *ctrl, ...@@ -1442,7 +1450,7 @@ static int nvme_identify_ns_descs(struct nvme_ctrl *ctrl,
return status; return status;
} }
static int nvme_identify_ns(struct nvme_ctrl *ctrl, unsigned nsid, int nvme_identify_ns(struct nvme_ctrl *ctrl, unsigned nsid,
struct nvme_id_ns **id) struct nvme_id_ns **id)
{ {
struct nvme_command c = { }; struct nvme_command c = { };
...@@ -1658,14 +1666,14 @@ int nvme_getgeo(struct block_device *bdev, struct hd_geometry *geo) ...@@ -1658,14 +1666,14 @@ int nvme_getgeo(struct block_device *bdev, struct hd_geometry *geo)
} }
#ifdef CONFIG_BLK_DEV_INTEGRITY #ifdef CONFIG_BLK_DEV_INTEGRITY
static void nvme_init_integrity(struct gendisk *disk, struct nvme_ns *ns, static void nvme_init_integrity(struct gendisk *disk,
u32 max_integrity_segments) struct nvme_ns_head *head, u32 max_integrity_segments)
{ {
struct blk_integrity integrity = { }; struct blk_integrity integrity = { };
switch (ns->pi_type) { switch (head->pi_type) {
case NVME_NS_DPS_PI_TYPE3: case NVME_NS_DPS_PI_TYPE3:
switch (ns->guard_type) { switch (head->guard_type) {
case NVME_NVM_NS_16B_GUARD: case NVME_NVM_NS_16B_GUARD:
integrity.profile = &t10_pi_type3_crc; integrity.profile = &t10_pi_type3_crc;
integrity.tag_size = sizeof(u16) + sizeof(u32); integrity.tag_size = sizeof(u16) + sizeof(u32);
...@@ -1683,7 +1691,7 @@ static void nvme_init_integrity(struct gendisk *disk, struct nvme_ns *ns, ...@@ -1683,7 +1691,7 @@ static void nvme_init_integrity(struct gendisk *disk, struct nvme_ns *ns,
break; break;
case NVME_NS_DPS_PI_TYPE1: case NVME_NS_DPS_PI_TYPE1:
case NVME_NS_DPS_PI_TYPE2: case NVME_NS_DPS_PI_TYPE2:
switch (ns->guard_type) { switch (head->guard_type) {
case NVME_NVM_NS_16B_GUARD: case NVME_NVM_NS_16B_GUARD:
integrity.profile = &t10_pi_type1_crc; integrity.profile = &t10_pi_type1_crc;
integrity.tag_size = sizeof(u16); integrity.tag_size = sizeof(u16);
...@@ -1704,25 +1712,26 @@ static void nvme_init_integrity(struct gendisk *disk, struct nvme_ns *ns, ...@@ -1704,25 +1712,26 @@ static void nvme_init_integrity(struct gendisk *disk, struct nvme_ns *ns,
break; break;
} }
integrity.tuple_size = ns->ms; integrity.tuple_size = head->ms;
blk_integrity_register(disk, &integrity); blk_integrity_register(disk, &integrity);
blk_queue_max_integrity_segments(disk->queue, max_integrity_segments); blk_queue_max_integrity_segments(disk->queue, max_integrity_segments);
} }
#else #else
static void nvme_init_integrity(struct gendisk *disk, struct nvme_ns *ns, static void nvme_init_integrity(struct gendisk *disk,
u32 max_integrity_segments) struct nvme_ns_head *head, u32 max_integrity_segments)
{ {
} }
#endif /* CONFIG_BLK_DEV_INTEGRITY */ #endif /* CONFIG_BLK_DEV_INTEGRITY */
static void nvme_config_discard(struct gendisk *disk, struct nvme_ns *ns) static void nvme_config_discard(struct nvme_ctrl *ctrl, struct gendisk *disk,
struct nvme_ns_head *head)
{ {
struct nvme_ctrl *ctrl = ns->ctrl;
struct request_queue *queue = disk->queue; struct request_queue *queue = disk->queue;
u32 size = queue_logical_block_size(queue); u32 size = queue_logical_block_size(queue);
if (ctrl->dmrsl && ctrl->dmrsl <= nvme_sect_to_lba(ns, UINT_MAX)) if (ctrl->dmrsl && ctrl->dmrsl <= nvme_sect_to_lba(head, UINT_MAX))
ctrl->max_discard_sectors = nvme_lba_to_sect(ns, ctrl->dmrsl); ctrl->max_discard_sectors =
nvme_lba_to_sect(head, ctrl->dmrsl);
if (ctrl->max_discard_sectors == 0) { if (ctrl->max_discard_sectors == 0) {
blk_queue_max_discard_sectors(queue, 0); blk_queue_max_discard_sectors(queue, 0);
...@@ -1753,21 +1762,21 @@ static bool nvme_ns_ids_equal(struct nvme_ns_ids *a, struct nvme_ns_ids *b) ...@@ -1753,21 +1762,21 @@ static bool nvme_ns_ids_equal(struct nvme_ns_ids *a, struct nvme_ns_ids *b)
a->csi == b->csi; a->csi == b->csi;
} }
static int nvme_init_ms(struct nvme_ns *ns, struct nvme_id_ns *id) static int nvme_init_ms(struct nvme_ctrl *ctrl, struct nvme_ns_head *head,
struct nvme_id_ns *id)
{ {
bool first = id->dps & NVME_NS_DPS_PI_FIRST; bool first = id->dps & NVME_NS_DPS_PI_FIRST;
unsigned lbaf = nvme_lbaf_index(id->flbas); unsigned lbaf = nvme_lbaf_index(id->flbas);
struct nvme_ctrl *ctrl = ns->ctrl;
struct nvme_command c = { }; struct nvme_command c = { };
struct nvme_id_ns_nvm *nvm; struct nvme_id_ns_nvm *nvm;
int ret = 0; int ret = 0;
u32 elbaf; u32 elbaf;
ns->pi_size = 0; head->pi_size = 0;
ns->ms = le16_to_cpu(id->lbaf[lbaf].ms); head->ms = le16_to_cpu(id->lbaf[lbaf].ms);
if (!(ctrl->ctratt & NVME_CTRL_ATTR_ELBAS)) { if (!(ctrl->ctratt & NVME_CTRL_ATTR_ELBAS)) {
ns->pi_size = sizeof(struct t10_pi_tuple); head->pi_size = sizeof(struct t10_pi_tuple);
ns->guard_type = NVME_NVM_NS_16B_GUARD; head->guard_type = NVME_NVM_NS_16B_GUARD;
goto set_pi; goto set_pi;
} }
...@@ -1776,11 +1785,11 @@ static int nvme_init_ms(struct nvme_ns *ns, struct nvme_id_ns *id) ...@@ -1776,11 +1785,11 @@ static int nvme_init_ms(struct nvme_ns *ns, struct nvme_id_ns *id)
return -ENOMEM; return -ENOMEM;
c.identify.opcode = nvme_admin_identify; c.identify.opcode = nvme_admin_identify;
c.identify.nsid = cpu_to_le32(ns->head->ns_id); c.identify.nsid = cpu_to_le32(head->ns_id);
c.identify.cns = NVME_ID_CNS_CS_NS; c.identify.cns = NVME_ID_CNS_CS_NS;
c.identify.csi = NVME_CSI_NVM; c.identify.csi = NVME_CSI_NVM;
ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, &c, nvm, sizeof(*nvm)); ret = nvme_submit_sync_cmd(ctrl->admin_q, &c, nvm, sizeof(*nvm));
if (ret) if (ret)
goto free_data; goto free_data;
...@@ -1790,13 +1799,13 @@ static int nvme_init_ms(struct nvme_ns *ns, struct nvme_id_ns *id) ...@@ -1790,13 +1799,13 @@ static int nvme_init_ms(struct nvme_ns *ns, struct nvme_id_ns *id)
if (nvme_elbaf_sts(elbaf)) if (nvme_elbaf_sts(elbaf))
goto free_data; goto free_data;
ns->guard_type = nvme_elbaf_guard_type(elbaf); head->guard_type = nvme_elbaf_guard_type(elbaf);
switch (ns->guard_type) { switch (head->guard_type) {
case NVME_NVM_NS_64B_GUARD: case NVME_NVM_NS_64B_GUARD:
ns->pi_size = sizeof(struct crc64_pi_tuple); head->pi_size = sizeof(struct crc64_pi_tuple);
break; break;
case NVME_NVM_NS_16B_GUARD: case NVME_NVM_NS_16B_GUARD:
ns->pi_size = sizeof(struct t10_pi_tuple); head->pi_size = sizeof(struct t10_pi_tuple);
break; break;
default: default:
break; break;
...@@ -1805,25 +1814,25 @@ static int nvme_init_ms(struct nvme_ns *ns, struct nvme_id_ns *id) ...@@ -1805,25 +1814,25 @@ static int nvme_init_ms(struct nvme_ns *ns, struct nvme_id_ns *id)
free_data: free_data:
kfree(nvm); kfree(nvm);
set_pi: set_pi:
if (ns->pi_size && (first || ns->ms == ns->pi_size)) if (head->pi_size && (first || head->ms == head->pi_size))
ns->pi_type = id->dps & NVME_NS_DPS_PI_MASK; head->pi_type = id->dps & NVME_NS_DPS_PI_MASK;
else else
ns->pi_type = 0; head->pi_type = 0;
return ret; return ret;
} }
static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id) static int nvme_configure_metadata(struct nvme_ctrl *ctrl,
struct nvme_ns_head *head, struct nvme_id_ns *id)
{ {
struct nvme_ctrl *ctrl = ns->ctrl;
int ret; int ret;
ret = nvme_init_ms(ns, id); ret = nvme_init_ms(ctrl, head, id);
if (ret) if (ret)
return ret; return ret;
ns->features &= ~(NVME_NS_METADATA_SUPPORTED | NVME_NS_EXT_LBAS); head->features &= ~(NVME_NS_METADATA_SUPPORTED | NVME_NS_EXT_LBAS);
if (!ns->ms || !(ctrl->ops->flags & NVME_F_METADATA_SUPPORTED)) if (!head->ms || !(ctrl->ops->flags & NVME_F_METADATA_SUPPORTED))
return 0; return 0;
if (ctrl->ops->flags & NVME_F_FABRICS) { if (ctrl->ops->flags & NVME_F_FABRICS) {
...@@ -1835,7 +1844,7 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id) ...@@ -1835,7 +1844,7 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id)
if (WARN_ON_ONCE(!(id->flbas & NVME_NS_FLBAS_META_EXT))) if (WARN_ON_ONCE(!(id->flbas & NVME_NS_FLBAS_META_EXT)))
return 0; return 0;
ns->features |= NVME_NS_EXT_LBAS; head->features |= NVME_NS_EXT_LBAS;
/* /*
* The current fabrics transport drivers support namespace * The current fabrics transport drivers support namespace
...@@ -1846,8 +1855,8 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id) ...@@ -1846,8 +1855,8 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id)
* Note, this check will need to be modified if any drivers * Note, this check will need to be modified if any drivers
* gain the ability to use other metadata formats. * gain the ability to use other metadata formats.
*/ */
if (ctrl->max_integrity_segments && nvme_ns_has_pi(ns)) if (ctrl->max_integrity_segments && nvme_ns_has_pi(head))
ns->features |= NVME_NS_METADATA_SUPPORTED; head->features |= NVME_NS_METADATA_SUPPORTED;
} else { } else {
/* /*
* For PCIe controllers, we can't easily remap the separate * For PCIe controllers, we can't easily remap the separate
...@@ -1856,9 +1865,9 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id) ...@@ -1856,9 +1865,9 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id)
* We allow extended LBAs for the passthrough interface, though. * We allow extended LBAs for the passthrough interface, though.
*/ */
if (id->flbas & NVME_NS_FLBAS_META_EXT) if (id->flbas & NVME_NS_FLBAS_META_EXT)
ns->features |= NVME_NS_EXT_LBAS; head->features |= NVME_NS_EXT_LBAS;
else else
ns->features |= NVME_NS_METADATA_SUPPORTED; head->features |= NVME_NS_METADATA_SUPPORTED;
} }
return 0; return 0;
} }
...@@ -1881,18 +1890,18 @@ static void nvme_set_queue_limits(struct nvme_ctrl *ctrl, ...@@ -1881,18 +1890,18 @@ static void nvme_set_queue_limits(struct nvme_ctrl *ctrl,
blk_queue_write_cache(q, vwc, vwc); blk_queue_write_cache(q, vwc, vwc);
} }
static void nvme_update_disk_info(struct gendisk *disk, static void nvme_update_disk_info(struct nvme_ctrl *ctrl, struct gendisk *disk,
struct nvme_ns *ns, struct nvme_id_ns *id) struct nvme_ns_head *head, struct nvme_id_ns *id)
{ {
sector_t capacity = nvme_lba_to_sect(ns, le64_to_cpu(id->nsze)); sector_t capacity = nvme_lba_to_sect(head, le64_to_cpu(id->nsze));
u32 bs = 1U << ns->lba_shift; u32 bs = 1U << head->lba_shift;
u32 atomic_bs, phys_bs, io_opt = 0; u32 atomic_bs, phys_bs, io_opt = 0;
/* /*
* The block layer can't support LBA sizes larger than the page size * The block layer can't support LBA sizes larger than the page size
* yet, so catch this early and don't allow block I/O. * yet, so catch this early and don't allow block I/O.
*/ */
if (ns->lba_shift > PAGE_SHIFT) { if (head->lba_shift > PAGE_SHIFT) {
capacity = 0; capacity = 0;
bs = (1 << 9); bs = (1 << 9);
} }
...@@ -1909,7 +1918,7 @@ static void nvme_update_disk_info(struct gendisk *disk, ...@@ -1909,7 +1918,7 @@ static void nvme_update_disk_info(struct gendisk *disk,
if (id->nsfeat & NVME_NS_FEAT_ATOMICS && id->nawupf) if (id->nsfeat & NVME_NS_FEAT_ATOMICS && id->nawupf)
atomic_bs = (1 + le16_to_cpu(id->nawupf)) * bs; atomic_bs = (1 + le16_to_cpu(id->nawupf)) * bs;
else else
atomic_bs = (1 + ns->ctrl->subsys->awupf) * bs; atomic_bs = (1 + ctrl->subsys->awupf) * bs;
} }
if (id->nsfeat & NVME_NS_FEAT_IO_OPT) { if (id->nsfeat & NVME_NS_FEAT_IO_OPT) {
...@@ -1935,20 +1944,20 @@ static void nvme_update_disk_info(struct gendisk *disk, ...@@ -1935,20 +1944,20 @@ static void nvme_update_disk_info(struct gendisk *disk,
* I/O to namespaces with metadata except when the namespace supports * I/O to namespaces with metadata except when the namespace supports
* PI, as it can strip/insert in that case. * PI, as it can strip/insert in that case.
*/ */
if (ns->ms) { if (head->ms) {
if (IS_ENABLED(CONFIG_BLK_DEV_INTEGRITY) && if (IS_ENABLED(CONFIG_BLK_DEV_INTEGRITY) &&
(ns->features & NVME_NS_METADATA_SUPPORTED)) (head->features & NVME_NS_METADATA_SUPPORTED))
nvme_init_integrity(disk, ns, nvme_init_integrity(disk, head,
ns->ctrl->max_integrity_segments); ctrl->max_integrity_segments);
else if (!nvme_ns_has_pi(ns)) else if (!nvme_ns_has_pi(head))
capacity = 0; capacity = 0;
} }
set_capacity_and_notify(disk, capacity); set_capacity_and_notify(disk, capacity);
nvme_config_discard(disk, ns); nvme_config_discard(ctrl, disk, head);
blk_queue_max_write_zeroes_sectors(disk->queue, blk_queue_max_write_zeroes_sectors(disk->queue,
ns->ctrl->max_zeroes_sectors); ctrl->max_zeroes_sectors);
} }
static bool nvme_ns_is_readonly(struct nvme_ns *ns, struct nvme_ns_info *info) static bool nvme_ns_is_readonly(struct nvme_ns *ns, struct nvme_ns_info *info)
...@@ -1971,7 +1980,7 @@ static void nvme_set_chunk_sectors(struct nvme_ns *ns, struct nvme_id_ns *id) ...@@ -1971,7 +1980,7 @@ static void nvme_set_chunk_sectors(struct nvme_ns *ns, struct nvme_id_ns *id)
is_power_of_2(ctrl->max_hw_sectors)) is_power_of_2(ctrl->max_hw_sectors))
iob = ctrl->max_hw_sectors; iob = ctrl->max_hw_sectors;
else else
iob = nvme_lba_to_sect(ns, le16_to_cpu(id->noiob)); iob = nvme_lba_to_sect(ns->head, le16_to_cpu(id->noiob));
if (!iob) if (!iob)
return; return;
...@@ -2031,16 +2040,17 @@ static int nvme_update_ns_info_block(struct nvme_ns *ns, ...@@ -2031,16 +2040,17 @@ static int nvme_update_ns_info_block(struct nvme_ns *ns,
blk_mq_freeze_queue(ns->disk->queue); blk_mq_freeze_queue(ns->disk->queue);
lbaf = nvme_lbaf_index(id->flbas); lbaf = nvme_lbaf_index(id->flbas);
ns->lba_shift = id->lbaf[lbaf].ds; ns->head->lba_shift = id->lbaf[lbaf].ds;
ns->head->nuse = le64_to_cpu(id->nuse);
nvme_set_queue_limits(ns->ctrl, ns->queue); nvme_set_queue_limits(ns->ctrl, ns->queue);
ret = nvme_configure_metadata(ns, id); ret = nvme_configure_metadata(ns->ctrl, ns->head, id);
if (ret < 0) { if (ret < 0) {
blk_mq_unfreeze_queue(ns->disk->queue); blk_mq_unfreeze_queue(ns->disk->queue);
goto out; goto out;
} }
nvme_set_chunk_sectors(ns, id); nvme_set_chunk_sectors(ns, id);
nvme_update_disk_info(ns->disk, ns, id); nvme_update_disk_info(ns->ctrl, ns->disk, ns->head, id);
if (ns->head->ids.csi == NVME_CSI_ZNS) { if (ns->head->ids.csi == NVME_CSI_ZNS) {
ret = nvme_update_zone_info(ns, lbaf); ret = nvme_update_zone_info(ns, lbaf);
...@@ -2057,7 +2067,7 @@ static int nvme_update_ns_info_block(struct nvme_ns *ns, ...@@ -2057,7 +2067,7 @@ static int nvme_update_ns_info_block(struct nvme_ns *ns,
* do not return zeroes. * do not return zeroes.
*/ */
if ((id->dlfeat & 0x7) == 0x1 && (id->dlfeat & (1 << 3))) if ((id->dlfeat & 0x7) == 0x1 && (id->dlfeat & (1 << 3)))
ns->features |= NVME_NS_DEAC; ns->head->features |= NVME_NS_DEAC;
set_disk_ro(ns->disk, nvme_ns_is_readonly(ns, info)); set_disk_ro(ns->disk, nvme_ns_is_readonly(ns, info));
set_bit(NVME_NS_READY, &ns->flags); set_bit(NVME_NS_READY, &ns->flags);
blk_mq_unfreeze_queue(ns->disk->queue); blk_mq_unfreeze_queue(ns->disk->queue);
...@@ -2070,7 +2080,7 @@ static int nvme_update_ns_info_block(struct nvme_ns *ns, ...@@ -2070,7 +2080,7 @@ static int nvme_update_ns_info_block(struct nvme_ns *ns,
if (nvme_ns_head_multipath(ns->head)) { if (nvme_ns_head_multipath(ns->head)) {
blk_mq_freeze_queue(ns->head->disk->queue); blk_mq_freeze_queue(ns->head->disk->queue);
nvme_update_disk_info(ns->head->disk, ns, id); nvme_update_disk_info(ns->ctrl, ns->head->disk, ns->head, id);
set_disk_ro(ns->head->disk, nvme_ns_is_readonly(ns, info)); set_disk_ro(ns->head->disk, nvme_ns_is_readonly(ns, info));
nvme_mpath_revalidate_paths(ns); nvme_mpath_revalidate_paths(ns);
blk_stack_limits(&ns->head->disk->queue->limits, blk_stack_limits(&ns->head->disk->queue->limits,
...@@ -3003,6 +3013,42 @@ static int nvme_init_effects(struct nvme_ctrl *ctrl, struct nvme_id_ctrl *id) ...@@ -3003,6 +3013,42 @@ static int nvme_init_effects(struct nvme_ctrl *ctrl, struct nvme_id_ctrl *id)
return 0; return 0;
} }
static int nvme_check_ctrl_fabric_info(struct nvme_ctrl *ctrl, struct nvme_id_ctrl *id)
{
/*
* In fabrics we need to verify the cntlid matches the
* admin connect
*/
if (ctrl->cntlid != le16_to_cpu(id->cntlid)) {
dev_err(ctrl->device,
"Mismatching cntlid: Connect %u vs Identify %u, rejecting\n",
ctrl->cntlid, le16_to_cpu(id->cntlid));
return -EINVAL;
}
if (!nvme_discovery_ctrl(ctrl) && !ctrl->kas) {
dev_err(ctrl->device,
"keep-alive support is mandatory for fabrics\n");
return -EINVAL;
}
if (!nvme_discovery_ctrl(ctrl) && ctrl->ioccsz < 4) {
dev_err(ctrl->device,
"I/O queue command capsule supported size %d < 4\n",
ctrl->ioccsz);
return -EINVAL;
}
if (!nvme_discovery_ctrl(ctrl) && ctrl->iorcsz < 1) {
dev_err(ctrl->device,
"I/O queue response capsule supported size %d < 1\n",
ctrl->iorcsz);
return -EINVAL;
}
return 0;
}
static int nvme_init_identify(struct nvme_ctrl *ctrl) static int nvme_init_identify(struct nvme_ctrl *ctrl)
{ {
struct nvme_id_ctrl *id; struct nvme_id_ctrl *id;
...@@ -3115,25 +3161,9 @@ static int nvme_init_identify(struct nvme_ctrl *ctrl) ...@@ -3115,25 +3161,9 @@ static int nvme_init_identify(struct nvme_ctrl *ctrl)
ctrl->iorcsz = le32_to_cpu(id->iorcsz); ctrl->iorcsz = le32_to_cpu(id->iorcsz);
ctrl->maxcmd = le16_to_cpu(id->maxcmd); ctrl->maxcmd = le16_to_cpu(id->maxcmd);
/* ret = nvme_check_ctrl_fabric_info(ctrl, id);
* In fabrics we need to verify the cntlid matches the if (ret)
* admin connect
*/
if (ctrl->cntlid != le16_to_cpu(id->cntlid)) {
dev_err(ctrl->device,
"Mismatching cntlid: Connect %u vs Identify "
"%u, rejecting\n",
ctrl->cntlid, le16_to_cpu(id->cntlid));
ret = -EINVAL;
goto out_free;
}
if (!nvme_discovery_ctrl(ctrl) && !ctrl->kas) {
dev_err(ctrl->device,
"keep-alive support is mandatory for fabrics\n");
ret = -EINVAL;
goto out_free; goto out_free;
}
} else { } else {
ctrl->hmpre = le32_to_cpu(id->hmpre); ctrl->hmpre = le32_to_cpu(id->hmpre);
ctrl->hmmin = le32_to_cpu(id->hmmin); ctrl->hmmin = le32_to_cpu(id->hmmin);
...@@ -3392,6 +3422,8 @@ static struct nvme_ns_head *nvme_alloc_ns_head(struct nvme_ctrl *ctrl, ...@@ -3392,6 +3422,8 @@ static struct nvme_ns_head *nvme_alloc_ns_head(struct nvme_ctrl *ctrl,
head->ns_id = info->nsid; head->ns_id = info->nsid;
head->ids = info->ids; head->ids = info->ids;
head->shared = info->is_shared; head->shared = info->is_shared;
ratelimit_state_init(&head->rs_nuse, 5 * HZ, 1);
ratelimit_set_flags(&head->rs_nuse, RATELIMIT_MSG_ON_RELEASE);
kref_init(&head->ref); kref_init(&head->ref);
if (head->ids.csi) { if (head->ids.csi) {
...@@ -3643,7 +3675,7 @@ static void nvme_alloc_ns(struct nvme_ctrl *ctrl, struct nvme_ns_info *info) ...@@ -3643,7 +3675,7 @@ static void nvme_alloc_ns(struct nvme_ctrl *ctrl, struct nvme_ns_info *info)
up_write(&ctrl->namespaces_rwsem); up_write(&ctrl->namespaces_rwsem);
nvme_get_ctrl(ctrl); nvme_get_ctrl(ctrl);
if (device_add_disk(ctrl->device, ns->disk, nvme_ns_id_attr_groups)) if (device_add_disk(ctrl->device, ns->disk, nvme_ns_attr_groups))
goto out_cleanup_ns_from_list; goto out_cleanup_ns_from_list;
if (!nvme_ns_head_multipath(ns->head)) if (!nvme_ns_head_multipath(ns->head))
......
...@@ -3509,10 +3509,6 @@ nvme_fc_init_ctrl(struct device *dev, struct nvmf_ctrl_options *opts, ...@@ -3509,10 +3509,6 @@ nvme_fc_init_ctrl(struct device *dev, struct nvmf_ctrl_options *opts,
ctrl->ctrl.opts = opts; ctrl->ctrl.opts = opts;
ctrl->ctrl.nr_reconnects = 0; ctrl->ctrl.nr_reconnects = 0;
if (lport->dev)
ctrl->ctrl.numa_node = dev_to_node(lport->dev);
else
ctrl->ctrl.numa_node = NUMA_NO_NODE;
INIT_LIST_HEAD(&ctrl->ctrl_list); INIT_LIST_HEAD(&ctrl->ctrl_list);
ctrl->lport = lport; ctrl->lport = lport;
ctrl->rport = rport; ctrl->rport = rport;
...@@ -3557,6 +3553,8 @@ nvme_fc_init_ctrl(struct device *dev, struct nvmf_ctrl_options *opts, ...@@ -3557,6 +3553,8 @@ nvme_fc_init_ctrl(struct device *dev, struct nvmf_ctrl_options *opts,
ret = nvme_init_ctrl(&ctrl->ctrl, dev, &nvme_fc_ctrl_ops, 0); ret = nvme_init_ctrl(&ctrl->ctrl, dev, &nvme_fc_ctrl_ops, 0);
if (ret) if (ret)
goto out_free_queues; goto out_free_queues;
if (lport->dev)
ctrl->ctrl.numa_node = dev_to_node(lport->dev);
/* at this point, teardown path changes to ref counting on nvme ctrl */ /* at this point, teardown path changes to ref counting on nvme ctrl */
......
...@@ -224,10 +224,10 @@ static int nvme_submit_io(struct nvme_ns *ns, struct nvme_user_io __user *uio) ...@@ -224,10 +224,10 @@ static int nvme_submit_io(struct nvme_ns *ns, struct nvme_user_io __user *uio)
return -EINVAL; return -EINVAL;
} }
length = (io.nblocks + 1) << ns->lba_shift; length = (io.nblocks + 1) << ns->head->lba_shift;
if ((io.control & NVME_RW_PRINFO_PRACT) && if ((io.control & NVME_RW_PRINFO_PRACT) &&
ns->ms == sizeof(struct t10_pi_tuple)) { ns->head->ms == sizeof(struct t10_pi_tuple)) {
/* /*
* Protection information is stripped/inserted by the * Protection information is stripped/inserted by the
* controller. * controller.
...@@ -237,11 +237,11 @@ static int nvme_submit_io(struct nvme_ns *ns, struct nvme_user_io __user *uio) ...@@ -237,11 +237,11 @@ static int nvme_submit_io(struct nvme_ns *ns, struct nvme_user_io __user *uio)
meta_len = 0; meta_len = 0;
metadata = NULL; metadata = NULL;
} else { } else {
meta_len = (io.nblocks + 1) * ns->ms; meta_len = (io.nblocks + 1) * ns->head->ms;
metadata = nvme_to_user_ptr(io.metadata); metadata = nvme_to_user_ptr(io.metadata);
} }
if (ns->features & NVME_NS_EXT_LBAS) { if (ns->head->features & NVME_NS_EXT_LBAS) {
length += meta_len; length += meta_len;
meta_len = 0; meta_len = 0;
} else if (meta_len) { } else if (meta_len) {
......
...@@ -579,7 +579,7 @@ static void nvme_mpath_set_live(struct nvme_ns *ns) ...@@ -579,7 +579,7 @@ static void nvme_mpath_set_live(struct nvme_ns *ns)
*/ */
if (!test_and_set_bit(NVME_NSHEAD_DISK_LIVE, &head->flags)) { if (!test_and_set_bit(NVME_NSHEAD_DISK_LIVE, &head->flags)) {
rc = device_add_disk(&head->subsys->dev, head->disk, rc = device_add_disk(&head->subsys->dev, head->disk,
nvme_ns_id_attr_groups); nvme_ns_attr_groups);
if (rc) { if (rc) {
clear_bit(NVME_NSHEAD_DISK_LIVE, &ns->flags); clear_bit(NVME_NSHEAD_DISK_LIVE, &ns->flags);
return; return;
......
...@@ -16,6 +16,7 @@ ...@@ -16,6 +16,7 @@
#include <linux/rcupdate.h> #include <linux/rcupdate.h>
#include <linux/wait.h> #include <linux/wait.h>
#include <linux/t10-pi.h> #include <linux/t10-pi.h>
#include <linux/ratelimit_types.h>
#include <trace/events/block.h> #include <trace/events/block.h>
...@@ -439,13 +440,27 @@ struct nvme_ns_head { ...@@ -439,13 +440,27 @@ struct nvme_ns_head {
struct list_head list; struct list_head list;
struct srcu_struct srcu; struct srcu_struct srcu;
struct nvme_subsystem *subsys; struct nvme_subsystem *subsys;
unsigned ns_id;
struct nvme_ns_ids ids; struct nvme_ns_ids ids;
struct list_head entry; struct list_head entry;
struct kref ref; struct kref ref;
bool shared; bool shared;
int instance; int instance;
struct nvme_effects_log *effects; struct nvme_effects_log *effects;
u64 nuse;
unsigned ns_id;
int lba_shift;
u16 ms;
u16 pi_size;
u8 pi_type;
u8 guard_type;
u16 sgs;
u32 sws;
#ifdef CONFIG_BLK_DEV_ZONED
u64 zsze;
#endif
unsigned long features;
struct ratelimit_state rs_nuse;
struct cdev cdev; struct cdev cdev;
struct device cdev_device; struct device cdev_device;
...@@ -487,17 +502,6 @@ struct nvme_ns { ...@@ -487,17 +502,6 @@ struct nvme_ns {
struct kref kref; struct kref kref;
struct nvme_ns_head *head; struct nvme_ns_head *head;
int lba_shift;
u16 ms;
u16 pi_size;
u16 sgs;
u32 sws;
u8 pi_type;
u8 guard_type;
#ifdef CONFIG_BLK_DEV_ZONED
u64 zsze;
#endif
unsigned long features;
unsigned long flags; unsigned long flags;
#define NVME_NS_REMOVING 0 #define NVME_NS_REMOVING 0
#define NVME_NS_ANA_PENDING 2 #define NVME_NS_ANA_PENDING 2
...@@ -512,9 +516,9 @@ struct nvme_ns { ...@@ -512,9 +516,9 @@ struct nvme_ns {
}; };
/* NVMe ns supports metadata actions by the controller (generate/strip) */ /* NVMe ns supports metadata actions by the controller (generate/strip) */
static inline bool nvme_ns_has_pi(struct nvme_ns *ns) static inline bool nvme_ns_has_pi(struct nvme_ns_head *head)
{ {
return ns->pi_type && ns->ms == ns->pi_size; return head->pi_type && head->ms == head->pi_size;
} }
struct nvme_ctrl_ops { struct nvme_ctrl_ops {
...@@ -646,17 +650,17 @@ static inline int nvme_reset_subsystem(struct nvme_ctrl *ctrl) ...@@ -646,17 +650,17 @@ static inline int nvme_reset_subsystem(struct nvme_ctrl *ctrl)
/* /*
* Convert a 512B sector number to a device logical block number. * Convert a 512B sector number to a device logical block number.
*/ */
static inline u64 nvme_sect_to_lba(struct nvme_ns *ns, sector_t sector) static inline u64 nvme_sect_to_lba(struct nvme_ns_head *head, sector_t sector)
{ {
return sector >> (ns->lba_shift - SECTOR_SHIFT); return sector >> (head->lba_shift - SECTOR_SHIFT);
} }
/* /*
* Convert a device logical block number to a 512B sector number. * Convert a device logical block number to a 512B sector number.
*/ */
static inline sector_t nvme_lba_to_sect(struct nvme_ns *ns, u64 lba) static inline sector_t nvme_lba_to_sect(struct nvme_ns_head *head, u64 lba)
{ {
return lba << (ns->lba_shift - SECTOR_SHIFT); return lba << (head->lba_shift - SECTOR_SHIFT);
} }
/* /*
...@@ -862,10 +866,12 @@ int nvme_ns_chr_uring_cmd(struct io_uring_cmd *ioucmd, ...@@ -862,10 +866,12 @@ int nvme_ns_chr_uring_cmd(struct io_uring_cmd *ioucmd,
unsigned int issue_flags); unsigned int issue_flags);
int nvme_ns_head_chr_uring_cmd(struct io_uring_cmd *ioucmd, int nvme_ns_head_chr_uring_cmd(struct io_uring_cmd *ioucmd,
unsigned int issue_flags); unsigned int issue_flags);
int nvme_identify_ns(struct nvme_ctrl *ctrl, unsigned nsid,
struct nvme_id_ns **id);
int nvme_getgeo(struct block_device *bdev, struct hd_geometry *geo); int nvme_getgeo(struct block_device *bdev, struct hd_geometry *geo);
int nvme_dev_uring_cmd(struct io_uring_cmd *ioucmd, unsigned int issue_flags); int nvme_dev_uring_cmd(struct io_uring_cmd *ioucmd, unsigned int issue_flags);
extern const struct attribute_group *nvme_ns_id_attr_groups[]; extern const struct attribute_group *nvme_ns_attr_groups[];
extern const struct pr_ops nvme_pr_ops; extern const struct pr_ops nvme_pr_ops;
extern const struct block_device_operations nvme_ns_head_ops; extern const struct block_device_operations nvme_ns_head_ops;
extern const struct attribute_group nvme_dev_attrs_group; extern const struct attribute_group nvme_dev_attrs_group;
......
...@@ -1418,7 +1418,7 @@ static int nvme_rdma_map_sg_pi(struct nvme_rdma_queue *queue, ...@@ -1418,7 +1418,7 @@ static int nvme_rdma_map_sg_pi(struct nvme_rdma_queue *queue,
goto mr_put; goto mr_put;
nvme_rdma_set_sig_attrs(blk_get_integrity(bio->bi_bdev->bd_disk), c, nvme_rdma_set_sig_attrs(blk_get_integrity(bio->bi_bdev->bd_disk), c,
req->mr->sig_attrs, ns->pi_type); req->mr->sig_attrs, ns->head->pi_type);
nvme_rdma_set_prot_checks(c, &req->mr->sig_attrs->check_mask); nvme_rdma_set_prot_checks(c, &req->mr->sig_attrs->check_mask);
ib_update_fast_reg_key(req->mr, ib_inc_rkey(req->mr->rkey)); ib_update_fast_reg_key(req->mr, ib_inc_rkey(req->mr->rkey));
...@@ -2012,7 +2012,7 @@ static blk_status_t nvme_rdma_queue_rq(struct blk_mq_hw_ctx *hctx, ...@@ -2012,7 +2012,7 @@ static blk_status_t nvme_rdma_queue_rq(struct blk_mq_hw_ctx *hctx,
queue->pi_support && queue->pi_support &&
(c->common.opcode == nvme_cmd_write || (c->common.opcode == nvme_cmd_write ||
c->common.opcode == nvme_cmd_read) && c->common.opcode == nvme_cmd_read) &&
nvme_ns_has_pi(ns)) nvme_ns_has_pi(ns->head))
req->use_sig_mr = true; req->use_sig_mr = true;
else else
req->use_sig_mr = false; req->use_sig_mr = false;
......
...@@ -114,12 +114,97 @@ static ssize_t nsid_show(struct device *dev, struct device_attribute *attr, ...@@ -114,12 +114,97 @@ static ssize_t nsid_show(struct device *dev, struct device_attribute *attr,
} }
static DEVICE_ATTR_RO(nsid); static DEVICE_ATTR_RO(nsid);
static struct attribute *nvme_ns_id_attrs[] = { static ssize_t csi_show(struct device *dev, struct device_attribute *attr,
char *buf)
{
return sysfs_emit(buf, "%u\n", dev_to_ns_head(dev)->ids.csi);
}
static DEVICE_ATTR_RO(csi);
static ssize_t metadata_bytes_show(struct device *dev,
struct device_attribute *attr, char *buf)
{
return sysfs_emit(buf, "%u\n", dev_to_ns_head(dev)->ms);
}
static DEVICE_ATTR_RO(metadata_bytes);
static int ns_head_update_nuse(struct nvme_ns_head *head)
{
struct nvme_id_ns *id;
struct nvme_ns *ns;
int srcu_idx, ret = -EWOULDBLOCK;
/* Avoid issuing commands too often by rate limiting the update */
if (!__ratelimit(&head->rs_nuse))
return 0;
srcu_idx = srcu_read_lock(&head->srcu);
ns = nvme_find_path(head);
if (!ns)
goto out_unlock;
ret = nvme_identify_ns(ns->ctrl, head->ns_id, &id);
if (ret)
goto out_unlock;
head->nuse = le64_to_cpu(id->nuse);
kfree(id);
out_unlock:
srcu_read_unlock(&head->srcu, srcu_idx);
return ret;
}
static int ns_update_nuse(struct nvme_ns *ns)
{
struct nvme_id_ns *id;
int ret;
/* Avoid issuing commands too often by rate limiting the update. */
if (!__ratelimit(&ns->head->rs_nuse))
return 0;
ret = nvme_identify_ns(ns->ctrl, ns->head->ns_id, &id);
if (ret)
goto out_free_id;
ns->head->nuse = le64_to_cpu(id->nuse);
out_free_id:
kfree(id);
return ret;
}
static ssize_t nuse_show(struct device *dev, struct device_attribute *attr,
char *buf)
{
struct nvme_ns_head *head = dev_to_ns_head(dev);
struct gendisk *disk = dev_to_disk(dev);
struct block_device *bdev = disk->part0;
int ret;
if (IS_ENABLED(CONFIG_NVME_MULTIPATH) &&
bdev->bd_disk->fops == &nvme_ns_head_ops)
ret = ns_head_update_nuse(head);
else
ret = ns_update_nuse(bdev->bd_disk->private_data);
if (ret)
return ret;
return sysfs_emit(buf, "%llu\n", head->nuse);
}
static DEVICE_ATTR_RO(nuse);
static struct attribute *nvme_ns_attrs[] = {
&dev_attr_wwid.attr, &dev_attr_wwid.attr,
&dev_attr_uuid.attr, &dev_attr_uuid.attr,
&dev_attr_nguid.attr, &dev_attr_nguid.attr,
&dev_attr_eui.attr, &dev_attr_eui.attr,
&dev_attr_csi.attr,
&dev_attr_nsid.attr, &dev_attr_nsid.attr,
&dev_attr_metadata_bytes.attr,
&dev_attr_nuse.attr,
#ifdef CONFIG_NVME_MULTIPATH #ifdef CONFIG_NVME_MULTIPATH
&dev_attr_ana_grpid.attr, &dev_attr_ana_grpid.attr,
&dev_attr_ana_state.attr, &dev_attr_ana_state.attr,
...@@ -127,7 +212,7 @@ static struct attribute *nvme_ns_id_attrs[] = { ...@@ -127,7 +212,7 @@ static struct attribute *nvme_ns_id_attrs[] = {
NULL, NULL,
}; };
static umode_t nvme_ns_id_attrs_are_visible(struct kobject *kobj, static umode_t nvme_ns_attrs_are_visible(struct kobject *kobj,
struct attribute *a, int n) struct attribute *a, int n)
{ {
struct device *dev = container_of(kobj, struct device, kobj); struct device *dev = container_of(kobj, struct device, kobj);
...@@ -157,13 +242,13 @@ static umode_t nvme_ns_id_attrs_are_visible(struct kobject *kobj, ...@@ -157,13 +242,13 @@ static umode_t nvme_ns_id_attrs_are_visible(struct kobject *kobj,
return a->mode; return a->mode;
} }
static const struct attribute_group nvme_ns_id_attr_group = { static const struct attribute_group nvme_ns_attr_group = {
.attrs = nvme_ns_id_attrs, .attrs = nvme_ns_attrs,
.is_visible = nvme_ns_id_attrs_are_visible, .is_visible = nvme_ns_attrs_are_visible,
}; };
const struct attribute_group *nvme_ns_id_attr_groups[] = { const struct attribute_group *nvme_ns_attr_groups[] = {
&nvme_ns_id_attr_group, &nvme_ns_attr_group,
NULL, NULL,
}; };
......
...@@ -11,7 +11,7 @@ int nvme_revalidate_zones(struct nvme_ns *ns) ...@@ -11,7 +11,7 @@ int nvme_revalidate_zones(struct nvme_ns *ns)
{ {
struct request_queue *q = ns->queue; struct request_queue *q = ns->queue;
blk_queue_chunk_sectors(q, ns->zsze); blk_queue_chunk_sectors(q, ns->head->zsze);
blk_queue_max_zone_append_sectors(q, ns->ctrl->max_zone_append); blk_queue_max_zone_append_sectors(q, ns->ctrl->max_zone_append);
return blk_revalidate_disk_zones(ns->disk, NULL); return blk_revalidate_disk_zones(ns->disk, NULL);
...@@ -99,11 +99,12 @@ int nvme_update_zone_info(struct nvme_ns *ns, unsigned lbaf) ...@@ -99,11 +99,12 @@ int nvme_update_zone_info(struct nvme_ns *ns, unsigned lbaf)
goto free_data; goto free_data;
} }
ns->zsze = nvme_lba_to_sect(ns, le64_to_cpu(id->lbafe[lbaf].zsze)); ns->head->zsze =
if (!is_power_of_2(ns->zsze)) { nvme_lba_to_sect(ns->head, le64_to_cpu(id->lbafe[lbaf].zsze));
if (!is_power_of_2(ns->head->zsze)) {
dev_warn(ns->ctrl->device, dev_warn(ns->ctrl->device,
"invalid zone size:%llu for namespace:%u\n", "invalid zone size:%llu for namespace:%u\n",
ns->zsze, ns->head->ns_id); ns->head->zsze, ns->head->ns_id);
status = -ENODEV; status = -ENODEV;
goto free_data; goto free_data;
} }
...@@ -128,7 +129,7 @@ static void *nvme_zns_alloc_report_buffer(struct nvme_ns *ns, ...@@ -128,7 +129,7 @@ static void *nvme_zns_alloc_report_buffer(struct nvme_ns *ns,
sizeof(struct nvme_zone_descriptor); sizeof(struct nvme_zone_descriptor);
nr_zones = min_t(unsigned int, nr_zones, nr_zones = min_t(unsigned int, nr_zones,
get_capacity(ns->disk) >> ilog2(ns->zsze)); get_capacity(ns->disk) >> ilog2(ns->head->zsze));
bufsize = sizeof(struct nvme_zone_report) + bufsize = sizeof(struct nvme_zone_report) +
nr_zones * sizeof(struct nvme_zone_descriptor); nr_zones * sizeof(struct nvme_zone_descriptor);
...@@ -147,7 +148,8 @@ static void *nvme_zns_alloc_report_buffer(struct nvme_ns *ns, ...@@ -147,7 +148,8 @@ static void *nvme_zns_alloc_report_buffer(struct nvme_ns *ns,
return NULL; return NULL;
} }
static int nvme_zone_parse_entry(struct nvme_ns *ns, static int nvme_zone_parse_entry(struct nvme_ctrl *ctrl,
struct nvme_ns_head *head,
struct nvme_zone_descriptor *entry, struct nvme_zone_descriptor *entry,
unsigned int idx, report_zones_cb cb, unsigned int idx, report_zones_cb cb,
void *data) void *data)
...@@ -155,20 +157,20 @@ static int nvme_zone_parse_entry(struct nvme_ns *ns, ...@@ -155,20 +157,20 @@ static int nvme_zone_parse_entry(struct nvme_ns *ns,
struct blk_zone zone = { }; struct blk_zone zone = { };
if ((entry->zt & 0xf) != NVME_ZONE_TYPE_SEQWRITE_REQ) { if ((entry->zt & 0xf) != NVME_ZONE_TYPE_SEQWRITE_REQ) {
dev_err(ns->ctrl->device, "invalid zone type %#x\n", dev_err(ctrl->device, "invalid zone type %#x\n",
entry->zt); entry->zt);
return -EINVAL; return -EINVAL;
} }
zone.type = BLK_ZONE_TYPE_SEQWRITE_REQ; zone.type = BLK_ZONE_TYPE_SEQWRITE_REQ;
zone.cond = entry->zs >> 4; zone.cond = entry->zs >> 4;
zone.len = ns->zsze; zone.len = head->zsze;
zone.capacity = nvme_lba_to_sect(ns, le64_to_cpu(entry->zcap)); zone.capacity = nvme_lba_to_sect(head, le64_to_cpu(entry->zcap));
zone.start = nvme_lba_to_sect(ns, le64_to_cpu(entry->zslba)); zone.start = nvme_lba_to_sect(head, le64_to_cpu(entry->zslba));
if (zone.cond == BLK_ZONE_COND_FULL) if (zone.cond == BLK_ZONE_COND_FULL)
zone.wp = zone.start + zone.len; zone.wp = zone.start + zone.len;
else else
zone.wp = nvme_lba_to_sect(ns, le64_to_cpu(entry->wp)); zone.wp = nvme_lba_to_sect(head, le64_to_cpu(entry->wp));
return cb(&zone, idx, data); return cb(&zone, idx, data);
} }
...@@ -196,11 +198,11 @@ int nvme_ns_report_zones(struct nvme_ns *ns, sector_t sector, ...@@ -196,11 +198,11 @@ int nvme_ns_report_zones(struct nvme_ns *ns, sector_t sector,
c.zmr.zrasf = NVME_ZRASF_ZONE_REPORT_ALL; c.zmr.zrasf = NVME_ZRASF_ZONE_REPORT_ALL;
c.zmr.pr = NVME_REPORT_ZONE_PARTIAL; c.zmr.pr = NVME_REPORT_ZONE_PARTIAL;
sector &= ~(ns->zsze - 1); sector &= ~(ns->head->zsze - 1);
while (zone_idx < nr_zones && sector < get_capacity(ns->disk)) { while (zone_idx < nr_zones && sector < get_capacity(ns->disk)) {
memset(report, 0, buflen); memset(report, 0, buflen);
c.zmr.slba = cpu_to_le64(nvme_sect_to_lba(ns, sector)); c.zmr.slba = cpu_to_le64(nvme_sect_to_lba(ns->head, sector));
ret = nvme_submit_sync_cmd(ns->queue, &c, report, buflen); ret = nvme_submit_sync_cmd(ns->queue, &c, report, buflen);
if (ret) { if (ret) {
if (ret > 0) if (ret > 0)
...@@ -213,14 +215,15 @@ int nvme_ns_report_zones(struct nvme_ns *ns, sector_t sector, ...@@ -213,14 +215,15 @@ int nvme_ns_report_zones(struct nvme_ns *ns, sector_t sector,
break; break;
for (i = 0; i < nz && zone_idx < nr_zones; i++) { for (i = 0; i < nz && zone_idx < nr_zones; i++) {
ret = nvme_zone_parse_entry(ns, &report->entries[i], ret = nvme_zone_parse_entry(ns->ctrl, ns->head,
&report->entries[i],
zone_idx, cb, data); zone_idx, cb, data);
if (ret) if (ret)
goto out_free; goto out_free;
zone_idx++; zone_idx++;
} }
sector += ns->zsze * nz; sector += ns->head->zsze * nz;
} }
if (zone_idx > 0) if (zone_idx > 0)
...@@ -239,7 +242,7 @@ blk_status_t nvme_setup_zone_mgmt_send(struct nvme_ns *ns, struct request *req, ...@@ -239,7 +242,7 @@ blk_status_t nvme_setup_zone_mgmt_send(struct nvme_ns *ns, struct request *req,
c->zms.opcode = nvme_cmd_zone_mgmt_send; c->zms.opcode = nvme_cmd_zone_mgmt_send;
c->zms.nsid = cpu_to_le32(ns->head->ns_id); c->zms.nsid = cpu_to_le32(ns->head->ns_id);
c->zms.slba = cpu_to_le64(nvme_sect_to_lba(ns, blk_rq_pos(req))); c->zms.slba = cpu_to_le64(nvme_sect_to_lba(ns->head, blk_rq_pos(req)));
c->zms.zsa = action; c->zms.zsa = action;
if (req_op(req) == REQ_OP_ZONE_RESET_ALL) if (req_op(req) == REQ_OP_ZONE_RESET_ALL)
......
...@@ -1274,7 +1274,7 @@ static ssize_t nvmet_subsys_attr_cntlid_min_store(struct config_item *item, ...@@ -1274,7 +1274,7 @@ static ssize_t nvmet_subsys_attr_cntlid_min_store(struct config_item *item,
return -EINVAL; return -EINVAL;
down_write(&nvmet_config_sem); down_write(&nvmet_config_sem);
if (cntlid_min >= to_subsys(item)->cntlid_max) if (cntlid_min > to_subsys(item)->cntlid_max)
goto out_unlock; goto out_unlock;
to_subsys(item)->cntlid_min = cntlid_min; to_subsys(item)->cntlid_min = cntlid_min;
up_write(&nvmet_config_sem); up_write(&nvmet_config_sem);
...@@ -1304,7 +1304,7 @@ static ssize_t nvmet_subsys_attr_cntlid_max_store(struct config_item *item, ...@@ -1304,7 +1304,7 @@ static ssize_t nvmet_subsys_attr_cntlid_max_store(struct config_item *item,
return -EINVAL; return -EINVAL;
down_write(&nvmet_config_sem); down_write(&nvmet_config_sem);
if (cntlid_max <= to_subsys(item)->cntlid_min) if (cntlid_max < to_subsys(item)->cntlid_min)
goto out_unlock; goto out_unlock;
to_subsys(item)->cntlid_max = cntlid_max; to_subsys(item)->cntlid_max = cntlid_max;
up_write(&nvmet_config_sem); up_write(&nvmet_config_sem);
......
...@@ -1425,9 +1425,6 @@ u16 nvmet_alloc_ctrl(const char *subsysnqn, const char *hostnqn, ...@@ -1425,9 +1425,6 @@ u16 nvmet_alloc_ctrl(const char *subsysnqn, const char *hostnqn,
if (!ctrl->sqs) if (!ctrl->sqs)
goto out_free_changed_ns_list; goto out_free_changed_ns_list;
if (subsys->cntlid_min > subsys->cntlid_max)
goto out_free_sqs;
ret = ida_alloc_range(&cntlid_ida, ret = ida_alloc_range(&cntlid_ida,
subsys->cntlid_min, subsys->cntlid_max, subsys->cntlid_min, subsys->cntlid_max,
GFP_KERNEL); GFP_KERNEL);
......
...@@ -602,7 +602,7 @@ int nvmet_passthru_ctrl_enable(struct nvmet_subsys *subsys) ...@@ -602,7 +602,7 @@ int nvmet_passthru_ctrl_enable(struct nvmet_subsys *subsys)
goto out_put_file; goto out_put_file;
} }
old = xa_cmpxchg(&passthru_subsystems, ctrl->cntlid, NULL, old = xa_cmpxchg(&passthru_subsystems, ctrl->instance, NULL,
subsys, GFP_KERNEL); subsys, GFP_KERNEL);
if (xa_is_err(old)) { if (xa_is_err(old)) {
ret = xa_err(old); ret = xa_err(old);
...@@ -635,7 +635,7 @@ int nvmet_passthru_ctrl_enable(struct nvmet_subsys *subsys) ...@@ -635,7 +635,7 @@ int nvmet_passthru_ctrl_enable(struct nvmet_subsys *subsys)
static void __nvmet_passthru_ctrl_disable(struct nvmet_subsys *subsys) static void __nvmet_passthru_ctrl_disable(struct nvmet_subsys *subsys)
{ {
if (subsys->passthru_ctrl) { if (subsys->passthru_ctrl) {
xa_erase(&passthru_subsystems, subsys->passthru_ctrl->cntlid); xa_erase(&passthru_subsystems, subsys->passthru_ctrl->instance);
module_put(subsys->passthru_ctrl->ops->module); module_put(subsys->passthru_ctrl->ops->module);
nvme_put_ctrl(subsys->passthru_ctrl); nvme_put_ctrl(subsys->passthru_ctrl);
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment