Skip to content

Commit b2750f1

Browse files
committed
Merge tag 'nvme-5.17-2022-02-24' of git://git.infradead.org/nvme into block-5.17
Pull NVMe fixes from Christoph: "nvme fixes for Linux 5.17 - send H2CData PDUs based on MAXH2CDATA (Varun Prakash) - fix passthrough to namespaces with unsupported features (me)" * tag 'nvme-5.17-2022-02-24' of git://git.infradead.org/nvme: nvme-tcp: send H2CData PDUs based on MAXH2CDATA nvme: also mark passthrough-only namespaces ready in nvme_update_ns_info nvme: don't return an error from nvme_configure_metadata
2 parents bb49c6f + c2700d2 commit b2750f1

File tree

3 files changed

+58
-25
lines changed

3 files changed

+58
-25
lines changed

drivers/nvme/host/core.c

Lines changed: 8 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -1723,7 +1723,7 @@ static int nvme_setup_streams_ns(struct nvme_ctrl *ctrl, struct nvme_ns *ns,
17231723
return 0;
17241724
}
17251725

1726-
static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id)
1726+
static void nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id)
17271727
{
17281728
struct nvme_ctrl *ctrl = ns->ctrl;
17291729

@@ -1739,15 +1739,16 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id)
17391739

17401740
ns->features &= ~(NVME_NS_METADATA_SUPPORTED | NVME_NS_EXT_LBAS);
17411741
if (!ns->ms || !(ctrl->ops->flags & NVME_F_METADATA_SUPPORTED))
1742-
return 0;
1742+
return;
1743+
17431744
if (ctrl->ops->flags & NVME_F_FABRICS) {
17441745
/*
17451746
* The NVMe over Fabrics specification only supports metadata as
17461747
* part of the extended data LBA. We rely on HCA/HBA support to
17471748
* remap the separate metadata buffer from the block layer.
17481749
*/
17491750
if (WARN_ON_ONCE(!(id->flbas & NVME_NS_FLBAS_META_EXT)))
1750-
return -EINVAL;
1751+
return;
17511752

17521753
ns->features |= NVME_NS_EXT_LBAS;
17531754

@@ -1774,8 +1775,6 @@ static int nvme_configure_metadata(struct nvme_ns *ns, struct nvme_id_ns *id)
17741775
else
17751776
ns->features |= NVME_NS_METADATA_SUPPORTED;
17761777
}
1777-
1778-
return 0;
17791778
}
17801779

17811780
static void nvme_set_queue_limits(struct nvme_ctrl *ctrl,
@@ -1916,9 +1915,7 @@ static int nvme_update_ns_info(struct nvme_ns *ns, struct nvme_id_ns *id)
19161915
ns->lba_shift = id->lbaf[lbaf].ds;
19171916
nvme_set_queue_limits(ns->ctrl, ns->queue);
19181917

1919-
ret = nvme_configure_metadata(ns, id);
1920-
if (ret)
1921-
goto out_unfreeze;
1918+
nvme_configure_metadata(ns, id);
19221919
nvme_set_chunk_sectors(ns, id);
19231920
nvme_update_disk_info(ns->disk, ns, id);
19241921

@@ -1934,7 +1931,7 @@ static int nvme_update_ns_info(struct nvme_ns *ns, struct nvme_id_ns *id)
19341931
if (blk_queue_is_zoned(ns->queue)) {
19351932
ret = nvme_revalidate_zones(ns);
19361933
if (ret && !nvme_first_scan(ns->disk))
1937-
goto out;
1934+
return ret;
19381935
}
19391936

19401937
if (nvme_ns_head_multipath(ns->head)) {
@@ -1949,16 +1946,16 @@ static int nvme_update_ns_info(struct nvme_ns *ns, struct nvme_id_ns *id)
19491946
return 0;
19501947

19511948
out_unfreeze:
1952-
blk_mq_unfreeze_queue(ns->disk->queue);
1953-
out:
19541949
/*
19551950
* If probing fails due an unsupported feature, hide the block device,
19561951
* but still allow other access.
19571952
*/
19581953
if (ret == -ENODEV) {
19591954
ns->disk->flags |= GENHD_FL_HIDDEN;
1955+
set_bit(NVME_NS_READY, &ns->flags);
19601956
ret = 0;
19611957
}
1958+
blk_mq_unfreeze_queue(ns->disk->queue);
19621959
return ret;
19631960
}
19641961

drivers/nvme/host/tcp.c

Lines changed: 49 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -44,6 +44,8 @@ struct nvme_tcp_request {
4444
u32 data_len;
4545
u32 pdu_len;
4646
u32 pdu_sent;
47+
u32 h2cdata_left;
48+
u32 h2cdata_offset;
4749
u16 ttag;
4850
__le16 status;
4951
struct list_head entry;
@@ -95,6 +97,7 @@ struct nvme_tcp_queue {
9597
struct nvme_tcp_request *request;
9698

9799
int queue_size;
100+
u32 maxh2cdata;
98101
size_t cmnd_capsule_len;
99102
struct nvme_tcp_ctrl *ctrl;
100103
unsigned long flags;
@@ -572,23 +575,26 @@ static int nvme_tcp_handle_comp(struct nvme_tcp_queue *queue,
572575
return ret;
573576
}
574577

575-
static void nvme_tcp_setup_h2c_data_pdu(struct nvme_tcp_request *req,
576-
struct nvme_tcp_r2t_pdu *pdu)
578+
static void nvme_tcp_setup_h2c_data_pdu(struct nvme_tcp_request *req)
577579
{
578580
struct nvme_tcp_data_pdu *data = req->pdu;
579581
struct nvme_tcp_queue *queue = req->queue;
580582
struct request *rq = blk_mq_rq_from_pdu(req);
583+
u32 h2cdata_sent = req->pdu_len;
581584
u8 hdgst = nvme_tcp_hdgst_len(queue);
582585
u8 ddgst = nvme_tcp_ddgst_len(queue);
583586

584587
req->state = NVME_TCP_SEND_H2C_PDU;
585588
req->offset = 0;
586-
req->pdu_len = le32_to_cpu(pdu->r2t_length);
589+
req->pdu_len = min(req->h2cdata_left, queue->maxh2cdata);
587590
req->pdu_sent = 0;
591+
req->h2cdata_left -= req->pdu_len;
592+
req->h2cdata_offset += h2cdata_sent;
588593

589594
memset(data, 0, sizeof(*data));
590595
data->hdr.type = nvme_tcp_h2c_data;
591-
data->hdr.flags = NVME_TCP_F_DATA_LAST;
596+
if (!req->h2cdata_left)
597+
data->hdr.flags = NVME_TCP_F_DATA_LAST;
592598
if (queue->hdr_digest)
593599
data->hdr.flags |= NVME_TCP_F_HDGST;
594600
if (queue->data_digest)
@@ -597,9 +603,9 @@ static void nvme_tcp_setup_h2c_data_pdu(struct nvme_tcp_request *req,
597603
data->hdr.pdo = data->hdr.hlen + hdgst;
598604
data->hdr.plen =
599605
cpu_to_le32(data->hdr.hlen + hdgst + req->pdu_len + ddgst);
600-
data->ttag = pdu->ttag;
606+
data->ttag = req->ttag;
601607
data->command_id = nvme_cid(rq);
602-
data->data_offset = pdu->r2t_offset;
608+
data->data_offset = cpu_to_le32(req->h2cdata_offset);
603609
data->data_length = cpu_to_le32(req->pdu_len);
604610
}
605611

@@ -609,6 +615,7 @@ static int nvme_tcp_handle_r2t(struct nvme_tcp_queue *queue,
609615
struct nvme_tcp_request *req;
610616
struct request *rq;
611617
u32 r2t_length = le32_to_cpu(pdu->r2t_length);
618+
u32 r2t_offset = le32_to_cpu(pdu->r2t_offset);
612619

613620
rq = nvme_find_rq(nvme_tcp_tagset(queue), pdu->command_id);
614621
if (!rq) {
@@ -633,14 +640,19 @@ static int nvme_tcp_handle_r2t(struct nvme_tcp_queue *queue,
633640
return -EPROTO;
634641
}
635642

636-
if (unlikely(le32_to_cpu(pdu->r2t_offset) < req->data_sent)) {
643+
if (unlikely(r2t_offset < req->data_sent)) {
637644
dev_err(queue->ctrl->ctrl.device,
638645
"req %d unexpected r2t offset %u (expected %zu)\n",
639-
rq->tag, le32_to_cpu(pdu->r2t_offset), req->data_sent);
646+
rq->tag, r2t_offset, req->data_sent);
640647
return -EPROTO;
641648
}
642649

643-
nvme_tcp_setup_h2c_data_pdu(req, pdu);
650+
req->pdu_len = 0;
651+
req->h2cdata_left = r2t_length;
652+
req->h2cdata_offset = r2t_offset;
653+
req->ttag = pdu->ttag;
654+
655+
nvme_tcp_setup_h2c_data_pdu(req);
644656
nvme_tcp_queue_request(req, false, true);
645657

646658
return 0;
@@ -928,6 +940,7 @@ static int nvme_tcp_try_send_data(struct nvme_tcp_request *req)
928940
{
929941
struct nvme_tcp_queue *queue = req->queue;
930942
int req_data_len = req->data_len;
943+
u32 h2cdata_left = req->h2cdata_left;
931944

932945
while (true) {
933946
struct page *page = nvme_tcp_req_cur_page(req);
@@ -972,7 +985,10 @@ static int nvme_tcp_try_send_data(struct nvme_tcp_request *req)
972985
req->state = NVME_TCP_SEND_DDGST;
973986
req->offset = 0;
974987
} else {
975-
nvme_tcp_done_send_req(queue);
988+
if (h2cdata_left)
989+
nvme_tcp_setup_h2c_data_pdu(req);
990+
else
991+
nvme_tcp_done_send_req(queue);
976992
}
977993
return 1;
978994
}
@@ -1030,9 +1046,14 @@ static int nvme_tcp_try_send_data_pdu(struct nvme_tcp_request *req)
10301046
if (queue->hdr_digest && !req->offset)
10311047
nvme_tcp_hdgst(queue->snd_hash, pdu, sizeof(*pdu));
10321048

1033-
ret = kernel_sendpage(queue->sock, virt_to_page(pdu),
1034-
offset_in_page(pdu) + req->offset, len,
1035-
MSG_DONTWAIT | MSG_MORE | MSG_SENDPAGE_NOTLAST);
1049+
if (!req->h2cdata_left)
1050+
ret = kernel_sendpage(queue->sock, virt_to_page(pdu),
1051+
offset_in_page(pdu) + req->offset, len,
1052+
MSG_DONTWAIT | MSG_MORE | MSG_SENDPAGE_NOTLAST);
1053+
else
1054+
ret = sock_no_sendpage(queue->sock, virt_to_page(pdu),
1055+
offset_in_page(pdu) + req->offset, len,
1056+
MSG_DONTWAIT | MSG_MORE);
10361057
if (unlikely(ret <= 0))
10371058
return ret;
10381059

@@ -1052,6 +1073,7 @@ static int nvme_tcp_try_send_ddgst(struct nvme_tcp_request *req)
10521073
{
10531074
struct nvme_tcp_queue *queue = req->queue;
10541075
size_t offset = req->offset;
1076+
u32 h2cdata_left = req->h2cdata_left;
10551077
int ret;
10561078
struct msghdr msg = { .msg_flags = MSG_DONTWAIT };
10571079
struct kvec iov = {
@@ -1069,7 +1091,10 @@ static int nvme_tcp_try_send_ddgst(struct nvme_tcp_request *req)
10691091
return ret;
10701092

10711093
if (offset + ret == NVME_TCP_DIGEST_LENGTH) {
1072-
nvme_tcp_done_send_req(queue);
1094+
if (h2cdata_left)
1095+
nvme_tcp_setup_h2c_data_pdu(req);
1096+
else
1097+
nvme_tcp_done_send_req(queue);
10731098
return 1;
10741099
}
10751100

@@ -1261,6 +1286,7 @@ static int nvme_tcp_init_connection(struct nvme_tcp_queue *queue)
12611286
struct msghdr msg = {};
12621287
struct kvec iov;
12631288
bool ctrl_hdgst, ctrl_ddgst;
1289+
u32 maxh2cdata;
12641290
int ret;
12651291

12661292
icreq = kzalloc(sizeof(*icreq), GFP_KERNEL);
@@ -1344,6 +1370,14 @@ static int nvme_tcp_init_connection(struct nvme_tcp_queue *queue)
13441370
goto free_icresp;
13451371
}
13461372

1373+
maxh2cdata = le32_to_cpu(icresp->maxdata);
1374+
if ((maxh2cdata % 4) || (maxh2cdata < NVME_TCP_MIN_MAXH2CDATA)) {
1375+
pr_err("queue %d: invalid maxh2cdata returned %u\n",
1376+
nvme_tcp_queue_id(queue), maxh2cdata);
1377+
goto free_icresp;
1378+
}
1379+
queue->maxh2cdata = maxh2cdata;
1380+
13471381
ret = 0;
13481382
free_icresp:
13491383
kfree(icresp);
@@ -2329,6 +2363,7 @@ static blk_status_t nvme_tcp_setup_cmd_pdu(struct nvme_ns *ns,
23292363
req->data_sent = 0;
23302364
req->pdu_len = 0;
23312365
req->pdu_sent = 0;
2366+
req->h2cdata_left = 0;
23322367
req->data_len = blk_rq_nr_phys_segments(rq) ?
23332368
blk_rq_payload_bytes(rq) : 0;
23342369
req->curr_bio = rq->bio;

include/linux/nvme-tcp.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,7 @@
1212
#define NVME_TCP_DISC_PORT 8009
1313
#define NVME_TCP_ADMIN_CCSZ SZ_8K
1414
#define NVME_TCP_DIGEST_LENGTH 4
15+
#define NVME_TCP_MIN_MAXH2CDATA 4096
1516

1617
enum nvme_tcp_pfv {
1718
NVME_TCP_PFV_1_0 = 0x0,

0 commit comments

Comments
 (0)