diff options
Diffstat (limited to 'drivers/nvme')
| -rw-r--r-- | drivers/nvme/host/apple.c | 55 | ||||
| -rw-r--r-- | drivers/nvme/host/core.c | 10 | ||||
| -rw-r--r-- | drivers/nvme/host/fc.c | 68 | ||||
| -rw-r--r-- | drivers/nvme/host/ioctl.c | 3 | ||||
| -rw-r--r-- | drivers/nvme/host/pci.c | 14 | ||||
| -rw-r--r-- | drivers/nvme/host/sysfs.c | 2 | ||||
| -rw-r--r-- | drivers/nvme/host/tcp.c | 50 | ||||
| -rw-r--r-- | drivers/nvme/target/admin-cmd.c | 1 | ||||
| -rw-r--r-- | drivers/nvme/target/core.c | 40 | ||||
| -rw-r--r-- | drivers/nvme/target/fabrics-cmd.c | 2 | ||||
| -rw-r--r-- | drivers/nvme/target/io-cmd-bdev.c | 2 | ||||
| -rw-r--r-- | drivers/nvme/target/nvmet.h | 16 | ||||
| -rw-r--r-- | drivers/nvme/target/pci-epf.c | 39 | ||||
| -rw-r--r-- | drivers/nvme/target/rdma.c | 33 | 
14 files changed, 196 insertions, 139 deletions
| diff --git a/drivers/nvme/host/apple.c b/drivers/nvme/host/apple.c index 1de11b722f04..a060f69558e7 100644 --- a/drivers/nvme/host/apple.c +++ b/drivers/nvme/host/apple.c @@ -1011,25 +1011,37 @@ static void apple_nvme_reset_work(struct work_struct *work)  		ret = apple_rtkit_shutdown(anv->rtk);  		if (ret)  			goto out; + +		writel(0, anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL);  	} -	writel(0, anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL); +	/* +	 * Only do the soft-reset if the CPU is not running, which means either we +	 * or the previous stage shut it down cleanly. +	 */ +	if (!(readl(anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL) & +		APPLE_ANS_COPROC_CPU_CONTROL_RUN)) { -	ret = reset_control_assert(anv->reset); -	if (ret) -		goto out; +		ret = reset_control_assert(anv->reset); +		if (ret) +			goto out; -	ret = apple_rtkit_reinit(anv->rtk); -	if (ret) -		goto out; +		ret = apple_rtkit_reinit(anv->rtk); +		if (ret) +			goto out; -	ret = reset_control_deassert(anv->reset); -	if (ret) -		goto out; +		ret = reset_control_deassert(anv->reset); +		if (ret) +			goto out; + +		writel(APPLE_ANS_COPROC_CPU_CONTROL_RUN, +		       anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL); + +		ret = apple_rtkit_boot(anv->rtk); +	} else { +		ret = apple_rtkit_wake(anv->rtk); +	} -	writel(APPLE_ANS_COPROC_CPU_CONTROL_RUN, -	       anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL); -	ret = apple_rtkit_boot(anv->rtk);  	if (ret) {  		dev_err(anv->dev, "ANS did not boot");  		goto out; @@ -1516,6 +1528,7 @@ static struct apple_nvme *apple_nvme_alloc(struct platform_device *pdev)  	return anv;  put_dev: +	apple_nvme_detach_genpd(anv);  	put_device(anv->dev);  	return ERR_PTR(ret);  } @@ -1549,6 +1562,7 @@ out_uninit_ctrl:  	nvme_uninit_ctrl(&anv->ctrl);  out_put_ctrl:  	nvme_put_ctrl(&anv->ctrl); +	apple_nvme_detach_genpd(anv);  	return ret;  } @@ -1563,9 +1577,12 @@ static void apple_nvme_remove(struct platform_device *pdev)  	apple_nvme_disable(anv, true);  	nvme_uninit_ctrl(&anv->ctrl); -	if (apple_rtkit_is_running(anv->rtk)) +	if (apple_rtkit_is_running(anv->rtk)) {  		apple_rtkit_shutdown(anv->rtk); +		writel(0, anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL); +	} +  	apple_nvme_detach_genpd(anv);  } @@ -1574,8 +1591,11 @@ static void apple_nvme_shutdown(struct platform_device *pdev)  	struct apple_nvme *anv = platform_get_drvdata(pdev);  	apple_nvme_disable(anv, true); -	if (apple_rtkit_is_running(anv->rtk)) +	if (apple_rtkit_is_running(anv->rtk)) {  		apple_rtkit_shutdown(anv->rtk); + +		writel(0, anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL); +	}  }  static int apple_nvme_resume(struct device *dev) @@ -1592,10 +1612,11 @@ static int apple_nvme_suspend(struct device *dev)  	apple_nvme_disable(anv, true); -	if (apple_rtkit_is_running(anv->rtk)) +	if (apple_rtkit_is_running(anv->rtk)) {  		ret = apple_rtkit_shutdown(anv->rtk); -	writel(0, anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL); +		writel(0, anv->mmio_coproc + APPLE_ANS_COPROC_CPU_CONTROL); +	}  	return ret;  } diff --git a/drivers/nvme/host/core.c b/drivers/nvme/host/core.c index 40046770f1bf..f028913e2e62 100644 --- a/drivers/nvme/host/core.c +++ b/drivers/nvme/host/core.c @@ -564,8 +564,6 @@ bool nvme_change_ctrl_state(struct nvme_ctrl *ctrl,  	switch (new_state) {  	case NVME_CTRL_LIVE:  		switch (old_state) { -		case NVME_CTRL_NEW: -		case NVME_CTRL_RESETTING:  		case NVME_CTRL_CONNECTING:  			changed = true;  			fallthrough; @@ -1700,7 +1698,13 @@ int nvme_set_queue_count(struct nvme_ctrl *ctrl, int *count)  	status = nvme_set_features(ctrl, NVME_FEAT_NUM_QUEUES, q_count, NULL, 0,  			&result); -	if (status < 0) + +	/* +	 * It's either a kernel error or the host observed a connection +	 * lost. In either case it's not possible communicate with the +	 * controller and thus enter the error code path. +	 */ +	if (status < 0 || status == NVME_SC_HOST_PATH_ERROR)  		return status;  	/* diff --git a/drivers/nvme/host/fc.c b/drivers/nvme/host/fc.c index 094be164ffdc..b9929a5a7f4e 100644 --- a/drivers/nvme/host/fc.c +++ b/drivers/nvme/host/fc.c @@ -785,49 +785,8 @@ nvme_fc_ctrl_connectivity_loss(struct nvme_fc_ctrl *ctrl)  		"NVME-FC{%d}: controller connectivity lost. Awaiting "  		"Reconnect", ctrl->cnum); -	switch (nvme_ctrl_state(&ctrl->ctrl)) { -	case NVME_CTRL_NEW: -	case NVME_CTRL_LIVE: -		/* -		 * Schedule a controller reset. The reset will terminate the -		 * association and schedule the reconnect timer.  Reconnects -		 * will be attempted until either the ctlr_loss_tmo -		 * (max_retries * connect_delay) expires or the remoteport's -		 * dev_loss_tmo expires. -		 */ -		if (nvme_reset_ctrl(&ctrl->ctrl)) { -			dev_warn(ctrl->ctrl.device, -				"NVME-FC{%d}: Couldn't schedule reset.\n", -				ctrl->cnum); -			nvme_delete_ctrl(&ctrl->ctrl); -		} -		break; - -	case NVME_CTRL_CONNECTING: -		/* -		 * The association has already been terminated and the -		 * controller is attempting reconnects.  No need to do anything -		 * futher.  Reconnects will be attempted until either the -		 * ctlr_loss_tmo (max_retries * connect_delay) expires or the -		 * remoteport's dev_loss_tmo expires. -		 */ -		break; - -	case NVME_CTRL_RESETTING: -		/* -		 * Controller is already in the process of terminating the -		 * association.  No need to do anything further. The reconnect -		 * step will kick in naturally after the association is -		 * terminated. -		 */ -		break; - -	case NVME_CTRL_DELETING: -	case NVME_CTRL_DELETING_NOIO: -	default: -		/* no action to take - let it delete */ -		break; -	} +	set_bit(ASSOC_FAILED, &ctrl->flags); +	nvme_reset_ctrl(&ctrl->ctrl);  }  /** @@ -2079,7 +2038,8 @@ done:  		nvme_fc_complete_rq(rq);  check_error: -	if (terminate_assoc && ctrl->ctrl.state != NVME_CTRL_RESETTING) +	if (terminate_assoc && +	    nvme_ctrl_state(&ctrl->ctrl) != NVME_CTRL_RESETTING)  		queue_work(nvme_reset_wq, &ctrl->ioerr_work);  } @@ -2533,6 +2493,8 @@ __nvme_fc_abort_outstanding_ios(struct nvme_fc_ctrl *ctrl, bool start_queues)  static void  nvme_fc_error_recovery(struct nvme_fc_ctrl *ctrl, char *errmsg)  { +	enum nvme_ctrl_state state = nvme_ctrl_state(&ctrl->ctrl); +  	/*  	 * if an error (io timeout, etc) while (re)connecting, the remote  	 * port requested terminating of the association (disconnect_ls) @@ -2540,9 +2502,8 @@ nvme_fc_error_recovery(struct nvme_fc_ctrl *ctrl, char *errmsg)  	 * the controller.  Abort any ios on the association and let the  	 * create_association error path resolve things.  	 */ -	if (ctrl->ctrl.state == NVME_CTRL_CONNECTING) { +	if (state == NVME_CTRL_CONNECTING) {  		__nvme_fc_abort_outstanding_ios(ctrl, true); -		set_bit(ASSOC_FAILED, &ctrl->flags);  		dev_warn(ctrl->ctrl.device,  			"NVME-FC{%d}: transport error during (re)connect\n",  			ctrl->cnum); @@ -2550,7 +2511,7 @@ nvme_fc_error_recovery(struct nvme_fc_ctrl *ctrl, char *errmsg)  	}  	/* Otherwise, only proceed if in LIVE state - e.g. on first error */ -	if (ctrl->ctrl.state != NVME_CTRL_LIVE) +	if (state != NVME_CTRL_LIVE)  		return;  	dev_warn(ctrl->ctrl.device, @@ -3061,7 +3022,6 @@ nvme_fc_create_association(struct nvme_fc_ctrl *ctrl)  	struct nvmefc_ls_rcv_op *disls = NULL;  	unsigned long flags;  	int ret; -	bool changed;  	++ctrl->ctrl.nr_reconnects; @@ -3172,12 +3132,13 @@ nvme_fc_create_association(struct nvme_fc_ctrl *ctrl)  	if (ret)  		goto out_term_aen_ops; -	changed = nvme_change_ctrl_state(&ctrl->ctrl, NVME_CTRL_LIVE); +	if (!nvme_change_ctrl_state(&ctrl->ctrl, NVME_CTRL_LIVE)) { +		ret = -EIO; +		goto out_term_aen_ops; +	}  	ctrl->ctrl.nr_reconnects = 0; - -	if (changed) -		nvme_start_ctrl(&ctrl->ctrl); +	nvme_start_ctrl(&ctrl->ctrl);  	return 0;	/* Success */ @@ -3578,8 +3539,7 @@ nvme_fc_init_ctrl(struct device *dev, struct nvmf_ctrl_options *opts,  	list_add_tail(&ctrl->ctrl_list, &rport->ctrl_list);  	spin_unlock_irqrestore(&rport->lock, flags); -	if (!nvme_change_ctrl_state(&ctrl->ctrl, NVME_CTRL_RESETTING) || -	    !nvme_change_ctrl_state(&ctrl->ctrl, NVME_CTRL_CONNECTING)) { +	if (!nvme_change_ctrl_state(&ctrl->ctrl, NVME_CTRL_CONNECTING)) {  		dev_err(ctrl->ctrl.device,  			"NVME-FC{%d}: failed to init ctrl state\n", ctrl->cnum);  		goto fail_ctrl; diff --git a/drivers/nvme/host/ioctl.c b/drivers/nvme/host/ioctl.c index e8930146847a..b1b46c2713e1 100644 --- a/drivers/nvme/host/ioctl.c +++ b/drivers/nvme/host/ioctl.c @@ -283,8 +283,7 @@ static bool nvme_validate_passthru_nsid(struct nvme_ctrl *ctrl,  {  	if (ns && nsid != ns->head->ns_id) {  		dev_err(ctrl->device, -			"%s: nsid (%u) in cmd does not match nsid (%u)" -			"of namespace\n", +			"%s: nsid (%u) in cmd does not match nsid (%u) of namespace\n",  			current->comm, nsid, ns->head->ns_id);  		return false;  	} diff --git a/drivers/nvme/host/pci.c b/drivers/nvme/host/pci.c index 278bed4e35bb..950289405ef2 100644 --- a/drivers/nvme/host/pci.c +++ b/drivers/nvme/host/pci.c @@ -2153,14 +2153,6 @@ static int nvme_alloc_host_mem_multi(struct nvme_dev *dev, u64 preferred,  	return 0;  out_free_bufs: -	while (--i >= 0) { -		size_t size = le32_to_cpu(descs[i].size) * NVME_CTRL_PAGE_SIZE; - -		dma_free_attrs(dev->dev, size, bufs[i], -			       le64_to_cpu(descs[i].addr), -			       DMA_ATTR_NO_KERNEL_MAPPING | DMA_ATTR_NO_WARN); -	} -  	kfree(bufs);  out_free_descs:  	dma_free_coherent(dev->dev, descs_size, descs, descs_dma); @@ -3147,7 +3139,9 @@ static unsigned long check_vendor_combination_bug(struct pci_dev *pdev)  		 * because of high power consumption (> 2 Watt) in s2idle  		 * sleep. Only some boards with Intel CPU are affected.  		 */ -		if (dmi_match(DMI_BOARD_NAME, "GMxPXxx") || +		if (dmi_match(DMI_BOARD_NAME, "DN50Z-140HC-YD") || +		    dmi_match(DMI_BOARD_NAME, "GMxPXxx") || +		    dmi_match(DMI_BOARD_NAME, "GXxMRXx") ||  		    dmi_match(DMI_BOARD_NAME, "PH4PG31") ||  		    dmi_match(DMI_BOARD_NAME, "PH4PRX1_PH6PRX1") ||  		    dmi_match(DMI_BOARD_NAME, "PH6PG01_PH6PG71")) @@ -3712,6 +3706,8 @@ static const struct pci_device_id nvme_id_table[] = {  		.driver_data = NVME_QUIRK_BOGUS_NID, },  	{ PCI_DEVICE(0x1cc1, 0x5350),   /* ADATA XPG GAMMIX S50 */  		.driver_data = NVME_QUIRK_BOGUS_NID, }, +	{ PCI_DEVICE(0x1dbe, 0x5216),   /* Acer/INNOGRIT FA100/5216 NVMe SSD */ +		.driver_data = NVME_QUIRK_BOGUS_NID, },  	{ PCI_DEVICE(0x1dbe, 0x5236),   /* ADATA XPG GAMMIX S70 */  		.driver_data = NVME_QUIRK_BOGUS_NID, },  	{ PCI_DEVICE(0x1e49, 0x0021),   /* ZHITAI TiPro5000 NVMe SSD */ diff --git a/drivers/nvme/host/sysfs.c b/drivers/nvme/host/sysfs.c index b68a9e5f1ea3..3a41b9ab0f13 100644 --- a/drivers/nvme/host/sysfs.c +++ b/drivers/nvme/host/sysfs.c @@ -792,7 +792,7 @@ static umode_t nvme_tls_attrs_are_visible(struct kobject *kobj,  	return a->mode;  } -const struct attribute_group nvme_tls_attrs_group = { +static const struct attribute_group nvme_tls_attrs_group = {  	.attrs		= nvme_tls_attrs,  	.is_visible	= nvme_tls_attrs_are_visible,  }; diff --git a/drivers/nvme/host/tcp.c b/drivers/nvme/host/tcp.c index 841238f38fdd..8a9131c95a3d 100644 --- a/drivers/nvme/host/tcp.c +++ b/drivers/nvme/host/tcp.c @@ -763,6 +763,40 @@ static int nvme_tcp_handle_r2t(struct nvme_tcp_queue *queue,  	return 0;  } +static void nvme_tcp_handle_c2h_term(struct nvme_tcp_queue *queue, +		struct nvme_tcp_term_pdu *pdu) +{ +	u16 fes; +	const char *msg; +	u32 plen = le32_to_cpu(pdu->hdr.plen); + +	static const char * const msg_table[] = { +		[NVME_TCP_FES_INVALID_PDU_HDR] = "Invalid PDU Header Field", +		[NVME_TCP_FES_PDU_SEQ_ERR] = "PDU Sequence Error", +		[NVME_TCP_FES_HDR_DIGEST_ERR] = "Header Digest Error", +		[NVME_TCP_FES_DATA_OUT_OF_RANGE] = "Data Transfer Out Of Range", +		[NVME_TCP_FES_R2T_LIMIT_EXCEEDED] = "R2T Limit Exceeded", +		[NVME_TCP_FES_UNSUPPORTED_PARAM] = "Unsupported Parameter", +	}; + +	if (plen < NVME_TCP_MIN_C2HTERM_PLEN || +	    plen > NVME_TCP_MAX_C2HTERM_PLEN) { +		dev_err(queue->ctrl->ctrl.device, +			"Received a malformed C2HTermReq PDU (plen = %u)\n", +			plen); +		return; +	} + +	fes = le16_to_cpu(pdu->fes); +	if (fes && fes < ARRAY_SIZE(msg_table)) +		msg = msg_table[fes]; +	else +		msg = "Unknown"; + +	dev_err(queue->ctrl->ctrl.device, +		"Received C2HTermReq (FES = %s)\n", msg); +} +  static int nvme_tcp_recv_pdu(struct nvme_tcp_queue *queue, struct sk_buff *skb,  		unsigned int *offset, size_t *len)  { @@ -784,6 +818,15 @@ static int nvme_tcp_recv_pdu(struct nvme_tcp_queue *queue, struct sk_buff *skb,  		return 0;  	hdr = queue->pdu; +	if (unlikely(hdr->type == nvme_tcp_c2h_term)) { +		/* +		 * C2HTermReq never includes Header or Data digests. +		 * Skip the checks. +		 */ +		nvme_tcp_handle_c2h_term(queue, (void *)queue->pdu); +		return -EINVAL; +	} +  	if (queue->hdr_digest) {  		ret = nvme_tcp_verify_hdgst(queue, queue->pdu, hdr->hlen);  		if (unlikely(ret)) @@ -1449,11 +1492,14 @@ static int nvme_tcp_init_connection(struct nvme_tcp_queue *queue)  		msg.msg_control = cbuf;  		msg.msg_controllen = sizeof(cbuf);  	} +	msg.msg_flags = MSG_WAITALL;  	ret = kernel_recvmsg(queue->sock, &msg, &iov, 1,  			iov.iov_len, msg.msg_flags); -	if (ret < 0) { +	if (ret < sizeof(*icresp)) {  		pr_warn("queue %d: failed to receive icresp, error %d\n",  			nvme_tcp_queue_id(queue), ret); +		if (ret >= 0) +			ret = -ECONNRESET;  		goto free_icresp;  	}  	ret = -ENOTCONN; @@ -1565,7 +1611,7 @@ static bool nvme_tcp_poll_queue(struct nvme_tcp_queue *queue)  			  ctrl->io_queues[HCTX_TYPE_POLL];  } -/** +/*   * Track the number of queues assigned to each cpu using a global per-cpu   * counter and select the least used cpu from the mq_map. Our goal is to spread   * different controllers I/O threads across different cpu cores. diff --git a/drivers/nvme/target/admin-cmd.c b/drivers/nvme/target/admin-cmd.c index e670dc185a96..acc138bbf8f2 100644 --- a/drivers/nvme/target/admin-cmd.c +++ b/drivers/nvme/target/admin-cmd.c @@ -1068,6 +1068,7 @@ static void nvme_execute_identify_ns_nvm(struct nvmet_req *req)  		goto out;  	}  	status = nvmet_copy_to_sgl(req, 0, id, sizeof(*id)); +	kfree(id);  out:  	nvmet_req_complete(req, status);  } diff --git a/drivers/nvme/target/core.c b/drivers/nvme/target/core.c index cdc4a09a6e8a..2e741696f371 100644 --- a/drivers/nvme/target/core.c +++ b/drivers/nvme/target/core.c @@ -606,6 +606,9 @@ int nvmet_ns_enable(struct nvmet_ns *ns)  			goto out_dev_put;  	} +	if (percpu_ref_init(&ns->ref, nvmet_destroy_namespace, 0, GFP_KERNEL)) +		goto out_pr_exit; +  	nvmet_ns_changed(subsys, ns->nsid);  	ns->enabled = true;  	xa_set_mark(&subsys->namespaces, ns->nsid, NVMET_NS_ENABLED); @@ -613,6 +616,9 @@ int nvmet_ns_enable(struct nvmet_ns *ns)  out_unlock:  	mutex_unlock(&subsys->lock);  	return ret; +out_pr_exit: +	if (ns->pr.enable) +		nvmet_pr_exit_ns(ns);  out_dev_put:  	list_for_each_entry(ctrl, &subsys->ctrls, subsys_entry)  		pci_dev_put(radix_tree_delete(&ctrl->p2p_ns_map, ns->nsid)); @@ -638,6 +644,19 @@ void nvmet_ns_disable(struct nvmet_ns *ns)  	mutex_unlock(&subsys->lock); +	/* +	 * Now that we removed the namespaces from the lookup list, we +	 * can kill the per_cpu ref and wait for any remaining references +	 * to be dropped, as well as a RCU grace period for anyone only +	 * using the namepace under rcu_read_lock().  Note that we can't +	 * use call_rcu here as we need to ensure the namespaces have +	 * been fully destroyed before unloading the module. +	 */ +	percpu_ref_kill(&ns->ref); +	synchronize_rcu(); +	wait_for_completion(&ns->disable_done); +	percpu_ref_exit(&ns->ref); +  	if (ns->pr.enable)  		nvmet_pr_exit_ns(ns); @@ -660,22 +679,6 @@ void nvmet_ns_free(struct nvmet_ns *ns)  	if (ns->nsid == subsys->max_nsid)  		subsys->max_nsid = nvmet_max_nsid(subsys); -	mutex_unlock(&subsys->lock); - -	/* -	 * Now that we removed the namespaces from the lookup list, we -	 * can kill the per_cpu ref and wait for any remaining references -	 * to be dropped, as well as a RCU grace period for anyone only -	 * using the namepace under rcu_read_lock().  Note that we can't -	 * use call_rcu here as we need to ensure the namespaces have -	 * been fully destroyed before unloading the module. -	 */ -	percpu_ref_kill(&ns->ref); -	synchronize_rcu(); -	wait_for_completion(&ns->disable_done); -	percpu_ref_exit(&ns->ref); - -	mutex_lock(&subsys->lock);  	subsys->nr_namespaces--;  	mutex_unlock(&subsys->lock); @@ -705,9 +708,6 @@ struct nvmet_ns *nvmet_ns_alloc(struct nvmet_subsys *subsys, u32 nsid)  	ns->nsid = nsid;  	ns->subsys = subsys; -	if (percpu_ref_init(&ns->ref, nvmet_destroy_namespace, 0, GFP_KERNEL)) -		goto out_free; -  	if (ns->nsid > subsys->max_nsid)  		subsys->max_nsid = nsid; @@ -730,8 +730,6 @@ struct nvmet_ns *nvmet_ns_alloc(struct nvmet_subsys *subsys, u32 nsid)  	return ns;  out_exit:  	subsys->max_nsid = nvmet_max_nsid(subsys); -	percpu_ref_exit(&ns->ref); -out_free:  	kfree(ns);  out_unlock:  	mutex_unlock(&subsys->lock); diff --git a/drivers/nvme/target/fabrics-cmd.c b/drivers/nvme/target/fabrics-cmd.c index a7ff05b3be29..eb406c90c167 100644 --- a/drivers/nvme/target/fabrics-cmd.c +++ b/drivers/nvme/target/fabrics-cmd.c @@ -287,7 +287,7 @@ static void nvmet_execute_admin_connect(struct nvmet_req *req)  	args.subsysnqn = d->subsysnqn;  	args.hostnqn = d->hostnqn;  	args.hostid = &d->hostid; -	args.kato = c->kato; +	args.kato = le32_to_cpu(c->kato);  	ctrl = nvmet_alloc_ctrl(&args);  	if (!ctrl) diff --git a/drivers/nvme/target/io-cmd-bdev.c b/drivers/nvme/target/io-cmd-bdev.c index c1f574fe3280..83be0657e6df 100644 --- a/drivers/nvme/target/io-cmd-bdev.c +++ b/drivers/nvme/target/io-cmd-bdev.c @@ -272,7 +272,7 @@ static void nvmet_bdev_execute_rw(struct nvmet_req *req)  		iter_flags = SG_MITER_FROM_SG;  	} -	if (req->cmd->rw.control & NVME_RW_LR) +	if (req->cmd->rw.control & cpu_to_le16(NVME_RW_LR))  		opf |= REQ_FAILFAST_DEV;  	if (is_pci_p2pdma_page(sg_page(req->sg))) diff --git a/drivers/nvme/target/nvmet.h b/drivers/nvme/target/nvmet.h index b540216c0c9a..d2c1233981e1 100644 --- a/drivers/nvme/target/nvmet.h +++ b/drivers/nvme/target/nvmet.h @@ -589,7 +589,7 @@ struct nvmet_alloc_ctrl_args {  	const struct nvmet_fabrics_ops *ops;  	struct device		*p2p_client;  	u32			kato; -	u32			result; +	__le32			result;  	u16			error_loc;  	u16			status;  }; @@ -784,37 +784,37 @@ u16 nvmet_report_invalid_opcode(struct nvmet_req *req);  static inline bool nvmet_cc_en(u32 cc)  { -	return (cc >> NVME_CC_EN_SHIFT) & 0x1; +	return (cc & NVME_CC_ENABLE) >> NVME_CC_EN_SHIFT;  }  static inline u8 nvmet_cc_css(u32 cc)  { -	return (cc >> NVME_CC_CSS_SHIFT) & 0x7; +	return (cc & NVME_CC_CSS_MASK) >> NVME_CC_CSS_SHIFT;  }  static inline u8 nvmet_cc_mps(u32 cc)  { -	return (cc >> NVME_CC_MPS_SHIFT) & 0xf; +	return (cc & NVME_CC_MPS_MASK) >> NVME_CC_MPS_SHIFT;  }  static inline u8 nvmet_cc_ams(u32 cc)  { -	return (cc >> NVME_CC_AMS_SHIFT) & 0x7; +	return (cc & NVME_CC_AMS_MASK) >> NVME_CC_AMS_SHIFT;  }  static inline u8 nvmet_cc_shn(u32 cc)  { -	return (cc >> NVME_CC_SHN_SHIFT) & 0x3; +	return (cc & NVME_CC_SHN_MASK) >> NVME_CC_SHN_SHIFT;  }  static inline u8 nvmet_cc_iosqes(u32 cc)  { -	return (cc >> NVME_CC_IOSQES_SHIFT) & 0xf; +	return (cc & NVME_CC_IOSQES_MASK) >> NVME_CC_IOSQES_SHIFT;  }  static inline u8 nvmet_cc_iocqes(u32 cc)  { -	return (cc >> NVME_CC_IOCQES_SHIFT) & 0xf; +	return (cc & NVME_CC_IOCQES_MASK) >> NVME_CC_IOCQES_SHIFT;  }  /* Convert a 32-bit number to a 16-bit 0's based number */ diff --git a/drivers/nvme/target/pci-epf.c b/drivers/nvme/target/pci-epf.c index ac30b42cc622..565d2bd36dcd 100644 --- a/drivers/nvme/target/pci-epf.c +++ b/drivers/nvme/target/pci-epf.c @@ -46,7 +46,7 @@ static DEFINE_MUTEX(nvmet_pci_epf_ports_mutex);  /*   * BAR CC register and SQ polling intervals.   */ -#define NVMET_PCI_EPF_CC_POLL_INTERVAL	msecs_to_jiffies(5) +#define NVMET_PCI_EPF_CC_POLL_INTERVAL	msecs_to_jiffies(10)  #define NVMET_PCI_EPF_SQ_POLL_INTERVAL	msecs_to_jiffies(5)  #define NVMET_PCI_EPF_SQ_POLL_IDLE	msecs_to_jiffies(5000) @@ -1694,6 +1694,7 @@ static void nvmet_pci_epf_poll_sqs_work(struct work_struct *work)  	struct nvmet_pci_epf_ctrl *ctrl =  		container_of(work, struct nvmet_pci_epf_ctrl, poll_sqs.work);  	struct nvmet_pci_epf_queue *sq; +	unsigned long limit = jiffies;  	unsigned long last = 0;  	int i, nr_sqs; @@ -1708,6 +1709,16 @@ static void nvmet_pci_epf_poll_sqs_work(struct work_struct *work)  				nr_sqs++;  		} +		/* +		 * If we have been running for a while, reschedule to let other +		 * tasks run and to avoid RCU stalls. +		 */ +		if (time_is_before_jiffies(limit + secs_to_jiffies(1))) { +			cond_resched(); +			limit = jiffies; +			continue; +		} +  		if (nr_sqs) {  			last = jiffies;  			continue; @@ -1822,14 +1833,14 @@ static int nvmet_pci_epf_enable_ctrl(struct nvmet_pci_epf_ctrl *ctrl)  	if (ctrl->io_sqes < sizeof(struct nvme_command)) {  		dev_err(ctrl->dev, "Unsupported I/O SQES %zu (need %zu)\n",  			ctrl->io_sqes, sizeof(struct nvme_command)); -		return -EINVAL; +		goto err;  	}  	ctrl->io_cqes = 1UL << nvmet_cc_iocqes(ctrl->cc);  	if (ctrl->io_cqes < sizeof(struct nvme_completion)) {  		dev_err(ctrl->dev, "Unsupported I/O CQES %zu (need %zu)\n",  			ctrl->io_sqes, sizeof(struct nvme_completion)); -		return -EINVAL; +		goto err;  	}  	/* Create the admin queue. */ @@ -1844,7 +1855,7 @@ static int nvmet_pci_epf_enable_ctrl(struct nvmet_pci_epf_ctrl *ctrl)  				qsize, pci_addr, 0);  	if (status != NVME_SC_SUCCESS) {  		dev_err(ctrl->dev, "Failed to create admin completion queue\n"); -		return -EINVAL; +		goto err;  	}  	qsize = aqa & 0x00000fff; @@ -1854,17 +1865,22 @@ static int nvmet_pci_epf_enable_ctrl(struct nvmet_pci_epf_ctrl *ctrl)  	if (status != NVME_SC_SUCCESS) {  		dev_err(ctrl->dev, "Failed to create admin submission queue\n");  		nvmet_pci_epf_delete_cq(ctrl->tctrl, 0); -		return -EINVAL; +		goto err;  	}  	ctrl->sq_ab = NVMET_PCI_EPF_SQ_AB;  	ctrl->irq_vector_threshold = NVMET_PCI_EPF_IV_THRESHOLD;  	ctrl->enabled = true; +	ctrl->csts = NVME_CSTS_RDY;  	/* Start polling the controller SQs. */  	schedule_delayed_work(&ctrl->poll_sqs, 0);  	return 0; + +err: +	ctrl->csts = 0; +	return -EINVAL;  }  static void nvmet_pci_epf_disable_ctrl(struct nvmet_pci_epf_ctrl *ctrl) @@ -1889,6 +1905,8 @@ static void nvmet_pci_epf_disable_ctrl(struct nvmet_pci_epf_ctrl *ctrl)  	/* Delete the admin queue last. */  	nvmet_pci_epf_delete_sq(ctrl->tctrl, 0);  	nvmet_pci_epf_delete_cq(ctrl->tctrl, 0); + +	ctrl->csts &= ~NVME_CSTS_RDY;  }  static void nvmet_pci_epf_poll_cc_work(struct work_struct *work) @@ -1903,19 +1921,19 @@ static void nvmet_pci_epf_poll_cc_work(struct work_struct *work)  	old_cc = ctrl->cc;  	new_cc = nvmet_pci_epf_bar_read32(ctrl, NVME_REG_CC); +	if (new_cc == old_cc) +		goto reschedule_work; +  	ctrl->cc = new_cc;  	if (nvmet_cc_en(new_cc) && !nvmet_cc_en(old_cc)) {  		ret = nvmet_pci_epf_enable_ctrl(ctrl);  		if (ret) -			return; -		ctrl->csts |= NVME_CSTS_RDY; +			goto reschedule_work;  	} -	if (!nvmet_cc_en(new_cc) && nvmet_cc_en(old_cc)) { +	if (!nvmet_cc_en(new_cc) && nvmet_cc_en(old_cc))  		nvmet_pci_epf_disable_ctrl(ctrl); -		ctrl->csts &= ~NVME_CSTS_RDY; -	}  	if (nvmet_cc_shn(new_cc) && !nvmet_cc_shn(old_cc)) {  		nvmet_pci_epf_disable_ctrl(ctrl); @@ -1928,6 +1946,7 @@ static void nvmet_pci_epf_poll_cc_work(struct work_struct *work)  	nvmet_update_cc(ctrl->tctrl, ctrl->cc);  	nvmet_pci_epf_bar_write32(ctrl, NVME_REG_CSTS, ctrl->csts); +reschedule_work:  	schedule_delayed_work(&ctrl->poll_cc, NVMET_PCI_EPF_CC_POLL_INTERVAL);  } diff --git a/drivers/nvme/target/rdma.c b/drivers/nvme/target/rdma.c index 1afd93026f9b..2a4536ef6184 100644 --- a/drivers/nvme/target/rdma.c +++ b/drivers/nvme/target/rdma.c @@ -996,6 +996,27 @@ out_err:  	nvmet_req_complete(&cmd->req, status);  } +static bool nvmet_rdma_recv_not_live(struct nvmet_rdma_queue *queue, +		struct nvmet_rdma_rsp *rsp) +{ +	unsigned long flags; +	bool ret = true; + +	spin_lock_irqsave(&queue->state_lock, flags); +	/* +	 * recheck queue state is not live to prevent a race condition +	 * with RDMA_CM_EVENT_ESTABLISHED handler. +	 */ +	if (queue->state == NVMET_RDMA_Q_LIVE) +		ret = false; +	else if (queue->state == NVMET_RDMA_Q_CONNECTING) +		list_add_tail(&rsp->wait_list, &queue->rsp_wait_list); +	else +		nvmet_rdma_put_rsp(rsp); +	spin_unlock_irqrestore(&queue->state_lock, flags); +	return ret; +} +  static void nvmet_rdma_recv_done(struct ib_cq *cq, struct ib_wc *wc)  {  	struct nvmet_rdma_cmd *cmd = @@ -1038,17 +1059,9 @@ static void nvmet_rdma_recv_done(struct ib_cq *cq, struct ib_wc *wc)  	rsp->n_rdma = 0;  	rsp->invalidate_rkey = 0; -	if (unlikely(queue->state != NVMET_RDMA_Q_LIVE)) { -		unsigned long flags; - -		spin_lock_irqsave(&queue->state_lock, flags); -		if (queue->state == NVMET_RDMA_Q_CONNECTING) -			list_add_tail(&rsp->wait_list, &queue->rsp_wait_list); -		else -			nvmet_rdma_put_rsp(rsp); -		spin_unlock_irqrestore(&queue->state_lock, flags); +	if (unlikely(queue->state != NVMET_RDMA_Q_LIVE) && +	    nvmet_rdma_recv_not_live(queue, rsp))  		return; -	}  	nvmet_rdma_handle_command(queue, rsp);  } | 
