Lines Matching defs:ctrl
149 static void nvme_remove_invalid_namespaces(struct nvme_ctrl *ctrl,
151 static void nvme_update_keep_alive(struct nvme_ctrl *ctrl,
154 void nvme_queue_scan(struct nvme_ctrl *ctrl)
159 if (nvme_ctrl_state(ctrl) == NVME_CTRL_LIVE && ctrl->tagset)
160 queue_work(nvme_wq, &ctrl->scan_work);
169 int nvme_try_sched_reset(struct nvme_ctrl *ctrl)
171 if (nvme_ctrl_state(ctrl) != NVME_CTRL_RESETTING)
173 if (!queue_work(nvme_reset_wq, &ctrl->reset_work))
181 struct nvme_ctrl *ctrl = container_of(to_delayed_work(work),
184 if (nvme_ctrl_state(ctrl) != NVME_CTRL_CONNECTING)
187 set_bit(NVME_CTRL_FAILFAST_EXPIRED, &ctrl->flags);
188 dev_info(ctrl->device, "failfast expired\n");
189 nvme_kick_requeue_lists(ctrl);
192 static inline void nvme_start_failfast_work(struct nvme_ctrl *ctrl)
194 if (!ctrl->opts || ctrl->opts->fast_io_fail_tmo == -1)
197 schedule_delayed_work(&ctrl->failfast_work,
198 ctrl->opts->fast_io_fail_tmo * HZ);
201 static inline void nvme_stop_failfast_work(struct nvme_ctrl *ctrl)
203 if (!ctrl->opts)
206 cancel_delayed_work_sync(&ctrl->failfast_work);
207 clear_bit(NVME_CTRL_FAILFAST_EXPIRED, &ctrl->flags);
211 int nvme_reset_ctrl(struct nvme_ctrl *ctrl)
213 if (!nvme_change_ctrl_state(ctrl, NVME_CTRL_RESETTING))
215 if (!queue_work(nvme_reset_wq, &ctrl->reset_work))
221 int nvme_reset_ctrl_sync(struct nvme_ctrl *ctrl)
225 ret = nvme_reset_ctrl(ctrl);
227 flush_work(&ctrl->reset_work);
228 if (nvme_ctrl_state(ctrl) != NVME_CTRL_LIVE)
235 static void nvme_do_delete_ctrl(struct nvme_ctrl *ctrl)
237 dev_info(ctrl->device,
238 "Removing ctrl: NQN \"%s\"\n", nvmf_ctrl_subsysnqn(ctrl));
240 flush_work(&ctrl->reset_work);
241 nvme_stop_ctrl(ctrl);
242 nvme_remove_namespaces(ctrl);
243 ctrl->ops->delete_ctrl(ctrl);
244 nvme_uninit_ctrl(ctrl);
249 struct nvme_ctrl *ctrl =
252 nvme_do_delete_ctrl(ctrl);
255 int nvme_delete_ctrl(struct nvme_ctrl *ctrl)
257 if (!nvme_change_ctrl_state(ctrl, NVME_CTRL_DELETING))
259 if (!queue_work(nvme_delete_wq, &ctrl->delete_work))
265 void nvme_delete_ctrl_sync(struct nvme_ctrl *ctrl)
271 nvme_get_ctrl(ctrl);
272 if (nvme_change_ctrl_state(ctrl, NVME_CTRL_DELETING))
273 nvme_do_delete_ctrl(ctrl);
274 nvme_put_ctrl(ctrl);
327 delay = nvme_req(req)->ctrl->crdt[crd - 1] * 100;
355 dev_name(nr->ctrl->device),
372 ns ? ns->disk->disk_name : dev_name(nr->ctrl->device),
456 struct nvme_ctrl *ctrl = nvme_req(req)->ctrl;
469 if (ctrl->kas &&
470 req->deadline - req->timeout >= ctrl->ka_last_check_time)
471 ctrl->comp_seen = true;
485 queue_work(nvme_wq, &ctrl->dhchap_auth_work);
534 void nvme_cancel_tagset(struct nvme_ctrl *ctrl)
536 if (ctrl->tagset) {
537 blk_mq_tagset_busy_iter(ctrl->tagset,
538 nvme_cancel_request, ctrl);
539 blk_mq_tagset_wait_completed_request(ctrl->tagset);
544 void nvme_cancel_admin_tagset(struct nvme_ctrl *ctrl)
546 if (ctrl->admin_tagset) {
547 blk_mq_tagset_busy_iter(ctrl->admin_tagset,
548 nvme_cancel_request, ctrl);
549 blk_mq_tagset_wait_completed_request(ctrl->admin_tagset);
554 bool nvme_change_ctrl_state(struct nvme_ctrl *ctrl,
561 spin_lock_irqsave(&ctrl->lock, flags);
563 old_state = nvme_ctrl_state(ctrl);
629 WRITE_ONCE(ctrl->state, new_state);
630 wake_up_all(&ctrl->state_wq);
633 spin_unlock_irqrestore(&ctrl->lock, flags);
639 nvme_stop_failfast_work(ctrl);
640 nvme_kick_requeue_lists(ctrl);
643 nvme_start_failfast_work(ctrl);
653 bool nvme_wait_reset(struct nvme_ctrl *ctrl)
655 wait_event(ctrl->state_wq,
656 nvme_change_ctrl_state(ctrl, NVME_CTRL_RESETTING) ||
657 nvme_state_terminal(ctrl));
658 return nvme_ctrl_state(ctrl) == NVME_CTRL_RESETTING;
690 nvme_put_ctrl(ns->ctrl);
725 logging_enabled = nr->ctrl->passthru_err_log_enabled;
752 blk_status_t nvme_fail_nonready_command(struct nvme_ctrl *ctrl,
755 enum nvme_ctrl_state state = nvme_ctrl_state(ctrl);
760 !test_bit(NVME_CTRL_FAILFAST_EXPIRED, &ctrl->flags) &&
767 bool __nvme_check_ready(struct nvme_ctrl *ctrl, struct request *rq,
780 if (rq->q == ctrl->admin_q && (req->flags & NVME_REQ_USERCMD))
783 if (ctrl->ops->flags & NVME_F_FABRICS) {
837 if (test_and_set_bit_lock(0, &ns->ctrl->discard_page_busy))
840 range = page_address(ns->ctrl->discard_page);
867 if (virt_to_page(range) == ns->ctrl->discard_page)
868 clear_bit_unlock(0, &ns->ctrl->discard_page_busy);
921 if (ns->ctrl->quirks & NVME_QUIRK_DEALLOCATE_ZEROES)
1046 struct nvme_ctrl *ctrl = nvme_req(req)->ctrl;
1048 if (req->special_vec.bv_page == ctrl->discard_page)
1049 clear_bit_unlock(0, &ctrl->discard_page_busy);
1182 u32 nvme_command_effects(struct nvme_ctrl *ctrl, struct nvme_ns *ns, u8 opcode)
1189 dev_warn_once(ctrl->device,
1200 effects = le32_to_cpu(ctrl->effects->acs[opcode]);
1211 u32 nvme_passthru_start(struct nvme_ctrl *ctrl, struct nvme_ns *ns, u8 opcode)
1213 u32 effects = nvme_command_effects(ctrl, ns, opcode);
1220 mutex_lock(&ctrl->scan_lock);
1221 mutex_lock(&ctrl->subsys->lock);
1222 nvme_mpath_start_freeze(ctrl->subsys);
1223 nvme_mpath_wait_freeze(ctrl->subsys);
1224 nvme_start_freeze(ctrl);
1225 nvme_wait_freeze(ctrl);
1231 void nvme_passthru_end(struct nvme_ctrl *ctrl, struct nvme_ns *ns, u32 effects,
1235 nvme_unfreeze(ctrl);
1236 nvme_mpath_unfreeze(ctrl->subsys);
1237 mutex_unlock(&ctrl->subsys->lock);
1238 mutex_unlock(&ctrl->scan_lock);
1242 &ctrl->flags)) {
1243 dev_info(ctrl->device,
1248 nvme_queue_scan(ctrl);
1249 flush_work(&ctrl->scan_work);
1264 nvme_update_keep_alive(ctrl, cmd);
1282 static unsigned long nvme_keep_alive_work_period(struct nvme_ctrl *ctrl)
1284 unsigned long delay = ctrl->kato * HZ / 2;
1292 if (ctrl->ctratt & NVME_CTRL_ATTR_TBKAS)
1297 static void nvme_queue_keep_alive_work(struct nvme_ctrl *ctrl)
1300 unsigned long delay = nvme_keep_alive_work_period(ctrl);
1301 unsigned long ka_next_check_tm = ctrl->ka_last_check_time + delay;
1308 queue_delayed_work(nvme_wq, &ctrl->ka_work, delay);
1314 struct nvme_ctrl *ctrl = rq->end_io_data;
1316 unsigned long delay = nvme_keep_alive_work_period(ctrl);
1317 enum nvme_ctrl_state state = nvme_ctrl_state(ctrl);
1326 dev_warn(ctrl->device, "long keepalive RTT (%u ms)\n",
1334 dev_err(ctrl->device,
1340 ctrl->ka_last_check_time = jiffies;
1341 ctrl->comp_seen = false;
1343 queue_delayed_work(nvme_wq, &ctrl->ka_work, delay);
1349 struct nvme_ctrl *ctrl = container_of(to_delayed_work(work),
1351 bool comp_seen = ctrl->comp_seen;
1354 ctrl->ka_last_check_time = jiffies;
1356 if ((ctrl->ctratt & NVME_CTRL_ATTR_TBKAS) && comp_seen) {
1357 dev_dbg(ctrl->device,
1359 ctrl->comp_seen = false;
1360 nvme_queue_keep_alive_work(ctrl);
1364 rq = blk_mq_alloc_request(ctrl->admin_q, nvme_req_op(&ctrl->ka_cmd),
1368 dev_err(ctrl->device, "keep-alive failed: %ld\n", PTR_ERR(rq));
1369 nvme_reset_ctrl(ctrl);
1372 nvme_init_request(rq, &ctrl->ka_cmd);
1374 rq->timeout = ctrl->kato * HZ;
1376 rq->end_io_data = ctrl;
1380 static void nvme_start_keep_alive(struct nvme_ctrl *ctrl)
1382 if (unlikely(ctrl->kato == 0))
1385 nvme_queue_keep_alive_work(ctrl);
1388 void nvme_stop_keep_alive(struct nvme_ctrl *ctrl)
1390 if (unlikely(ctrl->kato == 0))
1393 cancel_delayed_work_sync(&ctrl->ka_work);
1397 static void nvme_update_keep_alive(struct nvme_ctrl *ctrl,
1403 dev_info(ctrl->device,
1405 ctrl->kato * 1000 / 2, new_kato * 1000 / 2);
1407 nvme_stop_keep_alive(ctrl);
1408 ctrl->kato = new_kato;
1409 nvme_start_keep_alive(ctrl);
1412 static bool nvme_id_cns_ok(struct nvme_ctrl *ctrl, u8 cns)
1417 if (ctrl->vs >= NVME_VS(1, 2, 0))
1428 if (ctrl->vs >= NVME_VS(1, 1, 0) &&
1429 !(ctrl->quirks & NVME_QUIRK_IDENTIFY_CNS))
1460 static int nvme_process_ns_desc(struct nvme_ctrl *ctrl, struct nvme_ns_ids *ids,
1463 const char *warn_str = "ctrl returned bogus length:";
1469 dev_warn(ctrl->device, "%s %d for NVME_NIDT_EUI64\n",
1473 if (ctrl->quirks & NVME_QUIRK_BOGUS_NID)
1479 dev_warn(ctrl->device, "%s %d for NVME_NIDT_NGUID\n",
1483 if (ctrl->quirks & NVME_QUIRK_BOGUS_NID)
1489 dev_warn(ctrl->device, "%s %d for NVME_NIDT_UUID\n",
1493 if (ctrl->quirks & NVME_QUIRK_BOGUS_NID)
1499 dev_warn(ctrl->device, "%s %d for NVME_NIDT_CSI\n",
1512 static int nvme_identify_ns_descs(struct nvme_ctrl *ctrl,
1520 if (ctrl->vs < NVME_VS(1, 3, 0) && !nvme_multi_css(ctrl))
1522 if (ctrl->quirks & NVME_QUIRK_NO_NS_DESC_LIST)
1533 status = nvme_submit_sync_cmd(ctrl->admin_q, &c, data,
1536 dev_warn(ctrl->device,
1548 len = nvme_process_ns_desc(ctrl, &info->ids, cur, &csi_seen);
1555 if (nvme_multi_css(ctrl) && !csi_seen) {
1556 dev_warn(ctrl->device, "Command set not reported for nsid:%d\n",
1566 int nvme_identify_ns(struct nvme_ctrl *ctrl, unsigned nsid,
1581 error = nvme_submit_sync_cmd(ctrl->admin_q, &c, *id, sizeof(**id));
1583 dev_warn(ctrl->device, "Identify namespace failed (%d)\n", error);
1590 static int nvme_ns_info_from_identify(struct nvme_ctrl *ctrl,
1597 ret = nvme_identify_ns(ctrl, info->nsid, &id);
1612 if (ctrl->quirks & NVME_QUIRK_BOGUS_NID) {
1613 dev_info(ctrl->device,
1616 if (ctrl->vs >= NVME_VS(1, 1, 0) &&
1619 if (ctrl->vs >= NVME_VS(1, 2, 0) &&
1629 static int nvme_ns_info_from_id_cs_indep(struct nvme_ctrl *ctrl,
1644 ret = nvme_submit_sync_cmd(ctrl->admin_q, &c, id, sizeof(*id));
1693 int nvme_set_queue_count(struct nvme_ctrl *ctrl, int *count)
1699 status = nvme_set_features(ctrl, NVME_FEAT_NUM_QUEUES, q_count, NULL, 0,
1716 dev_err(ctrl->device, "Could not set queue count (%d)\n", status);
1731 static void nvme_enable_aen(struct nvme_ctrl *ctrl)
1733 u32 result, supported_aens = ctrl->oaes & NVME_AEN_SUPPORTED;
1739 status = nvme_set_features(ctrl, NVME_FEAT_ASYNC_EVENT, supported_aens,
1742 dev_warn(ctrl->device, "Failed to configure AEN (cfg %x)\n",
1745 queue_work(nvme_wq, &ctrl->async_event_work);
1756 if (!try_module_get(ns->ctrl->ops->module))
1770 module_put(ns->ctrl->ops->module);
1858 struct nvme_ctrl *ctrl = ns->ctrl;
1860 if (ctrl->dmrsl && ctrl->dmrsl <= nvme_sect_to_lba(ns->head, UINT_MAX))
1862 nvme_lba_to_sect(ns->head, ctrl->dmrsl);
1863 else if (ctrl->oncs & NVME_CTRL_ONCS_DSM)
1870 if (ctrl->dmrl)
1871 lim->max_discard_segments = ctrl->dmrl;
1884 static int nvme_identify_ns_nvm(struct nvme_ctrl *ctrl, unsigned int nsid,
1900 ret = nvme_submit_sync_cmd(ctrl->admin_q, &c, nvm, sizeof(*nvm));
1936 static void nvme_configure_metadata(struct nvme_ctrl *ctrl,
1944 if (!head->ms || !(ctrl->ops->flags & NVME_F_METADATA_SUPPORTED))
1947 if (nvm && (ctrl->ctratt & NVME_CTRL_ATTR_ELBAS)) {
1963 if (ctrl->ops->flags & NVME_F_FABRICS) {
1983 if (ctrl->max_integrity_segments && nvme_ns_has_pi(head))
2017 static u32 nvme_max_drv_segments(struct nvme_ctrl *ctrl)
2019 return ctrl->max_hw_sectors / (NVME_CTRL_PAGE_SIZE >> SECTOR_SHIFT) + 1;
2022 static void nvme_set_ctrl_limits(struct nvme_ctrl *ctrl,
2025 lim->max_hw_sectors = ctrl->max_hw_sectors;
2027 min_not_zero(nvme_max_drv_segments(ctrl), ctrl->max_segments));
2028 lim->max_integrity_segments = ctrl->max_integrity_segments;
2062 atomic_bs = (1 + ns->ctrl->subsys->awupf) * bs;
2084 if ((ns->ctrl->quirks & NVME_QUIRK_DEALLOCATE_ZEROES) &&
2085 (ns->ctrl->oncs & NVME_CTRL_ONCS_DSM))
2088 lim->max_write_zeroes_sectors = ns->ctrl->max_zeroes_sectors;
2106 struct nvme_ctrl *ctrl = ns->ctrl;
2109 if ((ctrl->quirks & NVME_QUIRK_STRIPE_SIZE) &&
2110 is_power_of_2(ctrl->max_hw_sectors))
2111 iob = ctrl->max_hw_sectors;
2143 nvme_set_ctrl_limits(ns->ctrl, &lim);
2168 ret = nvme_identify_ns(ns->ctrl, info->nsid, &id);
2180 if (ns->ctrl->ctratt & NVME_CTRL_ATTR_ELBAS) {
2181 ret = nvme_identify_ns_nvm(ns->ctrl, info->nsid, &nvm);
2199 nvme_set_ctrl_limits(ns->ctrl, &lim);
2200 nvme_configure_metadata(ns->ctrl, ns->head, id, nvm, info);
2209 if ((ns->ctrl->vwc & NVME_CTRL_VWC_PRESENT) && !info->no_vwc)
2267 dev_info(ns->ctrl->device,
2279 dev_info(ns->ctrl->device,
2371 struct nvme_ctrl *ctrl = data;
2382 return __nvme_submit_sync_cmd(ctrl->admin_q, &cmd, NULL, buffer, len,
2386 static void nvme_configure_opal(struct nvme_ctrl *ctrl, bool was_suspended)
2388 if (ctrl->oacs & NVME_CTRL_OACS_SEC_SUPP) {
2389 if (!ctrl->opal_dev)
2390 ctrl->opal_dev = init_opal_dev(ctrl, &nvme_sec_submit);
2392 opal_unlock_from_suspend(ctrl->opal_dev);
2394 free_opal_dev(ctrl->opal_dev);
2395 ctrl->opal_dev = NULL;
2399 static void nvme_configure_opal(struct nvme_ctrl *ctrl, bool was_suspended)
2427 static int nvme_wait_ready(struct nvme_ctrl *ctrl, u32 mask, u32 val,
2434 while ((ret = ctrl->ops->reg_read32(ctrl, NVME_REG_CSTS, &csts)) == 0) {
2444 dev_err(ctrl->device,
2454 int nvme_disable_ctrl(struct nvme_ctrl *ctrl, bool shutdown)
2458 ctrl->ctrl_config &= ~NVME_CC_SHN_MASK;
2460 ctrl->ctrl_config |= NVME_CC_SHN_NORMAL;
2462 ctrl->ctrl_config &= ~NVME_CC_ENABLE;
2464 ret = ctrl->ops->reg_write32(ctrl, NVME_REG_CC, ctrl->ctrl_config);
2469 return nvme_wait_ready(ctrl, NVME_CSTS_SHST_MASK,
2471 ctrl->shutdown_timeout, "shutdown");
2473 if (ctrl->quirks & NVME_QUIRK_DELAY_BEFORE_CHK_RDY)
2475 return nvme_wait_ready(ctrl, NVME_CSTS_RDY, 0,
2476 (NVME_CAP_TIMEOUT(ctrl->cap) + 1) / 2, "reset");
2480 int nvme_enable_ctrl(struct nvme_ctrl *ctrl)
2486 ret = ctrl->ops->reg_read64(ctrl, NVME_REG_CAP, &ctrl->cap);
2488 dev_err(ctrl->device, "Reading CAP failed (%d)\n", ret);
2491 dev_page_min = NVME_CAP_MPSMIN(ctrl->cap) + 12;
2494 dev_err(ctrl->device,
2500 if (NVME_CAP_CSS(ctrl->cap) & NVME_CAP_CSS_CSI)
2501 ctrl->ctrl_config = NVME_CC_CSS_CSI;
2503 ctrl->ctrl_config = NVME_CC_CSS_NVM;
2511 ctrl->ctrl_config &= ~NVME_CC_CRIME;
2513 ctrl->ctrl_config |= (NVME_CTRL_PAGE_SHIFT - 12) << NVME_CC_MPS_SHIFT;
2514 ctrl->ctrl_config |= NVME_CC_AMS_RR | NVME_CC_SHN_NONE;
2515 ctrl->ctrl_config |= NVME_CC_IOSQES | NVME_CC_IOCQES;
2516 ret = ctrl->ops->reg_write32(ctrl, NVME_REG_CC, ctrl->ctrl_config);
2521 ret = ctrl->ops->reg_read64(ctrl, NVME_REG_CAP, &ctrl->cap);
2525 timeout = NVME_CAP_TIMEOUT(ctrl->cap);
2526 if (ctrl->cap & NVME_CAP_CRMS_CRWMS) {
2529 ret = ctrl->ops->reg_read32(ctrl, NVME_REG_CRTO, &crto);
2531 dev_err(ctrl->device, "Reading CRTO failed (%d)\n",
2544 dev_warn_once(ctrl->device, "bad crto:%x cap:%llx\n",
2545 crto, ctrl->cap);
2550 ctrl->ctrl_config |= NVME_CC_ENABLE;
2551 ret = ctrl->ops->reg_write32(ctrl, NVME_REG_CC, ctrl->ctrl_config);
2554 return nvme_wait_ready(ctrl, NVME_CSTS_RDY, NVME_CSTS_RDY,
2559 static int nvme_configure_timestamp(struct nvme_ctrl *ctrl)
2564 if (!(ctrl->oncs & NVME_CTRL_ONCS_TIMESTAMP))
2568 ret = nvme_set_features(ctrl, NVME_FEAT_TIMESTAMP, 0, &ts, sizeof(ts),
2571 dev_warn_once(ctrl->device,
2576 static int nvme_configure_host_options(struct nvme_ctrl *ctrl)
2583 if (ctrl->crdt[0])
2585 if (ctrl->ctratt & NVME_CTRL_ATTR_ELBAS)
2597 ret = nvme_set_features(ctrl, NVME_FEAT_HOST_BEHAVIOR, 0,
2657 static int nvme_configure_apst(struct nvme_ctrl *ctrl)
2672 if (!ctrl->apsta)
2675 if (ctrl->npss > 31) {
2676 dev_warn(ctrl->device, "NPSS is invalid; not using APST\n");
2684 if (!ctrl->apst_enabled || ctrl->ps_max_latency_us == 0) {
2686 dev_dbg(ctrl->device, "APST disabled\n");
2696 for (state = (int)ctrl->npss; state >= 0; state--) {
2706 if (state == ctrl->npss &&
2707 (ctrl->quirks & NVME_QUIRK_NO_DEEPEST_PS))
2714 if (!(ctrl->psd[state].flags & NVME_PS_FLAGS_NON_OP_STATE))
2717 exit_latency_us = (u64)le32_to_cpu(ctrl->psd[state].exit_lat);
2718 if (exit_latency_us > ctrl->ps_max_latency_us)
2722 le32_to_cpu(ctrl->psd[state].entry_lat);
2747 dev_dbg(ctrl->device, "APST enabled but no non-operational states are available\n");
2749 dev_dbg(ctrl->device, "APST enabled: max PS = %d, max round-trip latency = %lluus, table = %*phN\n",
2754 ret = nvme_set_features(ctrl, NVME_FEAT_AUTO_PST, apste,
2757 dev_err(ctrl->device, "failed to set APST feature (%d)\n", ret);
2764 struct nvme_ctrl *ctrl = dev_get_drvdata(dev);
2777 if (ctrl->ps_max_latency_us != latency) {
2778 ctrl->ps_max_latency_us = latency;
2779 if (nvme_ctrl_state(ctrl) == NVME_CTRL_LIVE)
2780 nvme_configure_apst(ctrl);
2875 static void nvme_init_subnqn(struct nvme_subsystem *subsys, struct nvme_ctrl *ctrl,
2881 if (!(ctrl->quirks & NVME_QUIRK_IGNORE_DEV_SUBNQN)) {
2888 if (ctrl->vs >= NVME_VS(1, 2, 1))
2889 dev_warn(ctrl->device, "missing or invalid SUBNQN field.\n");
2964 static inline bool nvme_discovery_ctrl(struct nvme_ctrl *ctrl)
2966 return ctrl->opts && ctrl->opts->discovery_nqn;
2970 struct nvme_ctrl *ctrl, struct nvme_id_ctrl *id)
2980 if (tmp->cntlid == ctrl->cntlid) {
2981 dev_err(ctrl->device,
2983 ctrl->cntlid, dev_name(tmp->device),
2989 nvme_discovery_ctrl(ctrl))
2992 dev_err(ctrl->device,
3000 static int nvme_init_subsystem(struct nvme_ctrl *ctrl, struct nvme_id_ctrl *id)
3014 nvme_init_subnqn(subsys, ctrl, id);
3027 if (nvme_discovery_ctrl(ctrl) && subsys->subtype != NVME_NQN_DISC) {
3028 dev_err(ctrl->device,
3040 dev_set_name(&subsys->dev, "nvme-subsys%d", ctrl->instance);
3049 if (!nvme_validate_cntlid(subsys, ctrl, id)) {
3056 dev_err(ctrl->device,
3065 ret = sysfs_create_link(&subsys->dev.kobj, &ctrl->device->kobj,
3066 dev_name(ctrl->device));
3068 dev_err(ctrl->device,
3074 subsys->instance = ctrl->instance;
3075 ctrl->subsys = subsys;
3076 list_add_tail(&ctrl->subsys_entry, &subsys->ctrls);
3087 int nvme_get_log(struct nvme_ctrl *ctrl, u32 nsid, u8 log_page, u8 lsp, u8 csi,
3103 return nvme_submit_sync_cmd(ctrl->admin_q, &c, log, size);
3106 static int nvme_get_effects_log(struct nvme_ctrl *ctrl, u8 csi,
3109 struct nvme_effects_log *old, *cel = xa_load(&ctrl->cels, csi);
3119 ret = nvme_get_log(ctrl, 0x00, NVME_LOG_CMD_EFFECTS, 0, csi,
3126 old = xa_store(&ctrl->cels, csi, cel, GFP_KERNEL);
3136 static inline u32 nvme_mps_to_sectors(struct nvme_ctrl *ctrl, u32 units)
3138 u32 page_shift = NVME_CAP_MPSMIN(ctrl->cap) + 12, val;
3145 static int nvme_init_non_mdts_limits(struct nvme_ctrl *ctrl)
3157 if ((ctrl->oncs & NVME_CTRL_ONCS_WRITE_ZEROES) &&
3158 !(ctrl->quirks & NVME_QUIRK_DISABLE_WRITE_ZEROES))
3159 ctrl->max_zeroes_sectors = ctrl->max_hw_sectors;
3161 ctrl->max_zeroes_sectors = 0;
3163 if (ctrl->subsys->subtype != NVME_NQN_NVME ||
3164 !nvme_id_cns_ok(ctrl, NVME_ID_CNS_CS_CTRL) ||
3165 test_bit(NVME_CTRL_SKIP_ID_CNS_CS, &ctrl->flags))
3176 ret = nvme_submit_sync_cmd(ctrl->admin_q, &c, id, sizeof(*id));
3180 ctrl->dmrl = id->dmrl;
3181 ctrl->dmrsl = le32_to_cpu(id->dmrsl);
3183 ctrl->max_zeroes_sectors = nvme_mps_to_sectors(ctrl, id->wzsl);
3187 set_bit(NVME_CTRL_SKIP_ID_CNS_CS, &ctrl->flags);
3192 static int nvme_init_effects_log(struct nvme_ctrl *ctrl,
3201 old = xa_store(&ctrl->cels, csi, effects, GFP_KERNEL);
3211 static void nvme_init_known_nvm_effects(struct nvme_ctrl *ctrl)
3213 struct nvme_effects_log *log = ctrl->effects;
3243 static int nvme_init_effects(struct nvme_ctrl *ctrl, struct nvme_id_ctrl *id)
3247 if (ctrl->effects)
3251 ret = nvme_get_effects_log(ctrl, NVME_CSI_NVM, &ctrl->effects);
3256 if (!ctrl->effects) {
3257 ret = nvme_init_effects_log(ctrl, NVME_CSI_NVM, &ctrl->effects);
3262 nvme_init_known_nvm_effects(ctrl);
3266 static int nvme_check_ctrl_fabric_info(struct nvme_ctrl *ctrl, struct nvme_id_ctrl *id)
3272 if (ctrl->cntlid != le16_to_cpu(id->cntlid)) {
3273 dev_err(ctrl->device,
3275 ctrl->cntlid, le16_to_cpu(id->cntlid));
3279 if (!nvme_discovery_ctrl(ctrl) && !ctrl->kas) {
3280 dev_err(ctrl->device,
3285 if (!nvme_discovery_ctrl(ctrl) && ctrl->ioccsz < 4) {
3286 dev_err(ctrl->device,
3288 ctrl->ioccsz);
3292 if (!nvme_discovery_ctrl(ctrl) && ctrl->iorcsz < 1) {
3293 dev_err(ctrl->device,
3295 ctrl->iorcsz);
3299 if (!ctrl->maxcmd) {
3300 dev_warn(ctrl->device,
3302 ctrl->maxcmd = ctrl->sqsize + 1;
3308 static int nvme_init_identify(struct nvme_ctrl *ctrl)
3316 ret = nvme_identify_ctrl(ctrl, &id);
3318 dev_err(ctrl->device, "Identify Controller failed (%d)\n", ret);
3322 if (!(ctrl->ops->flags & NVME_F_FABRICS))
3323 ctrl->cntlid = le16_to_cpu(id->cntlid);
3325 if (!ctrl->identified) {
3338 ctrl->quirks |= core_quirks[i].quirks;
3341 ret = nvme_init_subsystem(ctrl, id);
3345 ret = nvme_init_effects(ctrl, id);
3349 memcpy(ctrl->subsys->firmware_rev, id->fr,
3350 sizeof(ctrl->subsys->firmware_rev));
3352 if (force_apst && (ctrl->quirks & NVME_QUIRK_NO_DEEPEST_PS)) {
3353 dev_warn(ctrl->device, "forcibly allowing all power states due to nvme_core.force_apst -- use at your own risk\n");
3354 ctrl->quirks &= ~NVME_QUIRK_NO_DEEPEST_PS;
3357 ctrl->crdt[0] = le16_to_cpu(id->crdt1);
3358 ctrl->crdt[1] = le16_to_cpu(id->crdt2);
3359 ctrl->crdt[2] = le16_to_cpu(id->crdt3);
3361 ctrl->oacs = le16_to_cpu(id->oacs);
3362 ctrl->oncs = le16_to_cpu(id->oncs);
3363 ctrl->mtfa = le16_to_cpu(id->mtfa);
3364 ctrl->oaes = le32_to_cpu(id->oaes);
3365 ctrl->wctemp = le16_to_cpu(id->wctemp);
3366 ctrl->cctemp = le16_to_cpu(id->cctemp);
3368 atomic_set(&ctrl->abort_limit, id->acl + 1);
3369 ctrl->vwc = id->vwc;
3371 max_hw_sectors = nvme_mps_to_sectors(ctrl, id->mdts);
3374 ctrl->max_hw_sectors =
3375 min_not_zero(ctrl->max_hw_sectors, max_hw_sectors);
3377 lim = queue_limits_start_update(ctrl->admin_q);
3378 nvme_set_ctrl_limits(ctrl, &lim);
3379 ret = queue_limits_commit_update(ctrl->admin_q, &lim);
3383 ctrl->sgls = le32_to_cpu(id->sgls);
3384 ctrl->kas = le16_to_cpu(id->kas);
3385 ctrl->max_namespaces = le32_to_cpu(id->mnan);
3386 ctrl->ctratt = le32_to_cpu(id->ctratt);
3388 ctrl->cntrltype = id->cntrltype;
3389 ctrl->dctype = id->dctype;
3395 ctrl->shutdown_timeout = clamp_t(unsigned int, transition_time,
3398 if (ctrl->shutdown_timeout != shutdown_timeout)
3399 dev_info(ctrl->device,
3401 ctrl->shutdown_timeout);
3403 ctrl->shutdown_timeout = shutdown_timeout;
3405 ctrl->npss = id->npss;
3406 ctrl->apsta = id->apsta;
3407 prev_apst_enabled = ctrl->apst_enabled;
3408 if (ctrl->quirks & NVME_QUIRK_NO_APST) {
3410 dev_warn(ctrl->device, "forcibly allowing APST due to nvme_core.force_apst -- use at your own risk\n");
3411 ctrl->apst_enabled = true;
3413 ctrl->apst_enabled = false;
3416 ctrl->apst_enabled = id->apsta;
3418 memcpy(ctrl->psd, id->psd, sizeof(ctrl->psd));
3420 if (ctrl->ops->flags & NVME_F_FABRICS) {
3421 ctrl->icdoff = le16_to_cpu(id->icdoff);
3422 ctrl->ioccsz = le32_to_cpu(id->ioccsz);
3423 ctrl->iorcsz = le32_to_cpu(id->iorcsz);
3424 ctrl->maxcmd = le16_to_cpu(id->maxcmd);
3426 ret = nvme_check_ctrl_fabric_info(ctrl, id);
3430 ctrl->hmpre = le32_to_cpu(id->hmpre);
3431 ctrl->hmmin = le32_to_cpu(id->hmmin);
3432 ctrl->hmminds = le32_to_cpu(id->hmminds);
3433 ctrl->hmmaxd = le16_to_cpu(id->hmmaxd);
3436 ret = nvme_mpath_init_identify(ctrl, id);
3440 if (ctrl->apst_enabled && !prev_apst_enabled)
3441 dev_pm_qos_expose_latency_tolerance(ctrl->device);
3442 else if (!ctrl->apst_enabled && prev_apst_enabled)
3443 dev_pm_qos_hide_latency_tolerance(ctrl->device);
3455 int nvme_init_ctrl_finish(struct nvme_ctrl *ctrl, bool was_suspended)
3459 ret = ctrl->ops->reg_read32(ctrl, NVME_REG_VS, &ctrl->vs);
3461 dev_err(ctrl->device, "Reading VS failed (%d)\n", ret);
3465 ctrl->sqsize = min_t(u16, NVME_CAP_MQES(ctrl->cap), ctrl->sqsize);
3467 if (ctrl->vs >= NVME_VS(1, 1, 0))
3468 ctrl->subsystem = NVME_CAP_NSSRC(ctrl->cap);
3470 ret = nvme_init_identify(ctrl);
3474 ret = nvme_configure_apst(ctrl);
3478 ret = nvme_configure_timestamp(ctrl);
3482 ret = nvme_configure_host_options(ctrl);
3486 nvme_configure_opal(ctrl, was_suspended);
3488 if (!ctrl->identified && !nvme_discovery_ctrl(ctrl)) {
3493 ret = nvme_hwmon_init(ctrl);
3498 clear_bit(NVME_CTRL_DIRTY_CAPABILITY, &ctrl->flags);
3499 ctrl->identified = true;
3501 nvme_start_keep_alive(ctrl);
3509 struct nvme_ctrl *ctrl =
3512 switch (nvme_ctrl_state(ctrl)) {
3519 nvme_get_ctrl(ctrl);
3520 if (!try_module_get(ctrl->ops->module)) {
3521 nvme_put_ctrl(ctrl);
3525 file->private_data = ctrl;
3531 struct nvme_ctrl *ctrl =
3534 module_put(ctrl->ops->module);
3535 nvme_put_ctrl(ctrl);
3548 static struct nvme_ns_head *nvme_find_ns_head(struct nvme_ctrl *ctrl,
3553 lockdep_assert_held(&ctrl->subsys->lock);
3555 list_for_each_entry(h, &ctrl->subsys->nsheads, entry) {
3561 if (h->ns_id != nsid || !nvme_is_unique_nsid(ctrl, h))
3651 ns->cdev_device.parent = ns->ctrl->device;
3653 ns->ctrl->instance, ns->head->instance);
3658 ns->ctrl->ops->module);
3661 static struct nvme_ns_head *nvme_alloc_ns_head(struct nvme_ctrl *ctrl,
3675 ret = ida_alloc_min(&ctrl->subsys->ns_ida, 1, GFP_KERNEL);
3683 head->subsys = ctrl->subsys;
3693 ret = nvme_get_effects_log(ctrl, head->ids.csi, &head->effects);
3697 head->effects = ctrl->effects;
3699 ret = nvme_mpath_alloc_disk(ctrl, head);
3703 list_add_tail(&head->entry, &ctrl->subsys->nsheads);
3705 kref_get(&ctrl->subsys->ref);
3711 ida_free(&ctrl->subsys->ns_ida, head->instance);
3748 struct nvme_ctrl *ctrl = ns->ctrl;
3752 ret = nvme_global_check_duplicate_ids(ctrl->subsys, &info->ids);
3770 nvme_print_device_info(ctrl);
3771 if ((ns->ctrl->ops->flags & NVME_F_FABRICS) || /* !PCIe */
3772 ((ns->ctrl->subsys->cmic & NVME_CTRL_CMIC_MULTI_CTRL) &&
3774 dev_err(ctrl->device,
3780 dev_err(ctrl->device,
3782 dev_err(ctrl->device,
3787 ctrl->quirks |= NVME_QUIRK_BOGUS_NID;
3790 mutex_lock(&ctrl->subsys->lock);
3791 head = nvme_find_ns_head(ctrl, info->nsid);
3793 ret = nvme_subsys_check_duplicate_ids(ctrl->subsys, &info->ids);
3795 dev_err(ctrl->device,
3800 head = nvme_alloc_ns_head(ctrl, info);
3808 dev_err(ctrl->device,
3814 dev_err(ctrl->device,
3821 dev_warn(ctrl->device,
3824 dev_warn_once(ctrl->device,
3831 mutex_unlock(&ctrl->subsys->lock);
3837 mutex_unlock(&ctrl->subsys->lock);
3841 struct nvme_ns *nvme_find_get_ns(struct nvme_ctrl *ctrl, unsigned nsid)
3846 srcu_idx = srcu_read_lock(&ctrl->srcu);
3847 list_for_each_entry_srcu(ns, &ctrl->namespaces, list,
3848 srcu_read_lock_held(&ctrl->srcu)) {
3858 srcu_read_unlock(&ctrl->srcu, srcu_idx);
3870 list_for_each_entry_reverse(tmp, &ns->ctrl->namespaces, list) {
3876 list_add(&ns->list, &ns->ctrl->namespaces);
3879 static void nvme_alloc_ns(struct nvme_ctrl *ctrl, struct nvme_ns_info *info)
3884 int node = ctrl->numa_node;
3890 if (ctrl->opts && ctrl->opts->data_digest)
3892 if (ctrl->ops->supports_pci_p2pdma &&
3893 ctrl->ops->supports_pci_p2pdma(ctrl))
3896 disk = blk_mq_alloc_disk(ctrl->tagset, &lim, ns);
3904 ns->ctrl = ctrl;
3922 sprintf(disk->disk_name, "nvme%dc%dn%d", ctrl->subsys->instance,
3923 ctrl->instance, ns->head->instance);
3926 sprintf(disk->disk_name, "nvme%dn%d", ctrl->subsys->instance,
3929 sprintf(disk->disk_name, "nvme%dn%d", ctrl->instance,
3936 mutex_lock(&ctrl->namespaces_lock);
3938 * Ensure that no namespaces are added to the ctrl list after the queues
3941 if (test_bit(NVME_CTRL_FROZEN, &ctrl->flags)) {
3942 mutex_unlock(&ctrl->namespaces_lock);
3946 mutex_unlock(&ctrl->namespaces_lock);
3947 synchronize_srcu(&ctrl->srcu);
3948 nvme_get_ctrl(ctrl);
3950 if (device_add_disk(ctrl->device, ns->disk, nvme_ns_attr_groups))
3969 nvme_put_ctrl(ctrl);
3970 mutex_lock(&ctrl->namespaces_lock);
3972 mutex_unlock(&ctrl->namespaces_lock);
3973 synchronize_srcu(&ctrl->srcu);
3975 mutex_lock(&ctrl->subsys->lock);
3979 mutex_unlock(&ctrl->subsys->lock);
4008 mutex_lock(&ns->ctrl->subsys->lock);
4014 mutex_unlock(&ns->ctrl->subsys->lock);
4023 mutex_lock(&ns->ctrl->namespaces_lock);
4025 mutex_unlock(&ns->ctrl->namespaces_lock);
4026 synchronize_srcu(&ns->ctrl->srcu);
4033 static void nvme_ns_remove_by_nsid(struct nvme_ctrl *ctrl, u32 nsid)
4035 struct nvme_ns *ns = nvme_find_get_ns(ctrl, nsid);
4048 dev_err(ns->ctrl->device,
4065 static void nvme_scan_ns(struct nvme_ctrl *ctrl, unsigned nsid)
4071 if (nvme_identify_ns_descs(ctrl, &info))
4074 if (info.ids.csi != NVME_CSI_NVM && !nvme_multi_css(ctrl)) {
4075 dev_warn(ctrl->device,
4085 if ((ctrl->cap & NVME_CAP_CRMS_CRIMS) ||
4087 ctrl->vs >= NVME_VS(2, 0, 0))
4088 ret = nvme_ns_info_from_id_cs_indep(ctrl, &info);
4090 ret = nvme_ns_info_from_identify(ctrl, &info);
4093 nvme_ns_remove_by_nsid(ctrl, nsid);
4102 ns = nvme_find_get_ns(ctrl, nsid);
4107 nvme_alloc_ns(ctrl, &info);
4113 * @ctrl: Controller on which namespaces are being scanned
4123 struct nvme_ctrl *ctrl;
4137 nvme_scan_ns(scan_info->ctrl, nsid);
4140 static void nvme_remove_invalid_namespaces(struct nvme_ctrl *ctrl,
4146 mutex_lock(&ctrl->namespaces_lock);
4147 list_for_each_entry_safe(ns, next, &ctrl->namespaces, list) {
4150 synchronize_srcu(&ctrl->srcu);
4154 mutex_unlock(&ctrl->namespaces_lock);
4160 static int nvme_scan_ns_list(struct nvme_ctrl *ctrl)
4173 scan_info.ctrl = ctrl;
4182 ret = nvme_submit_sync_cmd(ctrl->admin_q, &cmd, ns_list,
4185 dev_warn(ctrl->device,
4199 nvme_ns_remove_by_nsid(ctrl, prev);
4204 nvme_remove_invalid_namespaces(ctrl, prev);
4211 static void nvme_scan_ns_sequential(struct nvme_ctrl *ctrl)
4216 if (nvme_identify_ctrl(ctrl, &id))
4222 nvme_scan_ns(ctrl, i);
4224 nvme_remove_invalid_namespaces(ctrl, nn);
4227 static void nvme_clear_changed_ns_log(struct nvme_ctrl *ctrl)
4243 error = nvme_get_log(ctrl, NVME_NSID_ALL, NVME_LOG_CHANGED_NS, 0,
4246 dev_warn(ctrl->device,
4254 struct nvme_ctrl *ctrl =
4258 /* No tagset on a live ctrl means IO queues could not be created */
4259 if (nvme_ctrl_state(ctrl) != NVME_CTRL_LIVE || !ctrl->tagset)
4269 ret = nvme_init_non_mdts_limits(ctrl);
4271 dev_warn(ctrl->device,
4276 if (test_and_clear_bit(NVME_AER_NOTICE_NS_CHANGED, &ctrl->events)) {
4277 dev_info(ctrl->device, "rescanning namespaces.\n");
4278 nvme_clear_changed_ns_log(ctrl);
4281 mutex_lock(&ctrl->scan_lock);
4282 if (!nvme_id_cns_ok(ctrl, NVME_ID_CNS_NS_ACTIVE_LIST)) {
4283 nvme_scan_ns_sequential(ctrl);
4290 ret = nvme_scan_ns_list(ctrl);
4292 nvme_scan_ns_sequential(ctrl);
4294 mutex_unlock(&ctrl->scan_lock);
4302 void nvme_remove_namespaces(struct nvme_ctrl *ctrl)
4312 nvme_mpath_clear_ctrl_paths(ctrl);
4318 nvme_unquiesce_io_queues(ctrl);
4321 flush_work(&ctrl->scan_work);
4329 if (nvme_ctrl_state(ctrl) == NVME_CTRL_DEAD)
4330 nvme_mark_namespaces_dead(ctrl);
4333 nvme_change_ctrl_state(ctrl, NVME_CTRL_DELETING_NOIO);
4335 mutex_lock(&ctrl->namespaces_lock);
4336 list_splice_init_rcu(&ctrl->namespaces, &ns_list, synchronize_rcu);
4337 mutex_unlock(&ctrl->namespaces_lock);
4338 synchronize_srcu(&ctrl->srcu);
4347 const struct nvme_ctrl *ctrl =
4349 struct nvmf_ctrl_options *opts = ctrl->opts;
4352 ret = add_uevent_var(env, "NVME_TRTYPE=%s", ctrl->ops->name);
4377 static void nvme_change_uevent(struct nvme_ctrl *ctrl, char *envdata)
4381 kobject_uevent_env(&ctrl->device->kobj, KOBJ_CHANGE, envp);
4384 static void nvme_aen_uevent(struct nvme_ctrl *ctrl)
4387 u32 aen_result = ctrl->aen_result;
4389 ctrl->aen_result = 0;
4396 kobject_uevent_env(&ctrl->device->kobj, KOBJ_CHANGE, envp);
4402 struct nvme_ctrl *ctrl =
4405 nvme_aen_uevent(ctrl);
4409 * flushing ctrl async_event_work after changing the controller state
4412 if (nvme_ctrl_state(ctrl) == NVME_CTRL_LIVE)
4413 ctrl->ops->submit_async_event(ctrl);
4416 static bool nvme_ctrl_pp_status(struct nvme_ctrl *ctrl)
4421 if (ctrl->ops->reg_read32(ctrl, NVME_REG_CSTS, &csts))
4427 return ((ctrl->ctrl_config & NVME_CC_ENABLE) && (csts & NVME_CSTS_PP));
4430 static void nvme_get_fw_slot_info(struct nvme_ctrl *ctrl)
4439 if (nvme_get_log(ctrl, NVME_NSID_ALL, NVME_LOG_FW_SLOT, 0, NVME_CSI_NVM,
4441 dev_warn(ctrl->device, "Get FW SLOT INFO log error\n");
4448 dev_info(ctrl->device,
4453 memcpy(ctrl->subsys->firmware_rev, &log->frs[cur_fw_slot - 1],
4454 sizeof(ctrl->subsys->firmware_rev));
4462 struct nvme_ctrl *ctrl = container_of(work,
4466 nvme_auth_stop(ctrl);
4468 if (ctrl->mtfa)
4470 msecs_to_jiffies(ctrl->mtfa * 100);
4475 nvme_quiesce_io_queues(ctrl);
4476 while (nvme_ctrl_pp_status(ctrl)) {
4478 dev_warn(ctrl->device,
4480 nvme_try_sched_reset(ctrl);
4486 if (!nvme_change_ctrl_state(ctrl, NVME_CTRL_LIVE))
4489 nvme_unquiesce_io_queues(ctrl);
4491 nvme_get_fw_slot_info(ctrl);
4493 queue_work(nvme_wq, &ctrl->async_event_work);
4506 static bool nvme_handle_aen_notice(struct nvme_ctrl *ctrl, u32 result)
4513 set_bit(NVME_AER_NOTICE_NS_CHANGED, &ctrl->events);
4514 nvme_queue_scan(ctrl);
4522 if (nvme_change_ctrl_state(ctrl, NVME_CTRL_RESETTING)) {
4524 queue_work(nvme_wq, &ctrl->fw_act_work);
4529 if (!ctrl->ana_log_buf)
4531 queue_work(nvme_wq, &ctrl->ana_work);
4535 ctrl->aen_result = result;
4538 dev_warn(ctrl->device, "async event result %08x\n", result);
4543 static void nvme_handle_aer_persistent_error(struct nvme_ctrl *ctrl)
4545 dev_warn(ctrl->device,
4547 nvme_reset_ctrl(ctrl);
4550 void nvme_complete_async_event(struct nvme_ctrl *ctrl, __le16 status,
4561 trace_nvme_async_event(ctrl, result);
4564 requeue = nvme_handle_aen_notice(ctrl, result);
4572 nvme_handle_aer_persistent_error(ctrl);
4579 ctrl->aen_result = result;
4586 queue_work(nvme_wq, &ctrl->async_event_work);
4590 int nvme_alloc_admin_tag_set(struct nvme_ctrl *ctrl, struct blk_mq_tag_set *set,
4599 if (ctrl->ops->flags & NVME_F_FABRICS)
4602 set->numa_node = ctrl->numa_node;
4603 if (ctrl->ops->flags & NVME_F_BLOCKING)
4606 set->driver_data = ctrl;
4613 ctrl->admin_q = blk_mq_alloc_queue(set, &lim, NULL);
4614 if (IS_ERR(ctrl->admin_q)) {
4615 ret = PTR_ERR(ctrl->admin_q);
4619 if (ctrl->ops->flags & NVME_F_FABRICS) {
4620 ctrl->fabrics_q = blk_mq_alloc_queue(set, NULL, NULL);
4621 if (IS_ERR(ctrl->fabrics_q)) {
4622 ret = PTR_ERR(ctrl->fabrics_q);
4627 ctrl->admin_tagset = set;
4631 blk_mq_destroy_queue(ctrl->admin_q);
4632 blk_put_queue(ctrl->admin_q);
4635 ctrl->admin_q = NULL;
4636 ctrl->fabrics_q = NULL;
4641 void nvme_remove_admin_tag_set(struct nvme_ctrl *ctrl)
4647 nvme_stop_keep_alive(ctrl);
4648 blk_mq_destroy_queue(ctrl->admin_q);
4649 blk_put_queue(ctrl->admin_q);
4650 if (ctrl->ops->flags & NVME_F_FABRICS) {
4651 blk_mq_destroy_queue(ctrl->fabrics_q);
4652 blk_put_queue(ctrl->fabrics_q);
4654 blk_mq_free_tag_set(ctrl->admin_tagset);
4658 int nvme_alloc_io_tag_set(struct nvme_ctrl *ctrl, struct blk_mq_tag_set *set,
4666 set->queue_depth = min_t(unsigned, ctrl->sqsize, BLK_MQ_MAX_DEPTH - 1);
4671 if (ctrl->quirks & NVME_QUIRK_SHARED_TAGS)
4673 else if (ctrl->ops->flags & NVME_F_FABRICS)
4676 set->numa_node = ctrl->numa_node;
4677 if (ctrl->ops->flags & NVME_F_BLOCKING)
4680 set->driver_data = ctrl;
4681 set->nr_hw_queues = ctrl->queue_count - 1;
4688 if (ctrl->ops->flags & NVME_F_FABRICS) {
4693 ctrl->connect_q = blk_mq_alloc_queue(set, &lim, NULL);
4694 if (IS_ERR(ctrl->connect_q)) {
4695 ret = PTR_ERR(ctrl->connect_q);
4700 ctrl->tagset = set;
4705 ctrl->connect_q = NULL;
4710 void nvme_remove_io_tag_set(struct nvme_ctrl *ctrl)
4712 if (ctrl->ops->flags & NVME_F_FABRICS) {
4713 blk_mq_destroy_queue(ctrl->connect_q);
4714 blk_put_queue(ctrl->connect_q);
4716 blk_mq_free_tag_set(ctrl->tagset);
4720 void nvme_stop_ctrl(struct nvme_ctrl *ctrl)
4722 nvme_mpath_stop(ctrl);
4723 nvme_auth_stop(ctrl);
4724 nvme_stop_failfast_work(ctrl);
4725 flush_work(&ctrl->async_event_work);
4726 cancel_work_sync(&ctrl->fw_act_work);
4727 if (ctrl->ops->stop_ctrl)
4728 ctrl->ops->stop_ctrl(ctrl);
4732 void nvme_start_ctrl(struct nvme_ctrl *ctrl)
4734 nvme_enable_aen(ctrl);
4742 if (test_bit(NVME_CTRL_STARTED_ONCE, &ctrl->flags) &&
4743 nvme_discovery_ctrl(ctrl))
4744 nvme_change_uevent(ctrl, "NVME_EVENT=rediscover");
4746 if (ctrl->queue_count > 1) {
4747 nvme_queue_scan(ctrl);
4748 nvme_unquiesce_io_queues(ctrl);
4749 nvme_mpath_update(ctrl);
4752 nvme_change_uevent(ctrl, "NVME_EVENT=connected");
4753 set_bit(NVME_CTRL_STARTED_ONCE, &ctrl->flags);
4757 void nvme_uninit_ctrl(struct nvme_ctrl *ctrl)
4759 nvme_stop_keep_alive(ctrl);
4760 nvme_hwmon_exit(ctrl);
4761 nvme_fault_inject_fini(&ctrl->fault_inject);
4762 dev_pm_qos_hide_latency_tolerance(ctrl->device);
4763 cdev_device_del(&ctrl->cdev, ctrl->device);
4764 nvme_put_ctrl(ctrl);
4768 static void nvme_free_cels(struct nvme_ctrl *ctrl)
4773 xa_for_each(&ctrl->cels, i, cel) {
4774 xa_erase(&ctrl->cels, i);
4778 xa_destroy(&ctrl->cels);
4783 struct nvme_ctrl *ctrl =
4785 struct nvme_subsystem *subsys = ctrl->subsys;
4787 if (!subsys || ctrl->instance != subsys->instance)
4788 ida_free(&nvme_instance_ida, ctrl->instance);
4789 nvme_free_cels(ctrl);
4790 nvme_mpath_uninit(ctrl);
4791 cleanup_srcu_struct(&ctrl->srcu);
4792 nvme_auth_stop(ctrl);
4793 nvme_auth_free(ctrl);
4794 __free_page(ctrl->discard_page);
4795 free_opal_dev(ctrl->opal_dev);
4799 list_del(&ctrl->subsys_entry);
4800 sysfs_remove_link(&subsys->dev.kobj, dev_name(ctrl->device));
4804 ctrl->ops->free_ctrl(ctrl);
4818 int nvme_init_ctrl(struct nvme_ctrl *ctrl, struct device *dev,
4823 WRITE_ONCE(ctrl->state, NVME_CTRL_NEW);
4824 ctrl->passthru_err_log_enabled = false;
4825 clear_bit(NVME_CTRL_FAILFAST_EXPIRED, &ctrl->flags);
4826 spin_lock_init(&ctrl->lock);
4827 mutex_init(&ctrl->namespaces_lock);
4829 ret = init_srcu_struct(&ctrl->srcu);
4833 mutex_init(&ctrl->scan_lock);
4834 INIT_LIST_HEAD(&ctrl->namespaces);
4835 xa_init(&ctrl->cels);
4836 ctrl->dev = dev;
4837 ctrl->ops = ops;
4838 ctrl->quirks = quirks;
4839 ctrl->numa_node = NUMA_NO_NODE;
4840 INIT_WORK(&ctrl->scan_work, nvme_scan_work);
4841 INIT_WORK(&ctrl->async_event_work, nvme_async_event_work);
4842 INIT_WORK(&ctrl->fw_act_work, nvme_fw_act_work);
4843 INIT_WORK(&ctrl->delete_work, nvme_delete_ctrl_work);
4844 init_waitqueue_head(&ctrl->state_wq);
4846 INIT_DELAYED_WORK(&ctrl->ka_work, nvme_keep_alive_work);
4847 INIT_DELAYED_WORK(&ctrl->failfast_work, nvme_failfast_work);
4848 memset(&ctrl->ka_cmd, 0, sizeof(ctrl->ka_cmd));
4849 ctrl->ka_cmd.common.opcode = nvme_admin_keep_alive;
4850 ctrl->ka_last_check_time = jiffies;
4854 ctrl->discard_page = alloc_page(GFP_KERNEL);
4855 if (!ctrl->discard_page) {
4863 ctrl->instance = ret;
4865 ret = nvme_auth_init_ctrl(ctrl);
4869 nvme_mpath_init_ctrl(ctrl);
4871 device_initialize(&ctrl->ctrl_device);
4872 ctrl->device = &ctrl->ctrl_device;
4873 ctrl->device->devt = MKDEV(MAJOR(nvme_ctrl_base_chr_devt),
4874 ctrl->instance);
4875 ctrl->device->class = &nvme_class;
4876 ctrl->device->parent = ctrl->dev;
4878 ctrl->device->groups = ops->dev_attr_groups;
4880 ctrl->device->groups = nvme_dev_attr_groups;
4881 ctrl->device->release = nvme_free_ctrl;
4882 dev_set_drvdata(ctrl->device, ctrl);
4887 ida_free(&nvme_instance_ida, ctrl->instance);
4889 if (ctrl->discard_page)
4890 __free_page(ctrl->discard_page);
4891 cleanup_srcu_struct(&ctrl->srcu);
4898 * use nvme_uninit_ctrl() to properly free resources associated with the ctrl.
4900 int nvme_add_ctrl(struct nvme_ctrl *ctrl)
4904 ret = dev_set_name(ctrl->device, "nvme%d", ctrl->instance);
4908 cdev_init(&ctrl->cdev, &nvme_dev_fops);
4909 ctrl->cdev.owner = ctrl->ops->module;
4910 ret = cdev_device_add(&ctrl->cdev, ctrl->device);
4918 ctrl->device->power.set_latency_tolerance = nvme_set_latency_tolerance;
4919 dev_pm_qos_update_user_latency_tolerance(ctrl->device,
4922 nvme_fault_inject_init(&ctrl->fault_inject, dev_name(ctrl->device));
4923 nvme_get_ctrl(ctrl);
4930 void nvme_mark_namespaces_dead(struct nvme_ctrl *ctrl)
4935 srcu_idx = srcu_read_lock(&ctrl->srcu);
4936 list_for_each_entry_srcu(ns, &ctrl->namespaces, list,
4937 srcu_read_lock_held(&ctrl->srcu))
4939 srcu_read_unlock(&ctrl->srcu, srcu_idx);
4943 void nvme_unfreeze(struct nvme_ctrl *ctrl)
4948 srcu_idx = srcu_read_lock(&ctrl->srcu);
4949 list_for_each_entry_srcu(ns, &ctrl->namespaces, list,
4950 srcu_read_lock_held(&ctrl->srcu))
4952 srcu_read_unlock(&ctrl->srcu, srcu_idx);
4953 clear_bit(NVME_CTRL_FROZEN, &ctrl->flags);
4957 int nvme_wait_freeze_timeout(struct nvme_ctrl *ctrl, long timeout)
4962 srcu_idx = srcu_read_lock(&ctrl->srcu);
4963 list_for_each_entry_srcu(ns, &ctrl->namespaces, list,
4964 srcu_read_lock_held(&ctrl->srcu)) {
4969 srcu_read_unlock(&ctrl->srcu, srcu_idx);
4974 void nvme_wait_freeze(struct nvme_ctrl *ctrl)
4979 srcu_idx = srcu_read_lock(&ctrl->srcu);
4980 list_for_each_entry_srcu(ns, &ctrl->namespaces, list,
4981 srcu_read_lock_held(&ctrl->srcu))
4983 srcu_read_unlock(&ctrl->srcu, srcu_idx);
4987 void nvme_start_freeze(struct nvme_ctrl *ctrl)
4992 set_bit(NVME_CTRL_FROZEN, &ctrl->flags);
4993 srcu_idx = srcu_read_lock(&ctrl->srcu);
4994 list_for_each_entry_srcu(ns, &ctrl->namespaces, list,
4995 srcu_read_lock_held(&ctrl->srcu))
5002 srcu_read_unlock(&ctrl->srcu, srcu_idx);
5006 void nvme_quiesce_io_queues(struct nvme_ctrl *ctrl)
5008 if (!ctrl->tagset)
5010 if (!test_and_set_bit(NVME_CTRL_STOPPED, &ctrl->flags))
5011 blk_mq_quiesce_tagset(ctrl->tagset);
5013 blk_mq_wait_quiesce_done(ctrl->tagset);
5017 void nvme_unquiesce_io_queues(struct nvme_ctrl *ctrl)
5019 if (!ctrl->tagset)
5021 if (test_and_clear_bit(NVME_CTRL_STOPPED, &ctrl->flags))
5022 blk_mq_unquiesce_tagset(ctrl->tagset);
5026 void nvme_quiesce_admin_queue(struct nvme_ctrl *ctrl)
5028 if (!test_and_set_bit(NVME_CTRL_ADMIN_Q_STOPPED, &ctrl->flags))
5029 blk_mq_quiesce_queue(ctrl->admin_q);
5031 blk_mq_wait_quiesce_done(ctrl->admin_q->tag_set);
5035 void nvme_unquiesce_admin_queue(struct nvme_ctrl *ctrl)
5037 if (test_and_clear_bit(NVME_CTRL_ADMIN_Q_STOPPED, &ctrl->flags))
5038 blk_mq_unquiesce_queue(ctrl->admin_q);
5042 void nvme_sync_io_queues(struct nvme_ctrl *ctrl)
5047 srcu_idx = srcu_read_lock(&ctrl->srcu);
5048 list_for_each_entry_srcu(ns, &ctrl->namespaces, list,
5049 srcu_read_lock_held(&ctrl->srcu))
5051 srcu_read_unlock(&ctrl->srcu, srcu_idx);
5055 void nvme_sync_queues(struct nvme_ctrl *ctrl)
5057 nvme_sync_io_queues(ctrl);
5058 if (ctrl->admin_q)
5059 blk_sync_queue(ctrl->admin_q);