17f0f1aceSKlaus Jensen /* 27f0f1aceSKlaus Jensen * QEMU NVM Express Virtual Namespace 37f0f1aceSKlaus Jensen * 47f0f1aceSKlaus Jensen * Copyright (c) 2019 CNEX Labs 57f0f1aceSKlaus Jensen * Copyright (c) 2020 Samsung Electronics 67f0f1aceSKlaus Jensen * 77f0f1aceSKlaus Jensen * Authors: 87f0f1aceSKlaus Jensen * Klaus Jensen <k.jensen@samsung.com> 97f0f1aceSKlaus Jensen * 107f0f1aceSKlaus Jensen * This work is licensed under the terms of the GNU GPL, version 2. See the 117f0f1aceSKlaus Jensen * COPYING file in the top-level directory. 127f0f1aceSKlaus Jensen * 137f0f1aceSKlaus Jensen */ 147f0f1aceSKlaus Jensen 157f0f1aceSKlaus Jensen #include "qemu/osdep.h" 167f0f1aceSKlaus Jensen #include "qemu/units.h" 177f0f1aceSKlaus Jensen #include "qemu/cutils.h" 187f0f1aceSKlaus Jensen #include "qemu/log.h" 191b5804a8SKlaus Jensen #include "qemu/error-report.h" 207f0f1aceSKlaus Jensen #include "hw/block/block.h" 217f0f1aceSKlaus Jensen #include "hw/pci/pci.h" 227f0f1aceSKlaus Jensen #include "sysemu/sysemu.h" 237f0f1aceSKlaus Jensen #include "sysemu/block-backend.h" 247f0f1aceSKlaus Jensen #include "qapi/error.h" 257f0f1aceSKlaus Jensen 267f0f1aceSKlaus Jensen #include "hw/qdev-properties.h" 277f0f1aceSKlaus Jensen #include "hw/qdev-core.h" 287f0f1aceSKlaus Jensen 29a479335bSDmitry Fomichev #include "trace.h" 307f0f1aceSKlaus Jensen #include "nvme.h" 317f0f1aceSKlaus Jensen #include "nvme-ns.h" 327f0f1aceSKlaus Jensen 332605257aSKlaus Jensen #define MIN_DISCARD_GRANULARITY (4 * KiB) 342605257aSKlaus Jensen 352605257aSKlaus Jensen static int nvme_ns_init(NvmeNamespace *ns, Error **errp) 367f0f1aceSKlaus Jensen { 372605257aSKlaus Jensen BlockDriverInfo bdi; 387f0f1aceSKlaus Jensen NvmeIdNs *id_ns = &ns->id_ns; 39bc3a65e9SKlaus Jensen int npdg, nlbas; 40*6a674bc2SMinwoo Im uint8_t ds; 41*6a674bc2SMinwoo Im uint16_t ms; 42*6a674bc2SMinwoo Im int i; 437f0f1aceSKlaus Jensen 44146f720cSKlaus Jensen ns->id_ns.dlfeat = 0x1; 457f0f1aceSKlaus Jensen 46*6a674bc2SMinwoo Im ds = 31 - clz32(ns->blkconf.logical_block_size); 47*6a674bc2SMinwoo Im ms = ns->params.ms; 487f0f1aceSKlaus Jensen 49bc3a65e9SKlaus Jensen if (ns->params.ms) { 50bc3a65e9SKlaus Jensen id_ns->mc = 0x3; 51bc3a65e9SKlaus Jensen 52bc3a65e9SKlaus Jensen if (ns->params.mset) { 53bc3a65e9SKlaus Jensen id_ns->flbas |= 0x10; 54bc3a65e9SKlaus Jensen } 55146f720cSKlaus Jensen 56146f720cSKlaus Jensen id_ns->dpc = 0x1f; 57146f720cSKlaus Jensen id_ns->dps = ((ns->params.pil & 0x1) << 3) | ns->params.pi; 58*6a674bc2SMinwoo Im 59*6a674bc2SMinwoo Im NvmeLBAF lbaf[16] = { 60*6a674bc2SMinwoo Im [0] = { .ds = 9 }, 61*6a674bc2SMinwoo Im [1] = { .ds = 9, .ms = 8 }, 62*6a674bc2SMinwoo Im [2] = { .ds = 9, .ms = 16 }, 63*6a674bc2SMinwoo Im [3] = { .ds = 9, .ms = 64 }, 64*6a674bc2SMinwoo Im [4] = { .ds = 12 }, 65*6a674bc2SMinwoo Im [5] = { .ds = 12, .ms = 8 }, 66*6a674bc2SMinwoo Im [6] = { .ds = 12, .ms = 16 }, 67*6a674bc2SMinwoo Im [7] = { .ds = 12, .ms = 64 }, 68*6a674bc2SMinwoo Im }; 69*6a674bc2SMinwoo Im 70*6a674bc2SMinwoo Im memcpy(&id_ns->lbaf, &lbaf, sizeof(lbaf)); 71*6a674bc2SMinwoo Im id_ns->nlbaf = 7; 72*6a674bc2SMinwoo Im } else { 73*6a674bc2SMinwoo Im NvmeLBAF lbaf[16] = { 74*6a674bc2SMinwoo Im [0] = { .ds = 9 }, 75*6a674bc2SMinwoo Im [1] = { .ds = 12 }, 76*6a674bc2SMinwoo Im }; 77*6a674bc2SMinwoo Im 78*6a674bc2SMinwoo Im memcpy(&id_ns->lbaf, &lbaf, sizeof(lbaf)); 79*6a674bc2SMinwoo Im id_ns->nlbaf = 1; 80bc3a65e9SKlaus Jensen } 81bc3a65e9SKlaus Jensen 82*6a674bc2SMinwoo Im for (i = 0; i <= id_ns->nlbaf; i++) { 83*6a674bc2SMinwoo Im NvmeLBAF *lbaf = &id_ns->lbaf[i]; 84*6a674bc2SMinwoo Im if (lbaf->ds == ds) { 85*6a674bc2SMinwoo Im if (lbaf->ms == ms) { 86*6a674bc2SMinwoo Im id_ns->flbas |= i; 87*6a674bc2SMinwoo Im goto lbaf_found; 88*6a674bc2SMinwoo Im } 89*6a674bc2SMinwoo Im } 90*6a674bc2SMinwoo Im } 91*6a674bc2SMinwoo Im 92*6a674bc2SMinwoo Im /* add non-standard lba format */ 93*6a674bc2SMinwoo Im id_ns->nlbaf++; 94*6a674bc2SMinwoo Im id_ns->lbaf[id_ns->nlbaf].ds = ds; 95*6a674bc2SMinwoo Im id_ns->lbaf[id_ns->nlbaf].ms = ms; 96*6a674bc2SMinwoo Im id_ns->flbas |= id_ns->nlbaf; 97*6a674bc2SMinwoo Im 98*6a674bc2SMinwoo Im lbaf_found: 99bc3a65e9SKlaus Jensen nlbas = nvme_ns_nlbas(ns); 100bc3a65e9SKlaus Jensen 101bc3a65e9SKlaus Jensen id_ns->nsze = cpu_to_le64(nlbas); 102bc3a65e9SKlaus Jensen ns->mdata_offset = nvme_l2b(ns, nlbas); 1037f0f1aceSKlaus Jensen 104141354d5SNiklas Cassel ns->csi = NVME_CSI_NVM; 105141354d5SNiklas Cassel 1067f0f1aceSKlaus Jensen /* no thin provisioning */ 1077f0f1aceSKlaus Jensen id_ns->ncap = id_ns->nsze; 1087f0f1aceSKlaus Jensen id_ns->nuse = id_ns->ncap; 10954064e51SKlaus Jensen 1102605257aSKlaus Jensen /* support DULBE and I/O optimization fields */ 1112605257aSKlaus Jensen id_ns->nsfeat |= (0x4 | 0x10); 1122605257aSKlaus Jensen 1132605257aSKlaus Jensen npdg = ns->blkconf.discard_granularity / ns->blkconf.logical_block_size; 1142605257aSKlaus Jensen 1152605257aSKlaus Jensen if (bdrv_get_info(blk_bs(ns->blkconf.blk), &bdi) >= 0 && 1162605257aSKlaus Jensen bdi.cluster_size > ns->blkconf.discard_granularity) { 1172605257aSKlaus Jensen npdg = bdi.cluster_size / ns->blkconf.logical_block_size; 1182605257aSKlaus Jensen } 1192605257aSKlaus Jensen 1202605257aSKlaus Jensen id_ns->npda = id_ns->npdg = npdg - 1; 1212605257aSKlaus Jensen 122e5707685SMinwoo Im if (nvme_ns_shared(ns)) { 123e5707685SMinwoo Im id_ns->nmic |= NVME_NMIC_NS_SHARED; 124e5707685SMinwoo Im } 125e5707685SMinwoo Im 126e4e430b3SKlaus Jensen /* simple copy */ 127e4e430b3SKlaus Jensen id_ns->mssrl = cpu_to_le16(ns->params.mssrl); 128e4e430b3SKlaus Jensen id_ns->mcl = cpu_to_le32(ns->params.mcl); 129e4e430b3SKlaus Jensen id_ns->msrc = ns->params.msrc; 130e4e430b3SKlaus Jensen 1312605257aSKlaus Jensen return 0; 1327f0f1aceSKlaus Jensen } 1337f0f1aceSKlaus Jensen 134337ccd76SMinwoo Im static int nvme_ns_init_blk(NvmeNamespace *ns, Error **errp) 1357f0f1aceSKlaus Jensen { 13686b1cf32SKevin Wolf bool read_only; 13786b1cf32SKevin Wolf 1387f0f1aceSKlaus Jensen if (!blkconf_blocksizes(&ns->blkconf, errp)) { 1397f0f1aceSKlaus Jensen return -1; 1407f0f1aceSKlaus Jensen } 1417f0f1aceSKlaus Jensen 14286b1cf32SKevin Wolf read_only = !blk_supports_write_perm(ns->blkconf.blk); 14386b1cf32SKevin Wolf if (!blkconf_apply_backend_options(&ns->blkconf, read_only, false, errp)) { 1447f0f1aceSKlaus Jensen return -1; 1457f0f1aceSKlaus Jensen } 1467f0f1aceSKlaus Jensen 1472605257aSKlaus Jensen if (ns->blkconf.discard_granularity == -1) { 1482605257aSKlaus Jensen ns->blkconf.discard_granularity = 1492605257aSKlaus Jensen MAX(ns->blkconf.logical_block_size, MIN_DISCARD_GRANULARITY); 1502605257aSKlaus Jensen } 1512605257aSKlaus Jensen 1527f0f1aceSKlaus Jensen ns->size = blk_getlength(ns->blkconf.blk); 1537f0f1aceSKlaus Jensen if (ns->size < 0) { 1547f0f1aceSKlaus Jensen error_setg_errno(errp, -ns->size, "could not get blockdev size"); 1557f0f1aceSKlaus Jensen return -1; 1567f0f1aceSKlaus Jensen } 1577f0f1aceSKlaus Jensen 1587f0f1aceSKlaus Jensen return 0; 1597f0f1aceSKlaus Jensen } 1607f0f1aceSKlaus Jensen 161a479335bSDmitry Fomichev static int nvme_ns_zoned_check_calc_geometry(NvmeNamespace *ns, Error **errp) 162a479335bSDmitry Fomichev { 163a479335bSDmitry Fomichev uint64_t zone_size, zone_cap; 164a479335bSDmitry Fomichev uint32_t lbasz = ns->blkconf.logical_block_size; 165a479335bSDmitry Fomichev 166a479335bSDmitry Fomichev /* Make sure that the values of ZNS properties are sane */ 167a479335bSDmitry Fomichev if (ns->params.zone_size_bs) { 168a479335bSDmitry Fomichev zone_size = ns->params.zone_size_bs; 169a479335bSDmitry Fomichev } else { 170a479335bSDmitry Fomichev zone_size = NVME_DEFAULT_ZONE_SIZE; 171a479335bSDmitry Fomichev } 172a479335bSDmitry Fomichev if (ns->params.zone_cap_bs) { 173a479335bSDmitry Fomichev zone_cap = ns->params.zone_cap_bs; 174a479335bSDmitry Fomichev } else { 175a479335bSDmitry Fomichev zone_cap = zone_size; 176a479335bSDmitry Fomichev } 177a479335bSDmitry Fomichev if (zone_cap > zone_size) { 178a479335bSDmitry Fomichev error_setg(errp, "zone capacity %"PRIu64"B exceeds " 179a479335bSDmitry Fomichev "zone size %"PRIu64"B", zone_cap, zone_size); 180a479335bSDmitry Fomichev return -1; 181a479335bSDmitry Fomichev } 182a479335bSDmitry Fomichev if (zone_size < lbasz) { 183a479335bSDmitry Fomichev error_setg(errp, "zone size %"PRIu64"B too small, " 184a479335bSDmitry Fomichev "must be at least %"PRIu32"B", zone_size, lbasz); 185a479335bSDmitry Fomichev return -1; 186a479335bSDmitry Fomichev } 187a479335bSDmitry Fomichev if (zone_cap < lbasz) { 188a479335bSDmitry Fomichev error_setg(errp, "zone capacity %"PRIu64"B too small, " 189a479335bSDmitry Fomichev "must be at least %"PRIu32"B", zone_cap, lbasz); 190a479335bSDmitry Fomichev return -1; 191a479335bSDmitry Fomichev } 192a479335bSDmitry Fomichev 193a479335bSDmitry Fomichev /* 194a479335bSDmitry Fomichev * Save the main zone geometry values to avoid 195a479335bSDmitry Fomichev * calculating them later again. 196a479335bSDmitry Fomichev */ 197a479335bSDmitry Fomichev ns->zone_size = zone_size / lbasz; 198a479335bSDmitry Fomichev ns->zone_capacity = zone_cap / lbasz; 199bc3a65e9SKlaus Jensen ns->num_zones = nvme_ns_nlbas(ns) / ns->zone_size; 2008d18ddcdSDmitry Fomichev 2018d18ddcdSDmitry Fomichev /* Do a few more sanity checks of ZNS properties */ 202044f1876SMinwoo Im if (!ns->num_zones) { 203044f1876SMinwoo Im error_setg(errp, 204044f1876SMinwoo Im "insufficient drive capacity, must be at least the size " 205044f1876SMinwoo Im "of one zone (%"PRIu64"B)", zone_size); 206044f1876SMinwoo Im return -1; 207044f1876SMinwoo Im } 208044f1876SMinwoo Im 2098d18ddcdSDmitry Fomichev if (ns->params.max_open_zones > ns->num_zones) { 2108d18ddcdSDmitry Fomichev error_setg(errp, 2118d18ddcdSDmitry Fomichev "max_open_zones value %u exceeds the number of zones %u", 2128d18ddcdSDmitry Fomichev ns->params.max_open_zones, ns->num_zones); 2138d18ddcdSDmitry Fomichev return -1; 2148d18ddcdSDmitry Fomichev } 2158d18ddcdSDmitry Fomichev if (ns->params.max_active_zones > ns->num_zones) { 2168d18ddcdSDmitry Fomichev error_setg(errp, 2178d18ddcdSDmitry Fomichev "max_active_zones value %u exceeds the number of zones %u", 2188d18ddcdSDmitry Fomichev ns->params.max_active_zones, ns->num_zones); 2198d18ddcdSDmitry Fomichev return -1; 2208d18ddcdSDmitry Fomichev } 2218d18ddcdSDmitry Fomichev 2229ae39004SKlaus Jensen if (ns->params.max_active_zones) { 2239ae39004SKlaus Jensen if (ns->params.max_open_zones > ns->params.max_active_zones) { 2249ae39004SKlaus Jensen error_setg(errp, "max_open_zones (%u) exceeds max_active_zones (%u)", 2259ae39004SKlaus Jensen ns->params.max_open_zones, ns->params.max_active_zones); 2269ae39004SKlaus Jensen return -1; 2279ae39004SKlaus Jensen } 2289ae39004SKlaus Jensen 2299ae39004SKlaus Jensen if (!ns->params.max_open_zones) { 2309ae39004SKlaus Jensen ns->params.max_open_zones = ns->params.max_active_zones; 2319ae39004SKlaus Jensen } 2329ae39004SKlaus Jensen } 2339ae39004SKlaus Jensen 2341a9290adSDmitry Fomichev if (ns->params.zd_extension_size) { 2351a9290adSDmitry Fomichev if (ns->params.zd_extension_size & 0x3f) { 2361a9290adSDmitry Fomichev error_setg(errp, 2371a9290adSDmitry Fomichev "zone descriptor extension size must be a multiple of 64B"); 2381a9290adSDmitry Fomichev return -1; 2391a9290adSDmitry Fomichev } 2401a9290adSDmitry Fomichev if ((ns->params.zd_extension_size >> 6) > 0xff) { 2411a9290adSDmitry Fomichev error_setg(errp, "zone descriptor extension size is too large"); 2421a9290adSDmitry Fomichev return -1; 2431a9290adSDmitry Fomichev } 2441a9290adSDmitry Fomichev } 2451a9290adSDmitry Fomichev 246a479335bSDmitry Fomichev return 0; 247a479335bSDmitry Fomichev } 248a479335bSDmitry Fomichev 249a479335bSDmitry Fomichev static void nvme_ns_zoned_init_state(NvmeNamespace *ns) 250a479335bSDmitry Fomichev { 251a479335bSDmitry Fomichev uint64_t start = 0, zone_size = ns->zone_size; 252a479335bSDmitry Fomichev uint64_t capacity = ns->num_zones * zone_size; 253a479335bSDmitry Fomichev NvmeZone *zone; 254a479335bSDmitry Fomichev int i; 255a479335bSDmitry Fomichev 256a479335bSDmitry Fomichev ns->zone_array = g_new0(NvmeZone, ns->num_zones); 2571a9290adSDmitry Fomichev if (ns->params.zd_extension_size) { 2581a9290adSDmitry Fomichev ns->zd_extensions = g_malloc0(ns->params.zd_extension_size * 2591a9290adSDmitry Fomichev ns->num_zones); 2601a9290adSDmitry Fomichev } 261a479335bSDmitry Fomichev 262a479335bSDmitry Fomichev QTAILQ_INIT(&ns->exp_open_zones); 263a479335bSDmitry Fomichev QTAILQ_INIT(&ns->imp_open_zones); 264a479335bSDmitry Fomichev QTAILQ_INIT(&ns->closed_zones); 265a479335bSDmitry Fomichev QTAILQ_INIT(&ns->full_zones); 266a479335bSDmitry Fomichev 267a479335bSDmitry Fomichev zone = ns->zone_array; 268a479335bSDmitry Fomichev for (i = 0; i < ns->num_zones; i++, zone++) { 269a479335bSDmitry Fomichev if (start + zone_size > capacity) { 270a479335bSDmitry Fomichev zone_size = capacity - start; 271a479335bSDmitry Fomichev } 272a479335bSDmitry Fomichev zone->d.zt = NVME_ZONE_TYPE_SEQ_WRITE; 273a479335bSDmitry Fomichev nvme_set_zone_state(zone, NVME_ZONE_STATE_EMPTY); 274a479335bSDmitry Fomichev zone->d.za = 0; 275a479335bSDmitry Fomichev zone->d.zcap = ns->zone_capacity; 276a479335bSDmitry Fomichev zone->d.zslba = start; 277a479335bSDmitry Fomichev zone->d.wp = start; 278a479335bSDmitry Fomichev zone->w_ptr = start; 279a479335bSDmitry Fomichev start += zone_size; 280a479335bSDmitry Fomichev } 281a479335bSDmitry Fomichev 282a479335bSDmitry Fomichev ns->zone_size_log2 = 0; 283a479335bSDmitry Fomichev if (is_power_of_2(ns->zone_size)) { 284a479335bSDmitry Fomichev ns->zone_size_log2 = 63 - clz64(ns->zone_size); 285a479335bSDmitry Fomichev } 286a479335bSDmitry Fomichev } 287a479335bSDmitry Fomichev 288*6a674bc2SMinwoo Im static void nvme_ns_init_zoned(NvmeNamespace *ns) 289a479335bSDmitry Fomichev { 290a479335bSDmitry Fomichev NvmeIdNsZoned *id_ns_z; 291*6a674bc2SMinwoo Im int i; 292a479335bSDmitry Fomichev 293a479335bSDmitry Fomichev nvme_ns_zoned_init_state(ns); 294a479335bSDmitry Fomichev 295a479335bSDmitry Fomichev id_ns_z = g_malloc0(sizeof(NvmeIdNsZoned)); 296a479335bSDmitry Fomichev 297a479335bSDmitry Fomichev /* MAR/MOR are zeroes-based, 0xffffffff means no limit */ 2988d18ddcdSDmitry Fomichev id_ns_z->mar = cpu_to_le32(ns->params.max_active_zones - 1); 2998d18ddcdSDmitry Fomichev id_ns_z->mor = cpu_to_le32(ns->params.max_open_zones - 1); 300a479335bSDmitry Fomichev id_ns_z->zoc = 0; 301a479335bSDmitry Fomichev id_ns_z->ozcs = ns->params.cross_zone_read ? 0x01 : 0x00; 302a479335bSDmitry Fomichev 303*6a674bc2SMinwoo Im for (i = 0; i <= ns->id_ns.nlbaf; i++) { 304*6a674bc2SMinwoo Im id_ns_z->lbafe[i].zsze = cpu_to_le64(ns->zone_size); 305*6a674bc2SMinwoo Im id_ns_z->lbafe[i].zdes = 3061a9290adSDmitry Fomichev ns->params.zd_extension_size >> 6; /* Units of 64B */ 307*6a674bc2SMinwoo Im } 308a479335bSDmitry Fomichev 309a479335bSDmitry Fomichev ns->csi = NVME_CSI_ZONED; 310a479335bSDmitry Fomichev ns->id_ns.nsze = cpu_to_le64(ns->num_zones * ns->zone_size); 311a479335bSDmitry Fomichev ns->id_ns.ncap = ns->id_ns.nsze; 312a479335bSDmitry Fomichev ns->id_ns.nuse = ns->id_ns.ncap; 313a479335bSDmitry Fomichev 3141b5804a8SKlaus Jensen /* 3151b5804a8SKlaus Jensen * The device uses the BDRV_BLOCK_ZERO flag to determine the "deallocated" 3161b5804a8SKlaus Jensen * status of logical blocks. Since the spec defines that logical blocks 3171b5804a8SKlaus Jensen * SHALL be deallocated when then zone is in the Empty or Offline states, 3181b5804a8SKlaus Jensen * we can only support DULBE if the zone size is a multiple of the 3191b5804a8SKlaus Jensen * calculated NPDG. 3201b5804a8SKlaus Jensen */ 3211b5804a8SKlaus Jensen if (ns->zone_size % (ns->id_ns.npdg + 1)) { 3221b5804a8SKlaus Jensen warn_report("the zone size (%"PRIu64" blocks) is not a multiple of " 3231b5804a8SKlaus Jensen "the calculated deallocation granularity (%d blocks); " 3241b5804a8SKlaus Jensen "DULBE support disabled", 3251b5804a8SKlaus Jensen ns->zone_size, ns->id_ns.npdg + 1); 3261b5804a8SKlaus Jensen 3271b5804a8SKlaus Jensen ns->id_ns.nsfeat &= ~0x4; 3281b5804a8SKlaus Jensen } 3291b5804a8SKlaus Jensen 330a479335bSDmitry Fomichev ns->id_ns_zoned = id_ns_z; 331a479335bSDmitry Fomichev } 332a479335bSDmitry Fomichev 333a479335bSDmitry Fomichev static void nvme_clear_zone(NvmeNamespace *ns, NvmeZone *zone) 334a479335bSDmitry Fomichev { 335a479335bSDmitry Fomichev uint8_t state; 336a479335bSDmitry Fomichev 337a479335bSDmitry Fomichev zone->w_ptr = zone->d.wp; 338a479335bSDmitry Fomichev state = nvme_get_zone_state(zone); 3391a9290adSDmitry Fomichev if (zone->d.wp != zone->d.zslba || 3401a9290adSDmitry Fomichev (zone->d.za & NVME_ZA_ZD_EXT_VALID)) { 341a479335bSDmitry Fomichev if (state != NVME_ZONE_STATE_CLOSED) { 342a479335bSDmitry Fomichev trace_pci_nvme_clear_ns_close(state, zone->d.zslba); 343a479335bSDmitry Fomichev nvme_set_zone_state(zone, NVME_ZONE_STATE_CLOSED); 344a479335bSDmitry Fomichev } 3458d18ddcdSDmitry Fomichev nvme_aor_inc_active(ns); 346a479335bSDmitry Fomichev QTAILQ_INSERT_HEAD(&ns->closed_zones, zone, entry); 347a479335bSDmitry Fomichev } else { 348a479335bSDmitry Fomichev trace_pci_nvme_clear_ns_reset(state, zone->d.zslba); 349a479335bSDmitry Fomichev nvme_set_zone_state(zone, NVME_ZONE_STATE_EMPTY); 350a479335bSDmitry Fomichev } 351a479335bSDmitry Fomichev } 352a479335bSDmitry Fomichev 353a479335bSDmitry Fomichev /* 354a479335bSDmitry Fomichev * Close all the zones that are currently open. 355a479335bSDmitry Fomichev */ 356a479335bSDmitry Fomichev static void nvme_zoned_ns_shutdown(NvmeNamespace *ns) 357a479335bSDmitry Fomichev { 358a479335bSDmitry Fomichev NvmeZone *zone, *next; 359a479335bSDmitry Fomichev 360a479335bSDmitry Fomichev QTAILQ_FOREACH_SAFE(zone, &ns->closed_zones, entry, next) { 361a479335bSDmitry Fomichev QTAILQ_REMOVE(&ns->closed_zones, zone, entry); 3628d18ddcdSDmitry Fomichev nvme_aor_dec_active(ns); 363a479335bSDmitry Fomichev nvme_clear_zone(ns, zone); 364a479335bSDmitry Fomichev } 365a479335bSDmitry Fomichev QTAILQ_FOREACH_SAFE(zone, &ns->imp_open_zones, entry, next) { 366a479335bSDmitry Fomichev QTAILQ_REMOVE(&ns->imp_open_zones, zone, entry); 3678d18ddcdSDmitry Fomichev nvme_aor_dec_open(ns); 3688d18ddcdSDmitry Fomichev nvme_aor_dec_active(ns); 369a479335bSDmitry Fomichev nvme_clear_zone(ns, zone); 370a479335bSDmitry Fomichev } 371a479335bSDmitry Fomichev QTAILQ_FOREACH_SAFE(zone, &ns->exp_open_zones, entry, next) { 372a479335bSDmitry Fomichev QTAILQ_REMOVE(&ns->exp_open_zones, zone, entry); 3738d18ddcdSDmitry Fomichev nvme_aor_dec_open(ns); 3748d18ddcdSDmitry Fomichev nvme_aor_dec_active(ns); 375a479335bSDmitry Fomichev nvme_clear_zone(ns, zone); 376a479335bSDmitry Fomichev } 3778d18ddcdSDmitry Fomichev 3788d18ddcdSDmitry Fomichev assert(ns->nr_open_zones == 0); 379a479335bSDmitry Fomichev } 380a479335bSDmitry Fomichev 3817f0f1aceSKlaus Jensen static int nvme_ns_check_constraints(NvmeNamespace *ns, Error **errp) 3827f0f1aceSKlaus Jensen { 3837f0f1aceSKlaus Jensen if (!ns->blkconf.blk) { 3847f0f1aceSKlaus Jensen error_setg(errp, "block backend not configured"); 3857f0f1aceSKlaus Jensen return -1; 3867f0f1aceSKlaus Jensen } 3877f0f1aceSKlaus Jensen 388146f720cSKlaus Jensen if (ns->params.pi && !ns->params.ms) { 389146f720cSKlaus Jensen error_setg(errp, "at least 8 bytes of metadata required to enable " 390146f720cSKlaus Jensen "protection information"); 391146f720cSKlaus Jensen return -1; 392146f720cSKlaus Jensen } 393146f720cSKlaus Jensen 3947f0f1aceSKlaus Jensen return 0; 3957f0f1aceSKlaus Jensen } 3967f0f1aceSKlaus Jensen 39724ec776aSMinwoo Im int nvme_ns_setup(NvmeNamespace *ns, Error **errp) 3987f0f1aceSKlaus Jensen { 3997f0f1aceSKlaus Jensen if (nvme_ns_check_constraints(ns, errp)) { 4007f0f1aceSKlaus Jensen return -1; 4017f0f1aceSKlaus Jensen } 4027f0f1aceSKlaus Jensen 403337ccd76SMinwoo Im if (nvme_ns_init_blk(ns, errp)) { 4047f0f1aceSKlaus Jensen return -1; 4057f0f1aceSKlaus Jensen } 4067f0f1aceSKlaus Jensen 4072605257aSKlaus Jensen if (nvme_ns_init(ns, errp)) { 4082605257aSKlaus Jensen return -1; 4092605257aSKlaus Jensen } 410a479335bSDmitry Fomichev if (ns->params.zoned) { 411a479335bSDmitry Fomichev if (nvme_ns_zoned_check_calc_geometry(ns, errp) != 0) { 412a479335bSDmitry Fomichev return -1; 413a479335bSDmitry Fomichev } 414*6a674bc2SMinwoo Im nvme_ns_init_zoned(ns); 415a479335bSDmitry Fomichev } 41654064e51SKlaus Jensen 4177f0f1aceSKlaus Jensen return 0; 4187f0f1aceSKlaus Jensen } 4197f0f1aceSKlaus Jensen 4207f0f1aceSKlaus Jensen void nvme_ns_drain(NvmeNamespace *ns) 4217f0f1aceSKlaus Jensen { 4227f0f1aceSKlaus Jensen blk_drain(ns->blkconf.blk); 4237f0f1aceSKlaus Jensen } 4247f0f1aceSKlaus Jensen 425ba69f224SDmitry Fomichev void nvme_ns_shutdown(NvmeNamespace *ns) 4267f0f1aceSKlaus Jensen { 4277f0f1aceSKlaus Jensen blk_flush(ns->blkconf.blk); 428a479335bSDmitry Fomichev if (ns->params.zoned) { 429a479335bSDmitry Fomichev nvme_zoned_ns_shutdown(ns); 430a479335bSDmitry Fomichev } 431a479335bSDmitry Fomichev } 432a479335bSDmitry Fomichev 433a479335bSDmitry Fomichev void nvme_ns_cleanup(NvmeNamespace *ns) 434a479335bSDmitry Fomichev { 435a479335bSDmitry Fomichev if (ns->params.zoned) { 436a479335bSDmitry Fomichev g_free(ns->id_ns_zoned); 437a479335bSDmitry Fomichev g_free(ns->zone_array); 4381a9290adSDmitry Fomichev g_free(ns->zd_extensions); 439a479335bSDmitry Fomichev } 4407f0f1aceSKlaus Jensen } 4417f0f1aceSKlaus Jensen 4427f0f1aceSKlaus Jensen static void nvme_ns_realize(DeviceState *dev, Error **errp) 4437f0f1aceSKlaus Jensen { 4447f0f1aceSKlaus Jensen NvmeNamespace *ns = NVME_NS(dev); 4457f0f1aceSKlaus Jensen BusState *s = qdev_get_parent_bus(dev); 4467f0f1aceSKlaus Jensen NvmeCtrl *n = NVME(s->parent); 4477f0f1aceSKlaus Jensen 448832a59e4SKlaus Jensen if (nvme_ns_setup(ns, errp)) { 4497f0f1aceSKlaus Jensen return; 4507f0f1aceSKlaus Jensen } 45115d024d4SMinwoo Im 452e5707685SMinwoo Im if (ns->subsys) { 453e5707685SMinwoo Im if (nvme_subsys_register_ns(ns, errp)) { 454e5707685SMinwoo Im return; 455e5707685SMinwoo Im } 456e5707685SMinwoo Im } else { 45715d024d4SMinwoo Im if (nvme_register_namespace(n, ns, errp)) { 45815d024d4SMinwoo Im return; 45915d024d4SMinwoo Im } 460e5707685SMinwoo Im } 4617f0f1aceSKlaus Jensen } 4627f0f1aceSKlaus Jensen 4637f0f1aceSKlaus Jensen static Property nvme_ns_props[] = { 4647f0f1aceSKlaus Jensen DEFINE_BLOCK_PROPERTIES(NvmeNamespace, blkconf), 465e5707685SMinwoo Im DEFINE_PROP_LINK("subsys", NvmeNamespace, subsys, TYPE_NVME_SUBSYS, 466e5707685SMinwoo Im NvmeSubsystem *), 467037953b5SMinwoo Im DEFINE_PROP_BOOL("detached", NvmeNamespace, params.detached, false), 4687f0f1aceSKlaus Jensen DEFINE_PROP_UINT32("nsid", NvmeNamespace, params.nsid, 0), 469b52f26cdSDmitry Fomichev DEFINE_PROP_UUID("uuid", NvmeNamespace, params.uuid), 470bc3a65e9SKlaus Jensen DEFINE_PROP_UINT16("ms", NvmeNamespace, params.ms, 0), 471bc3a65e9SKlaus Jensen DEFINE_PROP_UINT8("mset", NvmeNamespace, params.mset, 0), 472146f720cSKlaus Jensen DEFINE_PROP_UINT8("pi", NvmeNamespace, params.pi, 0), 473146f720cSKlaus Jensen DEFINE_PROP_UINT8("pil", NvmeNamespace, params.pil, 0), 474e4e430b3SKlaus Jensen DEFINE_PROP_UINT16("mssrl", NvmeNamespace, params.mssrl, 128), 475e4e430b3SKlaus Jensen DEFINE_PROP_UINT32("mcl", NvmeNamespace, params.mcl, 128), 476e4e430b3SKlaus Jensen DEFINE_PROP_UINT8("msrc", NvmeNamespace, params.msrc, 127), 477a479335bSDmitry Fomichev DEFINE_PROP_BOOL("zoned", NvmeNamespace, params.zoned, false), 478a479335bSDmitry Fomichev DEFINE_PROP_SIZE("zoned.zone_size", NvmeNamespace, params.zone_size_bs, 479a479335bSDmitry Fomichev NVME_DEFAULT_ZONE_SIZE), 480a479335bSDmitry Fomichev DEFINE_PROP_SIZE("zoned.zone_capacity", NvmeNamespace, params.zone_cap_bs, 481a479335bSDmitry Fomichev 0), 482a479335bSDmitry Fomichev DEFINE_PROP_BOOL("zoned.cross_read", NvmeNamespace, 483a479335bSDmitry Fomichev params.cross_zone_read, false), 4848d18ddcdSDmitry Fomichev DEFINE_PROP_UINT32("zoned.max_active", NvmeNamespace, 4858d18ddcdSDmitry Fomichev params.max_active_zones, 0), 4868d18ddcdSDmitry Fomichev DEFINE_PROP_UINT32("zoned.max_open", NvmeNamespace, 4878d18ddcdSDmitry Fomichev params.max_open_zones, 0), 4881a9290adSDmitry Fomichev DEFINE_PROP_UINT32("zoned.descr_ext_size", NvmeNamespace, 4891a9290adSDmitry Fomichev params.zd_extension_size, 0), 4907f0f1aceSKlaus Jensen DEFINE_PROP_END_OF_LIST(), 4917f0f1aceSKlaus Jensen }; 4927f0f1aceSKlaus Jensen 4937f0f1aceSKlaus Jensen static void nvme_ns_class_init(ObjectClass *oc, void *data) 4947f0f1aceSKlaus Jensen { 4957f0f1aceSKlaus Jensen DeviceClass *dc = DEVICE_CLASS(oc); 4967f0f1aceSKlaus Jensen 4977f0f1aceSKlaus Jensen set_bit(DEVICE_CATEGORY_STORAGE, dc->categories); 4987f0f1aceSKlaus Jensen 4997f0f1aceSKlaus Jensen dc->bus_type = TYPE_NVME_BUS; 5007f0f1aceSKlaus Jensen dc->realize = nvme_ns_realize; 5017f0f1aceSKlaus Jensen device_class_set_props(dc, nvme_ns_props); 5027f0f1aceSKlaus Jensen dc->desc = "Virtual NVMe namespace"; 5037f0f1aceSKlaus Jensen } 5047f0f1aceSKlaus Jensen 5057f0f1aceSKlaus Jensen static void nvme_ns_instance_init(Object *obj) 5067f0f1aceSKlaus Jensen { 5077f0f1aceSKlaus Jensen NvmeNamespace *ns = NVME_NS(obj); 5087f0f1aceSKlaus Jensen char *bootindex = g_strdup_printf("/namespace@%d,0", ns->params.nsid); 5097f0f1aceSKlaus Jensen 5107f0f1aceSKlaus Jensen device_add_bootindex_property(obj, &ns->bootindex, "bootindex", 5117f0f1aceSKlaus Jensen bootindex, DEVICE(obj)); 5127f0f1aceSKlaus Jensen 5137f0f1aceSKlaus Jensen g_free(bootindex); 5147f0f1aceSKlaus Jensen } 5157f0f1aceSKlaus Jensen 5167f0f1aceSKlaus Jensen static const TypeInfo nvme_ns_info = { 5177f0f1aceSKlaus Jensen .name = TYPE_NVME_NS, 5187f0f1aceSKlaus Jensen .parent = TYPE_DEVICE, 5197f0f1aceSKlaus Jensen .class_init = nvme_ns_class_init, 5207f0f1aceSKlaus Jensen .instance_size = sizeof(NvmeNamespace), 5217f0f1aceSKlaus Jensen .instance_init = nvme_ns_instance_init, 5227f0f1aceSKlaus Jensen }; 5237f0f1aceSKlaus Jensen 5247f0f1aceSKlaus Jensen static void nvme_ns_register_types(void) 5257f0f1aceSKlaus Jensen { 5267f0f1aceSKlaus Jensen type_register_static(&nvme_ns_info); 5277f0f1aceSKlaus Jensen } 5287f0f1aceSKlaus Jensen 5297f0f1aceSKlaus Jensen type_init(nvme_ns_register_types) 530