libnvdimm: write blk label set
author Dan Williams <dan.j.williams@intel.com>
Sat, 30 May 2015 16:35:36 +0000 (12:35 -0400)
committer Dan Williams <dan.j.williams@intel.com>
Thu, 25 Jun 2015 01:24:10 +0000 (21:24 -0400)
After 'uuid', 'size', 'sector_size', and optionally 'alt_name' have been
set to valid values, the labels on the dimm can be updated.  The
difference from the pmem case is that blk namespaces are limited to one
dimm and can cover discontiguous ranges in dpa space.

Also, after allocating label slots, it is useful for userspace to know
how many slots are left.  Export this information in sysfs.

Cc: Greg KH <gregkh@linuxfoundation.org>
Cc: Neil Brown <neilb@suse.de>
Acked-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Dan Williams <dan.j.williams@intel.com>
drivers/nvdimm/bus.c
drivers/nvdimm/dimm_devs.c
drivers/nvdimm/label.c
drivers/nvdimm/label.h
drivers/nvdimm/namespace_devs.c
drivers/nvdimm/nd-core.h

index fddc3f2a8f80cf9221a84b23f730dd98f65a518f..ca802702440e4f8f8f07f4a3f7cd8f75a9a61f55 100644 (file)
@@ -155,6 +155,10 @@ static void nd_async_device_unregister(void *d, async_cookie_t cookie)
 {
        struct device *dev = d;
 
+       /* flush bus operations before delete */
+       nvdimm_bus_lock(dev);
+       nvdimm_bus_unlock(dev);
+
        device_unregister(dev);
        put_device(dev);
 }
index 156d518a089c4d37c0ae522b74388033d4d5c7ad..83b179ed6d61c64e85c0f0e3d7ea0cabcd8fa270 100644 (file)
@@ -19,6 +19,7 @@
 #include <linux/fs.h>
 #include <linux/mm.h>
 #include "nd-core.h"
+#include "label.h"
 #include "nd.h"
 
 static DEFINE_IDA(dimm_ida);
@@ -296,9 +297,33 @@ static ssize_t state_show(struct device *dev, struct device_attribute *attr,
 }
 static DEVICE_ATTR_RO(state);
 
+/*
+ * sysfs 'available_slots' show handler.
+ *
+ * Prints the free label slot count reported by nd_label_nfree() minus
+ * one, so one free slot is always held back from the advertised total.
+ * The count is sampled and formatted under the nvdimm bus lock.
+ *
+ * Returns -ENXIO when the device has no driver data attached, otherwise
+ * the number of bytes written to @buf.
+ */
+static ssize_t available_slots_show(struct device *dev,
+               struct device_attribute *attr, char *buf)
+{
+       struct nvdimm_drvdata *ndd = dev_get_drvdata(dev);
+       ssize_t rc;
+       u32 nfree;
+
+       if (!ndd)
+               return -ENXIO;
+
+       nvdimm_bus_lock(dev);
+       nfree = nd_label_nfree(ndd);
+       /* unsigned wrap check: only true when nfree is already 0 */
+       if (nfree - 1 > nfree) {
+               dev_WARN_ONCE(dev, 1, "we ate our last label?\n");
+               nfree = 0;
+       } else
+               nfree--;
+       /* nfree is a u32, so format it as unsigned */
+       rc = sprintf(buf, "%u\n", nfree);
+       nvdimm_bus_unlock(dev);
+       return rc;
+}
+static DEVICE_ATTR_RO(available_slots);
+
 static struct attribute *nvdimm_attributes[] = {
        &dev_attr_state.attr,
        &dev_attr_commands.attr,
+       &dev_attr_available_slots.attr,
        NULL,
 };
 
index ffa85d7004598d2ceb3e246974702523c56e7596..34148003fc73abe48d164a2ee28ac6d8d4d91b48 100644 (file)
@@ -56,7 +56,7 @@ size_t sizeof_namespace_index(struct nvdimm_drvdata *ndd)
        return ndd->nsindex_size;
 }
 
-static int nvdimm_num_label_slots(struct nvdimm_drvdata *ndd)
+int nvdimm_num_label_slots(struct nvdimm_drvdata *ndd)
 {
        return ndd->nsarea.config_size / 129;
 }
@@ -371,7 +371,7 @@ struct nd_namespace_label *nd_label_active(struct nvdimm_drvdata *ndd, int n)
        return NULL;
 }
 
-static u32 nd_label_alloc_slot(struct nvdimm_drvdata *ndd)
+u32 nd_label_alloc_slot(struct nvdimm_drvdata *ndd)
 {
        struct nd_namespace_index *nsindex;
        unsigned long *free;
@@ -391,7 +391,7 @@ static u32 nd_label_alloc_slot(struct nvdimm_drvdata *ndd)
        return slot;
 }
 
-static bool nd_label_free_slot(struct nvdimm_drvdata *ndd, u32 slot)
+bool nd_label_free_slot(struct nvdimm_drvdata *ndd, u32 slot)
 {
        struct nd_namespace_index *nsindex;
        unsigned long *free;
@@ -416,7 +416,7 @@ u32 nd_label_nfree(struct nvdimm_drvdata *ndd)
        WARN_ON(!is_nvdimm_bus_locked(ndd->dev));
 
        if (!preamble_next(ndd, &nsindex, &free, &nslot))
-               return 0;
+               return nvdimm_num_label_slots(ndd);
 
        return bitmap_weight(free, nslot);
 }
@@ -554,22 +554,270 @@ static int __pmem_label_update(struct nd_region *nd_region,
        return 0;
 }
 
-static int init_labels(struct nd_mapping *nd_mapping)
+/*
+ * Remove the tracking entry at index @l from nd_mapping->labels.
+ *
+ * Every entry after @l is moved down one position and the vacated tail
+ * position is set to NULL, so the array stays NULL-terminated.  The slot
+ * of the removed label is only looked up for the debug message.
+ */
+static void del_label(struct nd_mapping *nd_mapping, int l)
+{
+       struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
+       struct nd_namespace_label **entry = &nd_mapping->labels[l];
+       unsigned int slot = to_slot(ndd, *entry);
+
+       dev_vdbg(ndd->dev, "%s: clear: %d\n", __func__, slot);
+
+       /* close the gap by copying each successor over its predecessor */
+       while (entry[1]) {
+               entry[0] = entry[1];
+               entry++;
+       }
+       *entry = NULL;
+}
+
+/*
+ * Report whether @res is one of the first @n pointers in @list (the
+ * caller in this file passes the namespace's previous resource list).
+ *
+ * A resource flagged DPA_RESOURCE_ADJUSTED is never reported as old,
+ * even when it is present in @list.
+ */
+static bool is_old_resource(struct resource *res, struct resource **list, int n)
 {
        int i;
+
+       if (res->flags & DPA_RESOURCE_ADJUSTED)
+               return false;
+       for (i = 0; i < n; i++)
+               if (res == list[i])
+                       return true;
+       return false;
+}
+
+/*
+ * Look up the dpa resource on @ndd that @nd_label describes.
+ *
+ * A resource matches when its start equals the label's dpa and its size
+ * equals the label's rawsize (both label fields are little-endian).
+ * Returns the first match, or NULL when no resource matches.
+ */
+static struct resource *to_resource(struct nvdimm_drvdata *ndd,
+               struct nd_namespace_label *nd_label)
+{
+       struct resource *res;
+
+       for_each_dpa_resource(ndd, res) {
+               if (res->start == __le64_to_cpu(nd_label->dpa) &&
+                   resource_size(res) == __le64_to_cpu(nd_label->rawsize))
+                       return res;
+       }
+
+       return NULL;
+}
+
+/*
+ * Write the label set for a blk namespace to the dimm behind @nd_mapping.
+ *
+ * 1/ Account all the labels that can be freed after this update
+ * 2/ Allocate and write the label to the staging (next) index
+ * 3/ Record the resources in the namespace device
+ *
+ * @num_labels is the number of entries the nd_mapping->labels tracking
+ * array can hold (excluding its NULL terminator); it is only used to
+ * sanity check the final label count.
+ *
+ * On success the previous nsblk->res array is freed and replaced.  On
+ * failure after the point of no return, the staging index is restored
+ * from the current index and nsblk->res / nsblk->num_resources are put
+ * back to their previous values.
+ *
+ * Returns 0 on success, -ENXIO if there is no usable next index or a
+ * slot could not be allocated, -ENOMEM on allocation failure, -ENOSPC
+ * if the update would consume the last free label, or the error from
+ * writing the label / index data.
+ */
+static int __blk_label_update(struct nd_region *nd_region,
+               struct nd_mapping *nd_mapping, struct nd_namespace_blk *nsblk,
+               int num_labels)
+{
+       int i, l, alloc, victims, nfree, old_num_resources, nlabel, rc = -ENXIO;
+       struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
+       struct nd_namespace_label *nd_label;
+       struct nd_namespace_index *nsindex;
+       unsigned long *free, *victim_map = NULL;
+       struct resource *res, **old_res_list;
+       struct nd_label_id label_id;
+       u8 uuid[NSLABEL_UUID_LEN];
+       u32 nslot, slot;
+
+       if (!preamble_next(ndd, &nsindex, &free, &nslot))
+               return -ENXIO;
+
+       old_res_list = nsblk->res;
+       nfree = nd_label_nfree(ndd);
+       old_num_resources = nsblk->num_resources;
+       nd_label_gen_id(&label_id, nsblk->uuid, NSLABEL_FLAG_LOCAL);
+
+       /*
+        * We need to loop over the old resources a few times, which seems a
+        * bit inefficient, but we need to know that we have the label
+        * space before we start mutating the tracking structures.
+        * Otherwise the recovery method of last resort for userspace is
+        * disable and re-enable the parent region.
+        */
+       alloc = 0;
+       for_each_dpa_resource(ndd, res) {
+               if (strcmp(res->name, label_id.id) != 0)
+                       continue;
+               if (!is_old_resource(res, old_res_list, old_num_resources))
+                       alloc++;
+       }
+
+       victims = 0;
+       if (old_num_resources) {
+               /* convert old local-label-map to dimm-slot victim-map */
+               victim_map = kcalloc(BITS_TO_LONGS(nslot), sizeof(long),
+                               GFP_KERNEL);
+               if (!victim_map)
+                       return -ENOMEM;
+
+               /* mark unused labels for garbage collection */
+               for_each_clear_bit_le(slot, free, nslot) {
+                       nd_label = nd_label_base(ndd) + slot;
+                       memcpy(uuid, nd_label->uuid, NSLABEL_UUID_LEN);
+                       if (memcmp(uuid, nsblk->uuid, NSLABEL_UUID_LEN) != 0)
+                               continue;
+                       res = to_resource(ndd, nd_label);
+                       if (res && is_old_resource(res, old_res_list,
+                                               old_num_resources))
+                               continue;
+                       slot = to_slot(ndd, nd_label);
+                       set_bit(slot, victim_map);
+                       victims++;
+               }
+       }
+
+       /* don't allow updates that consume the last label */
+       if (nfree - alloc < 0 || nfree - alloc + victims < 1) {
+               dev_info(&nsblk->dev, "insufficient label space\n");
+               kfree(victim_map);
+               return -ENOSPC;
+       }
+       /* from here on we need to abort on error */
+
+
+       /* assign all resources to the namespace before writing the labels */
+       nsblk->res = NULL;
+       nsblk->num_resources = 0;
+       for_each_dpa_resource(ndd, res) {
+               if (strcmp(res->name, label_id.id) != 0)
+                       continue;
+               if (!nsblk_add_resource(nd_region, ndd, nsblk, res->start)) {
+                       rc = -ENOMEM;
+                       goto abort;
+               }
+       }
+
+       for (i = 0; i < nsblk->num_resources; i++) {
+               size_t offset;
+
+               res = nsblk->res[i];
+               if (is_old_resource(res, old_res_list, old_num_resources))
+                       continue; /* carry-over */
+               slot = nd_label_alloc_slot(ndd);
+               if (slot == UINT_MAX) {
+                       /*
+                        * rc may still hold the result of a previous
+                        * iteration's successful write, so set the
+                        * error explicitly before unwinding
+                        */
+                       rc = -ENXIO;
+                       goto abort;
+               }
+               dev_dbg(ndd->dev, "%s: allocated: %d\n", __func__, slot);
+
+               nd_label = nd_label_base(ndd) + slot;
+               memset(nd_label, 0, sizeof(struct nd_namespace_label));
+               memcpy(nd_label->uuid, nsblk->uuid, NSLABEL_UUID_LEN);
+               if (nsblk->alt_name)
+                       memcpy(nd_label->name, nsblk->alt_name,
+                                       NSLABEL_NAME_LEN);
+               nd_label->flags = __cpu_to_le32(NSLABEL_FLAG_LOCAL);
+               nd_label->nlabel = __cpu_to_le16(0); /* N/A */
+               nd_label->position = __cpu_to_le16(0); /* N/A */
+               nd_label->isetcookie = __cpu_to_le64(0); /* N/A */
+               nd_label->dpa = __cpu_to_le64(res->start);
+               nd_label->rawsize = __cpu_to_le64(resource_size(res));
+               nd_label->lbasize = __cpu_to_le64(nsblk->lbasize);
+               nd_label->slot = __cpu_to_le32(slot);
+
+               /* update label */
+               offset = nd_label_offset(ndd, nd_label);
+               rc = nvdimm_set_config_data(ndd, offset, nd_label,
+                               sizeof(struct nd_namespace_label));
+               if (rc < 0)
+                       goto abort;
+       }
+
+       /* free up now unused slots in the new index */
+       for_each_set_bit(slot, victim_map, victim_map ? nslot : 0) {
+               dev_dbg(ndd->dev, "%s: free: %d\n", __func__, slot);
+               nd_label_free_slot(ndd, slot);
+       }
+
+       /* update index */
+       rc = nd_label_write_index(ndd, ndd->ns_next,
+                       nd_inc_seq(__le32_to_cpu(nsindex->seq)), 0);
+       if (rc)
+               goto abort;
+
+       /*
+        * Now that the on-dimm labels are up to date, fix up the tracking
+        * entries in nd_mapping->labels
+        */
+       nlabel = 0;
+       for_each_label(l, nd_label, nd_mapping->labels) {
+               nlabel++;
+               memcpy(uuid, nd_label->uuid, NSLABEL_UUID_LEN);
+               if (memcmp(uuid, nsblk->uuid, NSLABEL_UUID_LEN) != 0)
+                       continue;
+               nlabel--;
+               del_label(nd_mapping, l);
+               l--; /* retry with the new label at this index */
+       }
+       if (nlabel + nsblk->num_resources > num_labels) {
+               /*
+                * Bug, we can't end up with more resources than
+                * available labels
+                */
+               WARN_ON_ONCE(1);
+               rc = -ENXIO;
+               goto out;
+       }
+
+       /* re-add a tracking entry for every in-use label of this namespace */
+       for_each_clear_bit_le(slot, free, nslot) {
+               nd_label = nd_label_base(ndd) + slot;
+               memcpy(uuid, nd_label->uuid, NSLABEL_UUID_LEN);
+               if (memcmp(uuid, nsblk->uuid, NSLABEL_UUID_LEN) != 0)
+                       continue;
+               /*
+                * NOTE(review): to_resource() can return NULL and the
+                * result is dereferenced unchecked here - confirm every
+                * remaining label of this uuid has a matching resource.
+                */
+               res = to_resource(ndd, nd_label);
+               res->flags &= ~DPA_RESOURCE_ADJUSTED;
+               dev_vdbg(&nsblk->dev, "assign label[%d] slot: %d\n", l, slot);
+               nd_mapping->labels[l++] = nd_label;
+       }
+       nd_mapping->labels[l] = NULL;
+
+ out:
+       /* old_res_list is NULL here when arriving via the abort path */
+       kfree(old_res_list);
+       kfree(victim_map);
+       return rc;
+
+ abort:
+       /*
+        * 1/ repair the allocated label bitmap in the index
+        * 2/ restore the resource list
+        */
+       nd_label_copy(ndd, nsindex, to_current_namespace_index(ndd));
+       kfree(nsblk->res);
+       nsblk->res = old_res_list;
+       nsblk->num_resources = old_num_resources;
+       old_res_list = NULL;
+       goto out;
+}
+
+static int init_labels(struct nd_mapping *nd_mapping, int num_labels)
+{
+       int i, l, old_num_labels = 0;
        struct nd_namespace_index *nsindex;
+       struct nd_namespace_label *nd_label;
        struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
+       size_t size = (num_labels + 1) * sizeof(struct nd_namespace_label *);
 
-       if (!nd_mapping->labels)
-               nd_mapping->labels = kcalloc(2, sizeof(void *), GFP_KERNEL);
+       for_each_label(l, nd_label, nd_mapping->labels)
+               old_num_labels++;
 
+       /*
+        * We need to preserve all the old labels for the mapping so
+        * they can be garbage collected after writing the new labels.
+        */
+       if (num_labels > old_num_labels) {
+               struct nd_namespace_label **labels;
+
+               labels = krealloc(nd_mapping->labels, size, GFP_KERNEL);
+               if (!labels)
+                       return -ENOMEM;
+               nd_mapping->labels = labels;
+       }
        if (!nd_mapping->labels)
                return -ENOMEM;
 
+       for (i = old_num_labels; i <= num_labels; i++)
+               nd_mapping->labels[i] = NULL;
+
        if (ndd->ns_current == -1 || ndd->ns_next == -1)
                /* pass */;
        else
-               return 0;
+               return max(num_labels, old_num_labels);
 
        nsindex = to_namespace_index(ndd, 0);
        memset(nsindex, 0, ndd->nsarea.config_size);
@@ -582,7 +830,7 @@ static int init_labels(struct nd_mapping *nd_mapping)
        ndd->ns_next = 1;
        ndd->ns_current = 0;
 
-       return 0;
+       return max(num_labels, old_num_labels);
 }
 
 static int del_labels(struct nd_mapping *nd_mapping, u8 *uuid)
@@ -604,22 +852,15 @@ static int del_labels(struct nd_mapping *nd_mapping, u8 *uuid)
                return 0;
 
        for_each_label(l, nd_label, nd_mapping->labels) {
-               int j;
-
                memcpy(label_uuid, nd_label->uuid, NSLABEL_UUID_LEN);
                if (memcmp(label_uuid, uuid, NSLABEL_UUID_LEN) != 0)
                        continue;
                slot = to_slot(ndd, nd_label);
                nd_label_free_slot(ndd, slot);
                dev_dbg(ndd->dev, "%s: free: %d\n", __func__, slot);
-               for (j = l; nd_mapping->labels[j + 1]; j++) {
-                       struct nd_namespace_label *next_label;
-
-                       next_label = nd_mapping->labels[j + 1];
-                       nd_mapping->labels[j] = next_label;
-               }
-               nd_mapping->labels[j] = NULL;
+               del_label(nd_mapping, l);
                num_freed++;
+               l--; /* retry with new label at this index */
        }
 
        if (num_freed > l) {
@@ -652,8 +893,8 @@ int nd_pmem_namespace_label_update(struct nd_region *nd_region,
                        continue;
                }
 
-               rc = init_labels(nd_mapping);
-               if (rc)
+               rc = init_labels(nd_mapping, 1);
+               if (rc < 0)
                        return rc;
 
                rc = __pmem_label_update(nd_region, nd_mapping, nspm, i);
@@ -663,3 +904,23 @@ int nd_pmem_namespace_label_update(struct nd_region *nd_region,
 
        return 0;
 }
+
+/*
+ * Update the on-dimm labels for blk namespace @nsblk.
+ *
+ * Only the region's first mapping is used.  A @size of zero deletes all
+ * labels carrying the namespace's uuid.  Otherwise the label tracking
+ * array is sized to the number of dpa resources on the dimm before the
+ * new label set is written.
+ *
+ * Returns the result of del_labels() or __blk_label_update(), or the
+ * negative error from init_labels().
+ */
+int nd_blk_namespace_label_update(struct nd_region *nd_region,
+               struct nd_namespace_blk *nsblk, resource_size_t size)
+{
+       struct nd_mapping *nd_mapping = &nd_region->mapping[0];
+       struct resource *res;
+       int nr_res = 0;
+       int num_labels;
+
+       if (!size)
+               return del_labels(nd_mapping, nsblk->uuid);
+
+       /* every dpa resource on the dimm counts, whatever its owner */
+       for_each_dpa_resource(to_ndd(nd_mapping), res)
+               nr_res++;
+
+       num_labels = init_labels(nd_mapping, nr_res);
+       if (num_labels < 0)
+               return num_labels;
+
+       return __blk_label_update(nd_region, nd_mapping, nsblk, num_labels);
+}
index 6d376be31937862e1b6d7cd7d903f524b025df6f..a59ef6eef2a376b871b3c70e33f890c973dc7744 100644 (file)
@@ -128,9 +128,14 @@ void nd_label_copy(struct nvdimm_drvdata *ndd, struct nd_namespace_index *dst,
 size_t sizeof_namespace_index(struct nvdimm_drvdata *ndd);
 int nd_label_active_count(struct nvdimm_drvdata *ndd);
 struct nd_namespace_label *nd_label_active(struct nvdimm_drvdata *ndd, int n);
+u32 nd_label_alloc_slot(struct nvdimm_drvdata *ndd);
+bool nd_label_free_slot(struct nvdimm_drvdata *ndd, u32 slot);
 u32 nd_label_nfree(struct nvdimm_drvdata *ndd);
 struct nd_region;
 struct nd_namespace_pmem;
+struct nd_namespace_blk;
 int nd_pmem_namespace_label_update(struct nd_region *nd_region,
                struct nd_namespace_pmem *nspm, resource_size_t size);
+int nd_blk_namespace_label_update(struct nd_region *nd_region,
+               struct nd_namespace_blk *nsblk, resource_size_t size);
 #endif /* __LABEL_H__ */
index 546e77e122fd7d0ffaf22d8525f2955085636544..50b502b1908eecd7605d092230a88c016fc65f59 100644 (file)
@@ -163,8 +163,7 @@ static int nd_namespace_label_update(struct nd_region *nd_region,
         */
        if (is_namespace_pmem(dev)) {
                struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
-               struct resource *res = &nspm->nsio.res;
-               resource_size_t size = resource_size(res);
+               resource_size_t size = resource_size(&nspm->nsio.res);
 
                if (size == 0 && nspm->uuid)
                        /* delete allocation */;
@@ -173,8 +172,15 @@ static int nd_namespace_label_update(struct nd_region *nd_region,
 
                return nd_pmem_namespace_label_update(nd_region, nspm, size);
        } else if (is_namespace_blk(dev)) {
-               /* TODO: implement blk labels */
-               return 0;
+               struct nd_namespace_blk *nsblk = to_nd_namespace_blk(dev);
+               resource_size_t size = nd_namespace_blk_size(nsblk);
+
+               if (size == 0 && nsblk->uuid)
+                       /* delete allocation */;
+               else if (!nsblk->uuid || !nsblk->lbasize)
+                       return 0;
+
+               return nd_blk_namespace_label_update(nd_region, nsblk, size);
        } else
                return -ENXIO;
 }
@@ -986,6 +992,48 @@ static ssize_t sector_size_store(struct device *dev,
 }
 static DEVICE_ATTR_RW(sector_size);
 
+/*
+ * sysfs 'dpa_extents' show handler.
+ *
+ * Builds the label id for the namespace (blk namespaces use
+ * NSLABEL_FLAG_LOCAL, pmem namespaces use no flags) and counts, across
+ * every mapping of the parent region, the dpa resources whose name
+ * equals that id.  Prints 0 when the namespace has no uuid or is
+ * neither pmem nor blk.  The walk is done under the nvdimm bus lock.
+ */
+static ssize_t dpa_extents_show(struct device *dev,
+               struct device_attribute *attr, char *buf)
+{
+       struct nd_region *nd_region = to_nd_region(dev->parent);
+       struct nd_label_id label_id;
+       int nr_extents = 0;
+       u8 *uuid = NULL;
+       u32 flags = 0;
+       int m;
+
+       nvdimm_bus_lock(dev);
+       if (is_namespace_pmem(dev)) {
+               uuid = to_nd_namespace_pmem(dev)->uuid;
+       } else if (is_namespace_blk(dev)) {
+               uuid = to_nd_namespace_blk(dev)->uuid;
+               flags = NSLABEL_FLAG_LOCAL;
+       }
+
+       if (uuid) {
+               nd_label_gen_id(&label_id, uuid, flags);
+               for (m = 0; m < nd_region->ndr_mappings; m++) {
+                       struct nvdimm_drvdata *ndd;
+                       struct resource *res;
+
+                       ndd = to_ndd(&nd_region->mapping[m]);
+                       for_each_dpa_resource(ndd, res)
+                               if (strcmp(res->name, label_id.id) == 0)
+                                       nr_extents++;
+               }
+       }
+       nvdimm_bus_unlock(dev);
+
+       return sprintf(buf, "%d\n", nr_extents);
+}
+static DEVICE_ATTR_RO(dpa_extents);
+
 static struct attribute *nd_namespace_attributes[] = {
        &dev_attr_nstype.attr,
        &dev_attr_size.attr,
@@ -993,6 +1041,7 @@ static struct attribute *nd_namespace_attributes[] = {
        &dev_attr_resource.attr,
        &dev_attr_alt_name.attr,
        &dev_attr_sector_size.attr,
+       &dev_attr_dpa_extents.attr,
        NULL,
 };
 
index 22489555a6f1261ce526cf734fa581db51f5ef47..78d6c51f4bacf36aa5e9d067b6b9f730662e3062 100644 (file)
@@ -75,5 +75,6 @@ struct nd_mapping;
 struct resource *nsblk_add_resource(struct nd_region *nd_region,
                struct nvdimm_drvdata *ndd, struct nd_namespace_blk *nsblk,
                resource_size_t start);
+int nvdimm_num_label_slots(struct nvdimm_drvdata *ndd);
 void get_ndd(struct nvdimm_drvdata *ndd);
 #endif /* __ND_CORE_H__ */