Merge tag 'dma-mapping-6.8-2024-01-18' of git://git.infradead.org/users/hch/dma-mapping
[linux-block.git] / drivers / nvdimm / namespace_devs.c
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * Copyright(c) 2013-2015 Intel Corporation. All rights reserved.
4  */
5 #include <linux/kstrtox.h>
6 #include <linux/module.h>
7 #include <linux/device.h>
8 #include <linux/sort.h>
9 #include <linux/slab.h>
10 #include <linux/list.h>
11 #include <linux/nd.h>
12 #include "nd-core.h"
13 #include "pmem.h"
14 #include "pfn.h"
15 #include "nd.h"
16
17 static void namespace_io_release(struct device *dev)
18 {
19         struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
20
21         kfree(nsio);
22 }
23
24 static void namespace_pmem_release(struct device *dev)
25 {
26         struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
27         struct nd_region *nd_region = to_nd_region(dev->parent);
28
29         if (nspm->id >= 0)
30                 ida_free(&nd_region->ns_ida, nspm->id);
31         kfree(nspm->alt_name);
32         kfree(nspm->uuid);
33         kfree(nspm);
34 }
35
36 static bool is_namespace_pmem(const struct device *dev);
37 static bool is_namespace_io(const struct device *dev);
38
39 static int is_uuid_busy(struct device *dev, void *data)
40 {
41         uuid_t *uuid1 = data, *uuid2 = NULL;
42
43         if (is_namespace_pmem(dev)) {
44                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
45
46                 uuid2 = nspm->uuid;
47         } else if (is_nd_btt(dev)) {
48                 struct nd_btt *nd_btt = to_nd_btt(dev);
49
50                 uuid2 = nd_btt->uuid;
51         } else if (is_nd_pfn(dev)) {
52                 struct nd_pfn *nd_pfn = to_nd_pfn(dev);
53
54                 uuid2 = nd_pfn->uuid;
55         }
56
57         if (uuid2 && uuid_equal(uuid1, uuid2))
58                 return -EBUSY;
59
60         return 0;
61 }
62
63 static int is_namespace_uuid_busy(struct device *dev, void *data)
64 {
65         if (is_nd_region(dev))
66                 return device_for_each_child(dev, data, is_uuid_busy);
67         return 0;
68 }
69
70 /**
71  * nd_is_uuid_unique - verify that no other namespace has @uuid
72  * @dev: any device on a nvdimm_bus
73  * @uuid: uuid to check
74  *
75  * Returns: %true if the uuid is unique, %false if not
76  */
77 bool nd_is_uuid_unique(struct device *dev, uuid_t *uuid)
78 {
79         struct nvdimm_bus *nvdimm_bus = walk_to_nvdimm_bus(dev);
80
81         if (!nvdimm_bus)
82                 return false;
83         WARN_ON_ONCE(!is_nvdimm_bus_locked(&nvdimm_bus->dev));
84         if (device_for_each_child(&nvdimm_bus->dev, uuid,
85                                 is_namespace_uuid_busy) != 0)
86                 return false;
87         return true;
88 }
89
90 bool pmem_should_map_pages(struct device *dev)
91 {
92         struct nd_region *nd_region = to_nd_region(dev->parent);
93         struct nd_namespace_common *ndns = to_ndns(dev);
94         struct nd_namespace_io *nsio;
95
96         if (!IS_ENABLED(CONFIG_ZONE_DEVICE))
97                 return false;
98
99         if (!test_bit(ND_REGION_PAGEMAP, &nd_region->flags))
100                 return false;
101
102         if (is_nd_pfn(dev) || is_nd_btt(dev))
103                 return false;
104
105         if (ndns->force_raw)
106                 return false;
107
108         nsio = to_nd_namespace_io(dev);
109         if (region_intersects(nsio->res.start, resource_size(&nsio->res),
110                                 IORESOURCE_SYSTEM_RAM,
111                                 IORES_DESC_NONE) == REGION_MIXED)
112                 return false;
113
114         return ARCH_MEMREMAP_PMEM == MEMREMAP_WB;
115 }
116 EXPORT_SYMBOL(pmem_should_map_pages);
117
118 unsigned int pmem_sector_size(struct nd_namespace_common *ndns)
119 {
120         if (is_namespace_pmem(&ndns->dev)) {
121                 struct nd_namespace_pmem *nspm;
122
123                 nspm = to_nd_namespace_pmem(&ndns->dev);
124                 if (nspm->lbasize == 0 || nspm->lbasize == 512)
125                         /* default */;
126                 else if (nspm->lbasize == 4096)
127                         return 4096;
128                 else
129                         dev_WARN(&ndns->dev, "unsupported sector size: %ld\n",
130                                         nspm->lbasize);
131         }
132
133         /*
134          * There is no namespace label (is_namespace_io()), or the label
135          * indicates the default sector size.
136          */
137         return 512;
138 }
139 EXPORT_SYMBOL(pmem_sector_size);
140
141 const char *nvdimm_namespace_disk_name(struct nd_namespace_common *ndns,
142                 char *name)
143 {
144         struct nd_region *nd_region = to_nd_region(ndns->dev.parent);
145         const char *suffix = NULL;
146
147         if (ndns->claim && is_nd_btt(ndns->claim))
148                 suffix = "s";
149
150         if (is_namespace_pmem(&ndns->dev) || is_namespace_io(&ndns->dev)) {
151                 int nsidx = 0;
152
153                 if (is_namespace_pmem(&ndns->dev)) {
154                         struct nd_namespace_pmem *nspm;
155
156                         nspm = to_nd_namespace_pmem(&ndns->dev);
157                         nsidx = nspm->id;
158                 }
159
160                 if (nsidx)
161                         sprintf(name, "pmem%d.%d%s", nd_region->id, nsidx,
162                                         suffix ? suffix : "");
163                 else
164                         sprintf(name, "pmem%d%s", nd_region->id,
165                                         suffix ? suffix : "");
166         } else {
167                 return NULL;
168         }
169
170         return name;
171 }
172 EXPORT_SYMBOL(nvdimm_namespace_disk_name);
173
174 const uuid_t *nd_dev_to_uuid(struct device *dev)
175 {
176         if (dev && is_namespace_pmem(dev)) {
177                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
178
179                 return nspm->uuid;
180         }
181         return &uuid_null;
182 }
183 EXPORT_SYMBOL(nd_dev_to_uuid);
184
185 static ssize_t nstype_show(struct device *dev,
186                 struct device_attribute *attr, char *buf)
187 {
188         struct nd_region *nd_region = to_nd_region(dev->parent);
189
190         return sprintf(buf, "%d\n", nd_region_to_nstype(nd_region));
191 }
192 static DEVICE_ATTR_RO(nstype);
193
194 static ssize_t __alt_name_store(struct device *dev, const char *buf,
195                 const size_t len)
196 {
197         char *input, *pos, *alt_name, **ns_altname;
198         ssize_t rc;
199
200         if (is_namespace_pmem(dev)) {
201                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
202
203                 ns_altname = &nspm->alt_name;
204         } else
205                 return -ENXIO;
206
207         if (dev->driver || to_ndns(dev)->claim)
208                 return -EBUSY;
209
210         input = kstrndup(buf, len, GFP_KERNEL);
211         if (!input)
212                 return -ENOMEM;
213
214         pos = strim(input);
215         if (strlen(pos) + 1 > NSLABEL_NAME_LEN) {
216                 rc = -EINVAL;
217                 goto out;
218         }
219
220         alt_name = kzalloc(NSLABEL_NAME_LEN, GFP_KERNEL);
221         if (!alt_name) {
222                 rc = -ENOMEM;
223                 goto out;
224         }
225         kfree(*ns_altname);
226         *ns_altname = alt_name;
227         sprintf(*ns_altname, "%s", pos);
228         rc = len;
229
230 out:
231         kfree(input);
232         return rc;
233 }
234
235 static int nd_namespace_label_update(struct nd_region *nd_region,
236                 struct device *dev)
237 {
238         dev_WARN_ONCE(dev, dev->driver || to_ndns(dev)->claim,
239                         "namespace must be idle during label update\n");
240         if (dev->driver || to_ndns(dev)->claim)
241                 return 0;
242
243         /*
244          * Only allow label writes that will result in a valid namespace
245          * or deletion of an existing namespace.
246          */
247         if (is_namespace_pmem(dev)) {
248                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
249                 resource_size_t size = resource_size(&nspm->nsio.res);
250
251                 if (size == 0 && nspm->uuid)
252                         /* delete allocation */;
253                 else if (!nspm->uuid)
254                         return 0;
255
256                 return nd_pmem_namespace_label_update(nd_region, nspm, size);
257         } else
258                 return -ENXIO;
259 }
260
261 static ssize_t alt_name_store(struct device *dev,
262                 struct device_attribute *attr, const char *buf, size_t len)
263 {
264         struct nd_region *nd_region = to_nd_region(dev->parent);
265         ssize_t rc;
266
267         device_lock(dev);
268         nvdimm_bus_lock(dev);
269         wait_nvdimm_bus_probe_idle(dev);
270         rc = __alt_name_store(dev, buf, len);
271         if (rc >= 0)
272                 rc = nd_namespace_label_update(nd_region, dev);
273         dev_dbg(dev, "%s(%zd)\n", rc < 0 ? "fail " : "", rc);
274         nvdimm_bus_unlock(dev);
275         device_unlock(dev);
276
277         return rc < 0 ? rc : len;
278 }
279
280 static ssize_t alt_name_show(struct device *dev,
281                 struct device_attribute *attr, char *buf)
282 {
283         char *ns_altname;
284
285         if (is_namespace_pmem(dev)) {
286                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
287
288                 ns_altname = nspm->alt_name;
289         } else
290                 return -ENXIO;
291
292         return sprintf(buf, "%s\n", ns_altname ? ns_altname : "");
293 }
294 static DEVICE_ATTR_RW(alt_name);
295
296 static int scan_free(struct nd_region *nd_region,
297                 struct nd_mapping *nd_mapping, struct nd_label_id *label_id,
298                 resource_size_t n)
299 {
300         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
301         int rc = 0;
302
303         while (n) {
304                 struct resource *res, *last;
305
306                 last = NULL;
307                 for_each_dpa_resource(ndd, res)
308                         if (strcmp(res->name, label_id->id) == 0)
309                                 last = res;
310                 res = last;
311                 if (!res)
312                         return 0;
313
314                 if (n >= resource_size(res)) {
315                         n -= resource_size(res);
316                         nd_dbg_dpa(nd_region, ndd, res, "delete %d\n", rc);
317                         nvdimm_free_dpa(ndd, res);
318                         /* retry with last resource deleted */
319                         continue;
320                 }
321
322                 rc = adjust_resource(res, res->start, resource_size(res) - n);
323                 if (rc == 0)
324                         res->flags |= DPA_RESOURCE_ADJUSTED;
325                 nd_dbg_dpa(nd_region, ndd, res, "shrink %d\n", rc);
326                 break;
327         }
328
329         return rc;
330 }
331
332 /**
333  * shrink_dpa_allocation - for each dimm in region free n bytes for label_id
334  * @nd_region: the set of dimms to reclaim @n bytes from
335  * @label_id: unique identifier for the namespace consuming this dpa range
336  * @n: number of bytes per-dimm to release
337  *
338  * Assumes resources are ordered.  Starting from the end try to
339  * adjust_resource() the allocation to @n, but if @n is larger than the
340  * allocation delete it and find the 'new' last allocation in the label
341  * set.
342  *
343  * Returns: %0 on success on -errno on error
344  */
345 static int shrink_dpa_allocation(struct nd_region *nd_region,
346                 struct nd_label_id *label_id, resource_size_t n)
347 {
348         int i;
349
350         for (i = 0; i < nd_region->ndr_mappings; i++) {
351                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
352                 int rc;
353
354                 rc = scan_free(nd_region, nd_mapping, label_id, n);
355                 if (rc)
356                         return rc;
357         }
358
359         return 0;
360 }
361
362 static resource_size_t init_dpa_allocation(struct nd_label_id *label_id,
363                 struct nd_region *nd_region, struct nd_mapping *nd_mapping,
364                 resource_size_t n)
365 {
366         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
367         struct resource *res;
368         int rc = 0;
369
370         /* first resource allocation for this label-id or dimm */
371         res = nvdimm_allocate_dpa(ndd, label_id, nd_mapping->start, n);
372         if (!res)
373                 rc = -EBUSY;
374
375         nd_dbg_dpa(nd_region, ndd, res, "init %d\n", rc);
376         return rc ? n : 0;
377 }
378
379
380 /**
381  * space_valid() - validate free dpa space against constraints
382  * @nd_region: hosting region of the free space
383  * @ndd: dimm device data for debug
384  * @label_id: namespace id to allocate space
385  * @prev: potential allocation that precedes free space
386  * @next: allocation that follows the given free space range
387  * @exist: first allocation with same id in the mapping
388  * @n: range that must satisfied for pmem allocations
389  * @valid: free space range to validate
390  *
391  * BLK-space is valid as long as it does not precede a PMEM
392  * allocation in a given region. PMEM-space must be contiguous
393  * and adjacent to an existing allocation (if one
394  * exists).  If reserving PMEM any space is valid.
395  */
396 static void space_valid(struct nd_region *nd_region, struct nvdimm_drvdata *ndd,
397                 struct nd_label_id *label_id, struct resource *prev,
398                 struct resource *next, struct resource *exist,
399                 resource_size_t n, struct resource *valid)
400 {
401         bool is_reserve = strcmp(label_id->id, "pmem-reserve") == 0;
402         unsigned long align;
403
404         align = nd_region->align / nd_region->ndr_mappings;
405         valid->start = ALIGN(valid->start, align);
406         valid->end = ALIGN_DOWN(valid->end + 1, align) - 1;
407
408         if (valid->start >= valid->end)
409                 goto invalid;
410
411         if (is_reserve)
412                 return;
413
414         /* allocation needs to be contiguous, so this is all or nothing */
415         if (resource_size(valid) < n)
416                 goto invalid;
417
418         /* we've got all the space we need and no existing allocation */
419         if (!exist)
420                 return;
421
422         /* allocation needs to be contiguous with the existing namespace */
423         if (valid->start == exist->end + 1
424                         || valid->end == exist->start - 1)
425                 return;
426
427  invalid:
428         /* truncate @valid size to 0 */
429         valid->end = valid->start - 1;
430 }
431
432 enum alloc_loc {
433         ALLOC_ERR = 0, ALLOC_BEFORE, ALLOC_MID, ALLOC_AFTER,
434 };
435
436 static resource_size_t scan_allocate(struct nd_region *nd_region,
437                 struct nd_mapping *nd_mapping, struct nd_label_id *label_id,
438                 resource_size_t n)
439 {
440         resource_size_t mapping_end = nd_mapping->start + nd_mapping->size - 1;
441         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
442         struct resource *res, *exist = NULL, valid;
443         const resource_size_t to_allocate = n;
444         int first;
445
446         for_each_dpa_resource(ndd, res)
447                 if (strcmp(label_id->id, res->name) == 0)
448                         exist = res;
449
450         valid.start = nd_mapping->start;
451         valid.end = mapping_end;
452         valid.name = "free space";
453  retry:
454         first = 0;
455         for_each_dpa_resource(ndd, res) {
456                 struct resource *next = res->sibling, *new_res = NULL;
457                 resource_size_t allocate, available = 0;
458                 enum alloc_loc loc = ALLOC_ERR;
459                 const char *action;
460                 int rc = 0;
461
462                 /* ignore resources outside this nd_mapping */
463                 if (res->start > mapping_end)
464                         continue;
465                 if (res->end < nd_mapping->start)
466                         continue;
467
468                 /* space at the beginning of the mapping */
469                 if (!first++ && res->start > nd_mapping->start) {
470                         valid.start = nd_mapping->start;
471                         valid.end = res->start - 1;
472                         space_valid(nd_region, ndd, label_id, NULL, next, exist,
473                                         to_allocate, &valid);
474                         available = resource_size(&valid);
475                         if (available)
476                                 loc = ALLOC_BEFORE;
477                 }
478
479                 /* space between allocations */
480                 if (!loc && next) {
481                         valid.start = res->start + resource_size(res);
482                         valid.end = min(mapping_end, next->start - 1);
483                         space_valid(nd_region, ndd, label_id, res, next, exist,
484                                         to_allocate, &valid);
485                         available = resource_size(&valid);
486                         if (available)
487                                 loc = ALLOC_MID;
488                 }
489
490                 /* space at the end of the mapping */
491                 if (!loc && !next) {
492                         valid.start = res->start + resource_size(res);
493                         valid.end = mapping_end;
494                         space_valid(nd_region, ndd, label_id, res, next, exist,
495                                         to_allocate, &valid);
496                         available = resource_size(&valid);
497                         if (available)
498                                 loc = ALLOC_AFTER;
499                 }
500
501                 if (!loc || !available)
502                         continue;
503                 allocate = min(available, n);
504                 switch (loc) {
505                 case ALLOC_BEFORE:
506                         if (strcmp(res->name, label_id->id) == 0) {
507                                 /* adjust current resource up */
508                                 rc = adjust_resource(res, res->start - allocate,
509                                                 resource_size(res) + allocate);
510                                 action = "cur grow up";
511                         } else
512                                 action = "allocate";
513                         break;
514                 case ALLOC_MID:
515                         if (strcmp(next->name, label_id->id) == 0) {
516                                 /* adjust next resource up */
517                                 rc = adjust_resource(next, next->start
518                                                 - allocate, resource_size(next)
519                                                 + allocate);
520                                 new_res = next;
521                                 action = "next grow up";
522                         } else if (strcmp(res->name, label_id->id) == 0) {
523                                 action = "grow down";
524                         } else
525                                 action = "allocate";
526                         break;
527                 case ALLOC_AFTER:
528                         if (strcmp(res->name, label_id->id) == 0)
529                                 action = "grow down";
530                         else
531                                 action = "allocate";
532                         break;
533                 default:
534                         return n;
535                 }
536
537                 if (strcmp(action, "allocate") == 0) {
538                         new_res = nvdimm_allocate_dpa(ndd, label_id,
539                                         valid.start, allocate);
540                         if (!new_res)
541                                 rc = -EBUSY;
542                 } else if (strcmp(action, "grow down") == 0) {
543                         /* adjust current resource down */
544                         rc = adjust_resource(res, res->start, resource_size(res)
545                                         + allocate);
546                         if (rc == 0)
547                                 res->flags |= DPA_RESOURCE_ADJUSTED;
548                 }
549
550                 if (!new_res)
551                         new_res = res;
552
553                 nd_dbg_dpa(nd_region, ndd, new_res, "%s(%d) %d\n",
554                                 action, loc, rc);
555
556                 if (rc)
557                         return n;
558
559                 n -= allocate;
560                 if (n) {
561                         /*
562                          * Retry scan with newly inserted resources.
563                          * For example, if we did an ALLOC_BEFORE
564                          * insertion there may also have been space
565                          * available for an ALLOC_AFTER insertion, so we
566                          * need to check this same resource again
567                          */
568                         goto retry;
569                 } else
570                         return 0;
571         }
572
573         if (n == to_allocate)
574                 return init_dpa_allocation(label_id, nd_region, nd_mapping, n);
575         return n;
576 }
577
578 static int merge_dpa(struct nd_region *nd_region,
579                 struct nd_mapping *nd_mapping, struct nd_label_id *label_id)
580 {
581         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
582         struct resource *res;
583
584         if (strncmp("pmem", label_id->id, 4) == 0)
585                 return 0;
586  retry:
587         for_each_dpa_resource(ndd, res) {
588                 int rc;
589                 struct resource *next = res->sibling;
590                 resource_size_t end = res->start + resource_size(res);
591
592                 if (!next || strcmp(res->name, label_id->id) != 0
593                                 || strcmp(next->name, label_id->id) != 0
594                                 || end != next->start)
595                         continue;
596                 end += resource_size(next);
597                 nvdimm_free_dpa(ndd, next);
598                 rc = adjust_resource(res, res->start, end - res->start);
599                 nd_dbg_dpa(nd_region, ndd, res, "merge %d\n", rc);
600                 if (rc)
601                         return rc;
602                 res->flags |= DPA_RESOURCE_ADJUSTED;
603                 goto retry;
604         }
605
606         return 0;
607 }
608
609 int __reserve_free_pmem(struct device *dev, void *data)
610 {
611         struct nvdimm *nvdimm = data;
612         struct nd_region *nd_region;
613         struct nd_label_id label_id;
614         int i;
615
616         if (!is_memory(dev))
617                 return 0;
618
619         nd_region = to_nd_region(dev);
620         if (nd_region->ndr_mappings == 0)
621                 return 0;
622
623         memset(&label_id, 0, sizeof(label_id));
624         strcat(label_id.id, "pmem-reserve");
625         for (i = 0; i < nd_region->ndr_mappings; i++) {
626                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
627                 resource_size_t n, rem = 0;
628
629                 if (nd_mapping->nvdimm != nvdimm)
630                         continue;
631
632                 n = nd_pmem_available_dpa(nd_region, nd_mapping);
633                 if (n == 0)
634                         return 0;
635                 rem = scan_allocate(nd_region, nd_mapping, &label_id, n);
636                 dev_WARN_ONCE(&nd_region->dev, rem,
637                                 "pmem reserve underrun: %#llx of %#llx bytes\n",
638                                 (unsigned long long) n - rem,
639                                 (unsigned long long) n);
640                 return rem ? -ENXIO : 0;
641         }
642
643         return 0;
644 }
645
646 void release_free_pmem(struct nvdimm_bus *nvdimm_bus,
647                 struct nd_mapping *nd_mapping)
648 {
649         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
650         struct resource *res, *_res;
651
652         for_each_dpa_resource_safe(ndd, res, _res)
653                 if (strcmp(res->name, "pmem-reserve") == 0)
654                         nvdimm_free_dpa(ndd, res);
655 }
656
657 /**
658  * grow_dpa_allocation - for each dimm allocate n bytes for @label_id
659  * @nd_region: the set of dimms to allocate @n more bytes from
660  * @label_id: unique identifier for the namespace consuming this dpa range
661  * @n: number of bytes per-dimm to add to the existing allocation
662  *
663  * Assumes resources are ordered.  For BLK regions, first consume
664  * BLK-only available DPA free space, then consume PMEM-aliased DPA
665  * space starting at the highest DPA.  For PMEM regions start
666  * allocations from the start of an interleave set and end at the first
667  * BLK allocation or the end of the interleave set, whichever comes
668  * first.
669  *
670  * Returns: %0 on success on -errno on error
671  */
672 static int grow_dpa_allocation(struct nd_region *nd_region,
673                 struct nd_label_id *label_id, resource_size_t n)
674 {
675         int i;
676
677         for (i = 0; i < nd_region->ndr_mappings; i++) {
678                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
679                 resource_size_t rem = n;
680                 int rc;
681
682                 rem = scan_allocate(nd_region, nd_mapping, label_id, rem);
683                 dev_WARN_ONCE(&nd_region->dev, rem,
684                                 "allocation underrun: %#llx of %#llx bytes\n",
685                                 (unsigned long long) n - rem,
686                                 (unsigned long long) n);
687                 if (rem)
688                         return -ENXIO;
689
690                 rc = merge_dpa(nd_region, nd_mapping, label_id);
691                 if (rc)
692                         return rc;
693         }
694
695         return 0;
696 }
697
698 static void nd_namespace_pmem_set_resource(struct nd_region *nd_region,
699                 struct nd_namespace_pmem *nspm, resource_size_t size)
700 {
701         struct resource *res = &nspm->nsio.res;
702         resource_size_t offset = 0;
703
704         if (size && !nspm->uuid) {
705                 WARN_ON_ONCE(1);
706                 size = 0;
707         }
708
709         if (size && nspm->uuid) {
710                 struct nd_mapping *nd_mapping = &nd_region->mapping[0];
711                 struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
712                 struct nd_label_id label_id;
713                 struct resource *res;
714
715                 if (!ndd) {
716                         size = 0;
717                         goto out;
718                 }
719
720                 nd_label_gen_id(&label_id, nspm->uuid, 0);
721
722                 /* calculate a spa offset from the dpa allocation offset */
723                 for_each_dpa_resource(ndd, res)
724                         if (strcmp(res->name, label_id.id) == 0) {
725                                 offset = (res->start - nd_mapping->start)
726                                         * nd_region->ndr_mappings;
727                                 goto out;
728                         }
729
730                 WARN_ON_ONCE(1);
731                 size = 0;
732         }
733
734  out:
735         res->start = nd_region->ndr_start + offset;
736         res->end = res->start + size - 1;
737 }
738
739 static bool uuid_not_set(const uuid_t *uuid, struct device *dev,
740                          const char *where)
741 {
742         if (!uuid) {
743                 dev_dbg(dev, "%s: uuid not set\n", where);
744                 return true;
745         }
746         return false;
747 }
748
749 static ssize_t __size_store(struct device *dev, unsigned long long val)
750 {
751         resource_size_t allocated = 0, available = 0;
752         struct nd_region *nd_region = to_nd_region(dev->parent);
753         struct nd_namespace_common *ndns = to_ndns(dev);
754         struct nd_mapping *nd_mapping;
755         struct nvdimm_drvdata *ndd;
756         struct nd_label_id label_id;
757         u32 flags = 0, remainder;
758         int rc, i, id = -1;
759         uuid_t *uuid = NULL;
760
761         if (dev->driver || ndns->claim)
762                 return -EBUSY;
763
764         if (is_namespace_pmem(dev)) {
765                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
766
767                 uuid = nspm->uuid;
768                 id = nspm->id;
769         }
770
771         /*
772          * We need a uuid for the allocation-label and dimm(s) on which
773          * to store the label.
774          */
775         if (uuid_not_set(uuid, dev, __func__))
776                 return -ENXIO;
777         if (nd_region->ndr_mappings == 0) {
778                 dev_dbg(dev, "not associated with dimm(s)\n");
779                 return -ENXIO;
780         }
781
782         div_u64_rem(val, nd_region->align, &remainder);
783         if (remainder) {
784                 dev_dbg(dev, "%llu is not %ldK aligned\n", val,
785                                 nd_region->align / SZ_1K);
786                 return -EINVAL;
787         }
788
789         nd_label_gen_id(&label_id, uuid, flags);
790         for (i = 0; i < nd_region->ndr_mappings; i++) {
791                 nd_mapping = &nd_region->mapping[i];
792                 ndd = to_ndd(nd_mapping);
793
794                 /*
795                  * All dimms in an interleave set, need to be enabled
796                  * for the size to be changed.
797                  */
798                 if (!ndd)
799                         return -ENXIO;
800
801                 allocated += nvdimm_allocated_dpa(ndd, &label_id);
802         }
803         available = nd_region_allocatable_dpa(nd_region);
804
805         if (val > available + allocated)
806                 return -ENOSPC;
807
808         if (val == allocated)
809                 return 0;
810
811         val = div_u64(val, nd_region->ndr_mappings);
812         allocated = div_u64(allocated, nd_region->ndr_mappings);
813         if (val < allocated)
814                 rc = shrink_dpa_allocation(nd_region, &label_id,
815                                 allocated - val);
816         else
817                 rc = grow_dpa_allocation(nd_region, &label_id, val - allocated);
818
819         if (rc)
820                 return rc;
821
822         if (is_namespace_pmem(dev)) {
823                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
824
825                 nd_namespace_pmem_set_resource(nd_region, nspm,
826                                 val * nd_region->ndr_mappings);
827         }
828
829         /*
830          * Try to delete the namespace if we deleted all of its
831          * allocation, this is not the seed or 0th device for the
832          * region, and it is not actively claimed by a btt, pfn, or dax
833          * instance.
834          */
835         if (val == 0 && id != 0 && nd_region->ns_seed != dev && !ndns->claim)
836                 nd_device_unregister(dev, ND_ASYNC);
837
838         return rc;
839 }
840
841 static ssize_t size_store(struct device *dev,
842                 struct device_attribute *attr, const char *buf, size_t len)
843 {
844         struct nd_region *nd_region = to_nd_region(dev->parent);
845         unsigned long long val;
846         int rc;
847
848         rc = kstrtoull(buf, 0, &val);
849         if (rc)
850                 return rc;
851
852         device_lock(dev);
853         nvdimm_bus_lock(dev);
854         wait_nvdimm_bus_probe_idle(dev);
855         rc = __size_store(dev, val);
856         if (rc >= 0)
857                 rc = nd_namespace_label_update(nd_region, dev);
858
859         /* setting size zero == 'delete namespace' */
860         if (rc == 0 && val == 0 && is_namespace_pmem(dev)) {
861                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
862
863                 kfree(nspm->uuid);
864                 nspm->uuid = NULL;
865         }
866
867         dev_dbg(dev, "%llx %s (%d)\n", val, rc < 0 ? "fail" : "success", rc);
868
869         nvdimm_bus_unlock(dev);
870         device_unlock(dev);
871
872         return rc < 0 ? rc : len;
873 }
874
875 resource_size_t __nvdimm_namespace_capacity(struct nd_namespace_common *ndns)
876 {
877         struct device *dev = &ndns->dev;
878
879         if (is_namespace_pmem(dev)) {
880                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
881
882                 return resource_size(&nspm->nsio.res);
883         } else if (is_namespace_io(dev)) {
884                 struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
885
886                 return resource_size(&nsio->res);
887         } else
888                 WARN_ONCE(1, "unknown namespace type\n");
889         return 0;
890 }
891
892 resource_size_t nvdimm_namespace_capacity(struct nd_namespace_common *ndns)
893 {
894         resource_size_t size;
895
896         nvdimm_bus_lock(&ndns->dev);
897         size = __nvdimm_namespace_capacity(ndns);
898         nvdimm_bus_unlock(&ndns->dev);
899
900         return size;
901 }
902 EXPORT_SYMBOL(nvdimm_namespace_capacity);
903
904 bool nvdimm_namespace_locked(struct nd_namespace_common *ndns)
905 {
906         int i;
907         bool locked = false;
908         struct device *dev = &ndns->dev;
909         struct nd_region *nd_region = to_nd_region(dev->parent);
910
911         for (i = 0; i < nd_region->ndr_mappings; i++) {
912                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
913                 struct nvdimm *nvdimm = nd_mapping->nvdimm;
914
915                 if (test_bit(NDD_LOCKED, &nvdimm->flags)) {
916                         dev_dbg(dev, "%s locked\n", nvdimm_name(nvdimm));
917                         locked = true;
918                 }
919         }
920         return locked;
921 }
922 EXPORT_SYMBOL(nvdimm_namespace_locked);
923
924 static ssize_t size_show(struct device *dev,
925                 struct device_attribute *attr, char *buf)
926 {
927         return sprintf(buf, "%llu\n", (unsigned long long)
928                         nvdimm_namespace_capacity(to_ndns(dev)));
929 }
930 static DEVICE_ATTR(size, 0444, size_show, size_store);
931
932 static uuid_t *namespace_to_uuid(struct device *dev)
933 {
934         if (is_namespace_pmem(dev)) {
935                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
936
937                 return nspm->uuid;
938         }
939         return ERR_PTR(-ENXIO);
940 }
941
942 static ssize_t uuid_show(struct device *dev, struct device_attribute *attr,
943                          char *buf)
944 {
945         uuid_t *uuid = namespace_to_uuid(dev);
946
947         if (IS_ERR(uuid))
948                 return PTR_ERR(uuid);
949         if (uuid)
950                 return sprintf(buf, "%pUb\n", uuid);
951         return sprintf(buf, "\n");
952 }
953
954 /**
955  * namespace_update_uuid - check for a unique uuid and whether we're "renaming"
956  * @nd_region: parent region so we can updates all dimms in the set
957  * @dev: namespace type for generating label_id
958  * @new_uuid: incoming uuid
959  * @old_uuid: reference to the uuid storage location in the namespace object
960  *
961  * Returns: %0 on success on -errno on error
962  */
963 static int namespace_update_uuid(struct nd_region *nd_region,
964                                  struct device *dev, uuid_t *new_uuid,
965                                  uuid_t **old_uuid)
966 {
967         struct nd_label_id old_label_id;
968         struct nd_label_id new_label_id;
969         int i;
970
971         if (!nd_is_uuid_unique(dev, new_uuid))
972                 return -EINVAL;
973
974         if (*old_uuid == NULL)
975                 goto out;
976
977         /*
978          * If we've already written a label with this uuid, then it's
979          * too late to rename because we can't reliably update the uuid
980          * without losing the old namespace.  Userspace must delete this
981          * namespace to abandon the old uuid.
982          */
983         for (i = 0; i < nd_region->ndr_mappings; i++) {
984                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
985
986                 /*
987                  * This check by itself is sufficient because old_uuid
988                  * would be NULL above if this uuid did not exist in the
989                  * currently written set.
990                  *
991                  * FIXME: can we delete uuid with zero dpa allocated?
992                  */
993                 if (list_empty(&nd_mapping->labels))
994                         return -EBUSY;
995         }
996
997         nd_label_gen_id(&old_label_id, *old_uuid, 0);
998         nd_label_gen_id(&new_label_id, new_uuid, 0);
999         for (i = 0; i < nd_region->ndr_mappings; i++) {
1000                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1001                 struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1002                 struct nd_label_ent *label_ent;
1003                 struct resource *res;
1004
1005                 for_each_dpa_resource(ndd, res)
1006                         if (strcmp(res->name, old_label_id.id) == 0)
1007                                 sprintf((void *) res->name, "%s",
1008                                                 new_label_id.id);
1009
1010                 mutex_lock(&nd_mapping->lock);
1011                 list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1012                         struct nd_namespace_label *nd_label = label_ent->label;
1013                         struct nd_label_id label_id;
1014                         uuid_t uuid;
1015
1016                         if (!nd_label)
1017                                 continue;
1018                         nsl_get_uuid(ndd, nd_label, &uuid);
1019                         nd_label_gen_id(&label_id, &uuid,
1020                                         nsl_get_flags(ndd, nd_label));
1021                         if (strcmp(old_label_id.id, label_id.id) == 0)
1022                                 set_bit(ND_LABEL_REAP, &label_ent->flags);
1023                 }
1024                 mutex_unlock(&nd_mapping->lock);
1025         }
1026         kfree(*old_uuid);
1027  out:
1028         *old_uuid = new_uuid;
1029         return 0;
1030 }
1031
1032 static ssize_t uuid_store(struct device *dev,
1033                 struct device_attribute *attr, const char *buf, size_t len)
1034 {
1035         struct nd_region *nd_region = to_nd_region(dev->parent);
1036         uuid_t *uuid = NULL;
1037         uuid_t **ns_uuid;
1038         ssize_t rc = 0;
1039
1040         if (is_namespace_pmem(dev)) {
1041                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1042
1043                 ns_uuid = &nspm->uuid;
1044         } else
1045                 return -ENXIO;
1046
1047         device_lock(dev);
1048         nvdimm_bus_lock(dev);
1049         wait_nvdimm_bus_probe_idle(dev);
1050         if (to_ndns(dev)->claim)
1051                 rc = -EBUSY;
1052         if (rc >= 0)
1053                 rc = nd_uuid_store(dev, &uuid, buf, len);
1054         if (rc >= 0)
1055                 rc = namespace_update_uuid(nd_region, dev, uuid, ns_uuid);
1056         if (rc >= 0)
1057                 rc = nd_namespace_label_update(nd_region, dev);
1058         else
1059                 kfree(uuid);
1060         dev_dbg(dev, "result: %zd wrote: %s%s", rc, buf,
1061                         buf[len - 1] == '\n' ? "" : "\n");
1062         nvdimm_bus_unlock(dev);
1063         device_unlock(dev);
1064
1065         return rc < 0 ? rc : len;
1066 }
1067 static DEVICE_ATTR_RW(uuid);
1068
1069 static ssize_t resource_show(struct device *dev,
1070                 struct device_attribute *attr, char *buf)
1071 {
1072         struct resource *res;
1073
1074         if (is_namespace_pmem(dev)) {
1075                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1076
1077                 res = &nspm->nsio.res;
1078         } else if (is_namespace_io(dev)) {
1079                 struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
1080
1081                 res = &nsio->res;
1082         } else
1083                 return -ENXIO;
1084
1085         /* no address to convey if the namespace has no allocation */
1086         if (resource_size(res) == 0)
1087                 return -ENXIO;
1088         return sprintf(buf, "%#llx\n", (unsigned long long) res->start);
1089 }
1090 static DEVICE_ATTR_ADMIN_RO(resource);
1091
1092 static const unsigned long pmem_lbasize_supported[] = { 512, 4096, 0 };
1093
1094 static ssize_t sector_size_show(struct device *dev,
1095                 struct device_attribute *attr, char *buf)
1096 {
1097         if (is_namespace_pmem(dev)) {
1098                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1099
1100                 return nd_size_select_show(nspm->lbasize,
1101                                 pmem_lbasize_supported, buf);
1102         }
1103         return -ENXIO;
1104 }
1105
1106 static ssize_t sector_size_store(struct device *dev,
1107                 struct device_attribute *attr, const char *buf, size_t len)
1108 {
1109         struct nd_region *nd_region = to_nd_region(dev->parent);
1110         const unsigned long *supported;
1111         unsigned long *lbasize;
1112         ssize_t rc = 0;
1113
1114         if (is_namespace_pmem(dev)) {
1115                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1116
1117                 lbasize = &nspm->lbasize;
1118                 supported = pmem_lbasize_supported;
1119         } else
1120                 return -ENXIO;
1121
1122         device_lock(dev);
1123         nvdimm_bus_lock(dev);
1124         if (to_ndns(dev)->claim)
1125                 rc = -EBUSY;
1126         if (rc >= 0)
1127                 rc = nd_size_select_store(dev, buf, lbasize, supported);
1128         if (rc >= 0)
1129                 rc = nd_namespace_label_update(nd_region, dev);
1130         dev_dbg(dev, "result: %zd %s: %s%s", rc, rc < 0 ? "tried" : "wrote",
1131                         buf, buf[len - 1] == '\n' ? "" : "\n");
1132         nvdimm_bus_unlock(dev);
1133         device_unlock(dev);
1134
1135         return rc ? rc : len;
1136 }
1137 static DEVICE_ATTR_RW(sector_size);
1138
1139 static ssize_t dpa_extents_show(struct device *dev,
1140                 struct device_attribute *attr, char *buf)
1141 {
1142         struct nd_region *nd_region = to_nd_region(dev->parent);
1143         struct nd_label_id label_id;
1144         uuid_t *uuid = NULL;
1145         int count = 0, i;
1146         u32 flags = 0;
1147
1148         nvdimm_bus_lock(dev);
1149         if (is_namespace_pmem(dev)) {
1150                 struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1151
1152                 uuid = nspm->uuid;
1153                 flags = 0;
1154         }
1155
1156         if (!uuid)
1157                 goto out;
1158
1159         nd_label_gen_id(&label_id, uuid, flags);
1160         for (i = 0; i < nd_region->ndr_mappings; i++) {
1161                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1162                 struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1163                 struct resource *res;
1164
1165                 for_each_dpa_resource(ndd, res)
1166                         if (strcmp(res->name, label_id.id) == 0)
1167                                 count++;
1168         }
1169  out:
1170         nvdimm_bus_unlock(dev);
1171
1172         return sprintf(buf, "%d\n", count);
1173 }
1174 static DEVICE_ATTR_RO(dpa_extents);
1175
1176 static int btt_claim_class(struct device *dev)
1177 {
1178         struct nd_region *nd_region = to_nd_region(dev->parent);
1179         int i, loop_bitmask = 0;
1180
1181         for (i = 0; i < nd_region->ndr_mappings; i++) {
1182                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1183                 struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1184                 struct nd_namespace_index *nsindex;
1185
1186                 /*
1187                  * If any of the DIMMs do not support labels the only
1188                  * possible BTT format is v1.
1189                  */
1190                 if (!ndd) {
1191                         loop_bitmask = 0;
1192                         break;
1193                 }
1194
1195                 nsindex = to_namespace_index(ndd, ndd->ns_current);
1196                 if (nsindex == NULL)
1197                         loop_bitmask |= 1;
1198                 else {
1199                         /* check whether existing labels are v1.1 or v1.2 */
1200                         if (__le16_to_cpu(nsindex->major) == 1
1201                                         && __le16_to_cpu(nsindex->minor) == 1)
1202                                 loop_bitmask |= 2;
1203                         else
1204                                 loop_bitmask |= 4;
1205                 }
1206         }
1207         /*
1208          * If nsindex is null loop_bitmask's bit 0 will be set, and if an index
1209          * block is found, a v1.1 label for any mapping will set bit 1, and a
1210          * v1.2 label will set bit 2.
1211          *
1212          * At the end of the loop, at most one of the three bits must be set.
1213          * If multiple bits were set, it means the different mappings disagree
1214          * about their labels, and this must be cleaned up first.
1215          *
1216          * If all the label index blocks are found to agree, nsindex of NULL
1217          * implies labels haven't been initialized yet, and when they will,
1218          * they will be of the 1.2 format, so we can assume BTT2.0
1219          *
1220          * If 1.1 labels are found, we enforce BTT1.1, and if 1.2 labels are
1221          * found, we enforce BTT2.0
1222          *
1223          * If the loop was never entered, default to BTT1.1 (legacy namespaces)
1224          */
1225         switch (loop_bitmask) {
1226         case 0:
1227         case 2:
1228                 return NVDIMM_CCLASS_BTT;
1229         case 1:
1230         case 4:
1231                 return NVDIMM_CCLASS_BTT2;
1232         default:
1233                 return -ENXIO;
1234         }
1235 }
1236
1237 static ssize_t holder_show(struct device *dev,
1238                 struct device_attribute *attr, char *buf)
1239 {
1240         struct nd_namespace_common *ndns = to_ndns(dev);
1241         ssize_t rc;
1242
1243         device_lock(dev);
1244         rc = sprintf(buf, "%s\n", ndns->claim ? dev_name(ndns->claim) : "");
1245         device_unlock(dev);
1246
1247         return rc;
1248 }
1249 static DEVICE_ATTR_RO(holder);
1250
1251 static int __holder_class_store(struct device *dev, const char *buf)
1252 {
1253         struct nd_namespace_common *ndns = to_ndns(dev);
1254
1255         if (dev->driver || ndns->claim)
1256                 return -EBUSY;
1257
1258         if (sysfs_streq(buf, "btt")) {
1259                 int rc = btt_claim_class(dev);
1260
1261                 if (rc < NVDIMM_CCLASS_NONE)
1262                         return rc;
1263                 ndns->claim_class = rc;
1264         } else if (sysfs_streq(buf, "pfn"))
1265                 ndns->claim_class = NVDIMM_CCLASS_PFN;
1266         else if (sysfs_streq(buf, "dax"))
1267                 ndns->claim_class = NVDIMM_CCLASS_DAX;
1268         else if (sysfs_streq(buf, ""))
1269                 ndns->claim_class = NVDIMM_CCLASS_NONE;
1270         else
1271                 return -EINVAL;
1272
1273         return 0;
1274 }
1275
1276 static ssize_t holder_class_store(struct device *dev,
1277                 struct device_attribute *attr, const char *buf, size_t len)
1278 {
1279         struct nd_region *nd_region = to_nd_region(dev->parent);
1280         int rc;
1281
1282         device_lock(dev);
1283         nvdimm_bus_lock(dev);
1284         wait_nvdimm_bus_probe_idle(dev);
1285         rc = __holder_class_store(dev, buf);
1286         if (rc >= 0)
1287                 rc = nd_namespace_label_update(nd_region, dev);
1288         dev_dbg(dev, "%s(%d)\n", rc < 0 ? "fail " : "", rc);
1289         nvdimm_bus_unlock(dev);
1290         device_unlock(dev);
1291
1292         return rc < 0 ? rc : len;
1293 }
1294
1295 static ssize_t holder_class_show(struct device *dev,
1296                 struct device_attribute *attr, char *buf)
1297 {
1298         struct nd_namespace_common *ndns = to_ndns(dev);
1299         ssize_t rc;
1300
1301         device_lock(dev);
1302         if (ndns->claim_class == NVDIMM_CCLASS_NONE)
1303                 rc = sprintf(buf, "\n");
1304         else if ((ndns->claim_class == NVDIMM_CCLASS_BTT) ||
1305                         (ndns->claim_class == NVDIMM_CCLASS_BTT2))
1306                 rc = sprintf(buf, "btt\n");
1307         else if (ndns->claim_class == NVDIMM_CCLASS_PFN)
1308                 rc = sprintf(buf, "pfn\n");
1309         else if (ndns->claim_class == NVDIMM_CCLASS_DAX)
1310                 rc = sprintf(buf, "dax\n");
1311         else
1312                 rc = sprintf(buf, "<unknown>\n");
1313         device_unlock(dev);
1314
1315         return rc;
1316 }
1317 static DEVICE_ATTR_RW(holder_class);
1318
1319 static ssize_t mode_show(struct device *dev,
1320                 struct device_attribute *attr, char *buf)
1321 {
1322         struct nd_namespace_common *ndns = to_ndns(dev);
1323         struct device *claim;
1324         char *mode;
1325         ssize_t rc;
1326
1327         device_lock(dev);
1328         claim = ndns->claim;
1329         if (claim && is_nd_btt(claim))
1330                 mode = "safe";
1331         else if (claim && is_nd_pfn(claim))
1332                 mode = "memory";
1333         else if (claim && is_nd_dax(claim))
1334                 mode = "dax";
1335         else if (!claim && pmem_should_map_pages(dev))
1336                 mode = "memory";
1337         else
1338                 mode = "raw";
1339         rc = sprintf(buf, "%s\n", mode);
1340         device_unlock(dev);
1341
1342         return rc;
1343 }
1344 static DEVICE_ATTR_RO(mode);
1345
1346 static ssize_t force_raw_store(struct device *dev,
1347                 struct device_attribute *attr, const char *buf, size_t len)
1348 {
1349         bool force_raw;
1350         int rc = kstrtobool(buf, &force_raw);
1351
1352         if (rc)
1353                 return rc;
1354
1355         to_ndns(dev)->force_raw = force_raw;
1356         return len;
1357 }
1358
1359 static ssize_t force_raw_show(struct device *dev,
1360                 struct device_attribute *attr, char *buf)
1361 {
1362         return sprintf(buf, "%d\n", to_ndns(dev)->force_raw);
1363 }
1364 static DEVICE_ATTR_RW(force_raw);
1365
1366 static struct attribute *nd_namespace_attributes[] = {
1367         &dev_attr_nstype.attr,
1368         &dev_attr_size.attr,
1369         &dev_attr_mode.attr,
1370         &dev_attr_uuid.attr,
1371         &dev_attr_holder.attr,
1372         &dev_attr_resource.attr,
1373         &dev_attr_alt_name.attr,
1374         &dev_attr_force_raw.attr,
1375         &dev_attr_sector_size.attr,
1376         &dev_attr_dpa_extents.attr,
1377         &dev_attr_holder_class.attr,
1378         NULL,
1379 };
1380
1381 static umode_t namespace_visible(struct kobject *kobj,
1382                 struct attribute *a, int n)
1383 {
1384         struct device *dev = container_of(kobj, struct device, kobj);
1385
1386         if (is_namespace_pmem(dev)) {
1387                 if (a == &dev_attr_size.attr)
1388                         return 0644;
1389
1390                 return a->mode;
1391         }
1392
1393         /* base is_namespace_io() attributes */
1394         if (a == &dev_attr_nstype.attr || a == &dev_attr_size.attr ||
1395             a == &dev_attr_holder.attr || a == &dev_attr_holder_class.attr ||
1396             a == &dev_attr_force_raw.attr || a == &dev_attr_mode.attr ||
1397             a == &dev_attr_resource.attr)
1398                 return a->mode;
1399
1400         return 0;
1401 }
1402
1403 static struct attribute_group nd_namespace_attribute_group = {
1404         .attrs = nd_namespace_attributes,
1405         .is_visible = namespace_visible,
1406 };
1407
1408 static const struct attribute_group *nd_namespace_attribute_groups[] = {
1409         &nd_device_attribute_group,
1410         &nd_namespace_attribute_group,
1411         &nd_numa_attribute_group,
1412         NULL,
1413 };
1414
1415 static const struct device_type namespace_io_device_type = {
1416         .name = "nd_namespace_io",
1417         .release = namespace_io_release,
1418         .groups = nd_namespace_attribute_groups,
1419 };
1420
1421 static const struct device_type namespace_pmem_device_type = {
1422         .name = "nd_namespace_pmem",
1423         .release = namespace_pmem_release,
1424         .groups = nd_namespace_attribute_groups,
1425 };
1426
1427 static bool is_namespace_pmem(const struct device *dev)
1428 {
1429         return dev ? dev->type == &namespace_pmem_device_type : false;
1430 }
1431
1432 static bool is_namespace_io(const struct device *dev)
1433 {
1434         return dev ? dev->type == &namespace_io_device_type : false;
1435 }
1436
1437 struct nd_namespace_common *nvdimm_namespace_common_probe(struct device *dev)
1438 {
1439         struct nd_btt *nd_btt = is_nd_btt(dev) ? to_nd_btt(dev) : NULL;
1440         struct nd_pfn *nd_pfn = is_nd_pfn(dev) ? to_nd_pfn(dev) : NULL;
1441         struct nd_dax *nd_dax = is_nd_dax(dev) ? to_nd_dax(dev) : NULL;
1442         struct nd_namespace_common *ndns = NULL;
1443         resource_size_t size;
1444
1445         if (nd_btt || nd_pfn || nd_dax) {
1446                 if (nd_btt)
1447                         ndns = nd_btt->ndns;
1448                 else if (nd_pfn)
1449                         ndns = nd_pfn->ndns;
1450                 else if (nd_dax)
1451                         ndns = nd_dax->nd_pfn.ndns;
1452
1453                 if (!ndns)
1454                         return ERR_PTR(-ENODEV);
1455
1456                 /*
1457                  * Flush any in-progess probes / removals in the driver
1458                  * for the raw personality of this namespace.
1459                  */
1460                 device_lock(&ndns->dev);
1461                 device_unlock(&ndns->dev);
1462                 if (ndns->dev.driver) {
1463                         dev_dbg(&ndns->dev, "is active, can't bind %s\n",
1464                                         dev_name(dev));
1465                         return ERR_PTR(-EBUSY);
1466                 }
1467                 if (dev_WARN_ONCE(&ndns->dev, ndns->claim != dev,
1468                                         "host (%s) vs claim (%s) mismatch\n",
1469                                         dev_name(dev),
1470                                         dev_name(ndns->claim)))
1471                         return ERR_PTR(-ENXIO);
1472         } else {
1473                 ndns = to_ndns(dev);
1474                 if (ndns->claim) {
1475                         dev_dbg(dev, "claimed by %s, failing probe\n",
1476                                 dev_name(ndns->claim));
1477
1478                         return ERR_PTR(-ENXIO);
1479                 }
1480         }
1481
1482         if (nvdimm_namespace_locked(ndns))
1483                 return ERR_PTR(-EACCES);
1484
1485         size = nvdimm_namespace_capacity(ndns);
1486         if (size < ND_MIN_NAMESPACE_SIZE) {
1487                 dev_dbg(&ndns->dev, "%pa, too small must be at least %#x\n",
1488                                 &size, ND_MIN_NAMESPACE_SIZE);
1489                 return ERR_PTR(-ENODEV);
1490         }
1491
1492         /*
1493          * Note, alignment validation for fsdax and devdax mode
1494          * namespaces happens in nd_pfn_validate() where infoblock
1495          * padding parameters can be applied.
1496          */
1497         if (pmem_should_map_pages(dev)) {
1498                 struct nd_namespace_io *nsio = to_nd_namespace_io(&ndns->dev);
1499                 struct resource *res = &nsio->res;
1500
1501                 if (!IS_ALIGNED(res->start | (res->end + 1),
1502                                         memremap_compat_align())) {
1503                         dev_err(&ndns->dev, "%pr misaligned, unable to map\n", res);
1504                         return ERR_PTR(-EOPNOTSUPP);
1505                 }
1506         }
1507
1508         if (is_namespace_pmem(&ndns->dev)) {
1509                 struct nd_namespace_pmem *nspm;
1510
1511                 nspm = to_nd_namespace_pmem(&ndns->dev);
1512                 if (uuid_not_set(nspm->uuid, &ndns->dev, __func__))
1513                         return ERR_PTR(-ENODEV);
1514         }
1515
1516         return ndns;
1517 }
1518 EXPORT_SYMBOL(nvdimm_namespace_common_probe);
1519
1520 int devm_namespace_enable(struct device *dev, struct nd_namespace_common *ndns,
1521                 resource_size_t size)
1522 {
1523         return devm_nsio_enable(dev, to_nd_namespace_io(&ndns->dev), size);
1524 }
1525 EXPORT_SYMBOL_GPL(devm_namespace_enable);
1526
1527 void devm_namespace_disable(struct device *dev, struct nd_namespace_common *ndns)
1528 {
1529         devm_nsio_disable(dev, to_nd_namespace_io(&ndns->dev));
1530 }
1531 EXPORT_SYMBOL_GPL(devm_namespace_disable);
1532
1533 static struct device **create_namespace_io(struct nd_region *nd_region)
1534 {
1535         struct nd_namespace_io *nsio;
1536         struct device *dev, **devs;
1537         struct resource *res;
1538
1539         nsio = kzalloc(sizeof(*nsio), GFP_KERNEL);
1540         if (!nsio)
1541                 return NULL;
1542
1543         devs = kcalloc(2, sizeof(struct device *), GFP_KERNEL);
1544         if (!devs) {
1545                 kfree(nsio);
1546                 return NULL;
1547         }
1548
1549         dev = &nsio->common.dev;
1550         dev->type = &namespace_io_device_type;
1551         dev->parent = &nd_region->dev;
1552         res = &nsio->res;
1553         res->name = dev_name(&nd_region->dev);
1554         res->flags = IORESOURCE_MEM;
1555         res->start = nd_region->ndr_start;
1556         res->end = res->start + nd_region->ndr_size - 1;
1557
1558         devs[0] = dev;
1559         return devs;
1560 }
1561
1562 static bool has_uuid_at_pos(struct nd_region *nd_region, const uuid_t *uuid,
1563                             u64 cookie, u16 pos)
1564 {
1565         struct nd_namespace_label *found = NULL;
1566         int i;
1567
1568         for (i = 0; i < nd_region->ndr_mappings; i++) {
1569                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1570                 struct nd_interleave_set *nd_set = nd_region->nd_set;
1571                 struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1572                 struct nd_label_ent *label_ent;
1573                 bool found_uuid = false;
1574
1575                 list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1576                         struct nd_namespace_label *nd_label = label_ent->label;
1577                         u16 position;
1578
1579                         if (!nd_label)
1580                                 continue;
1581                         position = nsl_get_position(ndd, nd_label);
1582
1583                         if (!nsl_validate_isetcookie(ndd, nd_label, cookie))
1584                                 continue;
1585
1586                         if (!nsl_uuid_equal(ndd, nd_label, uuid))
1587                                 continue;
1588
1589                         if (!nsl_validate_type_guid(ndd, nd_label,
1590                                                     &nd_set->type_guid))
1591                                 continue;
1592
1593                         if (found_uuid) {
1594                                 dev_dbg(ndd->dev, "duplicate entry for uuid\n");
1595                                 return false;
1596                         }
1597                         found_uuid = true;
1598                         if (!nsl_validate_nlabel(nd_region, ndd, nd_label))
1599                                 continue;
1600                         if (position != pos)
1601                                 continue;
1602                         found = nd_label;
1603                         break;
1604                 }
1605                 if (found)
1606                         break;
1607         }
1608         return found != NULL;
1609 }
1610
1611 static int select_pmem_id(struct nd_region *nd_region, const uuid_t *pmem_id)
1612 {
1613         int i;
1614
1615         if (!pmem_id)
1616                 return -ENODEV;
1617
1618         for (i = 0; i < nd_region->ndr_mappings; i++) {
1619                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1620                 struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1621                 struct nd_namespace_label *nd_label = NULL;
1622                 u64 hw_start, hw_end, pmem_start, pmem_end;
1623                 struct nd_label_ent *label_ent;
1624
1625                 lockdep_assert_held(&nd_mapping->lock);
1626                 list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1627                         nd_label = label_ent->label;
1628                         if (!nd_label)
1629                                 continue;
1630                         if (nsl_uuid_equal(ndd, nd_label, pmem_id))
1631                                 break;
1632                         nd_label = NULL;
1633                 }
1634
1635                 if (!nd_label) {
1636                         WARN_ON(1);
1637                         return -EINVAL;
1638                 }
1639
1640                 /*
1641                  * Check that this label is compliant with the dpa
1642                  * range published in NFIT
1643                  */
1644                 hw_start = nd_mapping->start;
1645                 hw_end = hw_start + nd_mapping->size;
1646                 pmem_start = nsl_get_dpa(ndd, nd_label);
1647                 pmem_end = pmem_start + nsl_get_rawsize(ndd, nd_label);
1648                 if (pmem_start >= hw_start && pmem_start < hw_end
1649                                 && pmem_end <= hw_end && pmem_end > hw_start)
1650                         /* pass */;
1651                 else {
1652                         dev_dbg(&nd_region->dev, "%s invalid label for %pUb\n",
1653                                 dev_name(ndd->dev),
1654                                 nsl_uuid_raw(ndd, nd_label));
1655                         return -EINVAL;
1656                 }
1657
1658                 /* move recently validated label to the front of the list */
1659                 list_move(&label_ent->list, &nd_mapping->labels);
1660         }
1661         return 0;
1662 }
1663
1664 /**
1665  * create_namespace_pmem - validate interleave set labelling, retrieve label0
1666  * @nd_region: region with mappings to validate
1667  * @nd_mapping: container of dpa-resource-root + labels
1668  * @nd_label: target pmem namespace label to evaluate
1669  *
1670  * Returns: the created &struct device on success or ERR_PTR(-errno) on error
1671  */
1672 static struct device *create_namespace_pmem(struct nd_region *nd_region,
1673                                             struct nd_mapping *nd_mapping,
1674                                             struct nd_namespace_label *nd_label)
1675 {
1676         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1677         struct nd_namespace_index *nsindex =
1678                 to_namespace_index(ndd, ndd->ns_current);
1679         u64 cookie = nd_region_interleave_set_cookie(nd_region, nsindex);
1680         u64 altcookie = nd_region_interleave_set_altcookie(nd_region);
1681         struct nd_label_ent *label_ent;
1682         struct nd_namespace_pmem *nspm;
1683         resource_size_t size = 0;
1684         struct resource *res;
1685         struct device *dev;
1686         uuid_t uuid;
1687         int rc = 0;
1688         u16 i;
1689
1690         if (cookie == 0) {
1691                 dev_dbg(&nd_region->dev, "invalid interleave-set-cookie\n");
1692                 return ERR_PTR(-ENXIO);
1693         }
1694
1695         if (!nsl_validate_isetcookie(ndd, nd_label, cookie)) {
1696                 dev_dbg(&nd_region->dev, "invalid cookie in label: %pUb\n",
1697                         nsl_uuid_raw(ndd, nd_label));
1698                 if (!nsl_validate_isetcookie(ndd, nd_label, altcookie))
1699                         return ERR_PTR(-EAGAIN);
1700
1701                 dev_dbg(&nd_region->dev, "valid altcookie in label: %pUb\n",
1702                         nsl_uuid_raw(ndd, nd_label));
1703         }
1704
1705         nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
1706         if (!nspm)
1707                 return ERR_PTR(-ENOMEM);
1708
1709         nspm->id = -1;
1710         dev = &nspm->nsio.common.dev;
1711         dev->type = &namespace_pmem_device_type;
1712         dev->parent = &nd_region->dev;
1713         res = &nspm->nsio.res;
1714         res->name = dev_name(&nd_region->dev);
1715         res->flags = IORESOURCE_MEM;
1716
1717         for (i = 0; i < nd_region->ndr_mappings; i++) {
1718                 nsl_get_uuid(ndd, nd_label, &uuid);
1719                 if (has_uuid_at_pos(nd_region, &uuid, cookie, i))
1720                         continue;
1721                 if (has_uuid_at_pos(nd_region, &uuid, altcookie, i))
1722                         continue;
1723                 break;
1724         }
1725
1726         if (i < nd_region->ndr_mappings) {
1727                 struct nvdimm *nvdimm = nd_region->mapping[i].nvdimm;
1728
1729                 /*
1730                  * Give up if we don't find an instance of a uuid at each
1731                  * position (from 0 to nd_region->ndr_mappings - 1), or if we
1732                  * find a dimm with two instances of the same uuid.
1733                  */
1734                 dev_err(&nd_region->dev, "%s missing label for %pUb\n",
1735                         nvdimm_name(nvdimm), nsl_uuid_raw(ndd, nd_label));
1736                 rc = -EINVAL;
1737                 goto err;
1738         }
1739
1740         /*
1741          * Fix up each mapping's 'labels' to have the validated pmem label for
1742          * that position at labels[0], and NULL at labels[1].  In the process,
1743          * check that the namespace aligns with interleave-set.
1744          */
1745         nsl_get_uuid(ndd, nd_label, &uuid);
1746         rc = select_pmem_id(nd_region, &uuid);
1747         if (rc)
1748                 goto err;
1749
1750         /* Calculate total size and populate namespace properties from label0 */
1751         for (i = 0; i < nd_region->ndr_mappings; i++) {
1752                 struct nd_namespace_label *label0;
1753                 struct nvdimm_drvdata *ndd;
1754
1755                 nd_mapping = &nd_region->mapping[i];
1756                 label_ent = list_first_entry_or_null(&nd_mapping->labels,
1757                                 typeof(*label_ent), list);
1758                 label0 = label_ent ? label_ent->label : NULL;
1759
1760                 if (!label0) {
1761                         WARN_ON(1);
1762                         continue;
1763                 }
1764
1765                 ndd = to_ndd(nd_mapping);
1766                 size += nsl_get_rawsize(ndd, label0);
1767                 if (nsl_get_position(ndd, label0) != 0)
1768                         continue;
1769                 WARN_ON(nspm->alt_name || nspm->uuid);
1770                 nspm->alt_name = kmemdup(nsl_ref_name(ndd, label0),
1771                                          NSLABEL_NAME_LEN, GFP_KERNEL);
1772                 nsl_get_uuid(ndd, label0, &uuid);
1773                 nspm->uuid = kmemdup(&uuid, sizeof(uuid_t), GFP_KERNEL);
1774                 nspm->lbasize = nsl_get_lbasize(ndd, label0);
1775                 nspm->nsio.common.claim_class =
1776                         nsl_get_claim_class(ndd, label0);
1777         }
1778
1779         if (!nspm->alt_name || !nspm->uuid) {
1780                 rc = -ENOMEM;
1781                 goto err;
1782         }
1783
1784         nd_namespace_pmem_set_resource(nd_region, nspm, size);
1785
1786         return dev;
1787  err:
1788         namespace_pmem_release(dev);
1789         switch (rc) {
1790         case -EINVAL:
1791                 dev_dbg(&nd_region->dev, "invalid label(s)\n");
1792                 break;
1793         case -ENODEV:
1794                 dev_dbg(&nd_region->dev, "label not found\n");
1795                 break;
1796         default:
1797                 dev_dbg(&nd_region->dev, "unexpected err: %d\n", rc);
1798                 break;
1799         }
1800         return ERR_PTR(rc);
1801 }
1802
1803 static struct device *nd_namespace_pmem_create(struct nd_region *nd_region)
1804 {
1805         struct nd_namespace_pmem *nspm;
1806         struct resource *res;
1807         struct device *dev;
1808
1809         if (!is_memory(&nd_region->dev))
1810                 return NULL;
1811
1812         nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
1813         if (!nspm)
1814                 return NULL;
1815
1816         dev = &nspm->nsio.common.dev;
1817         dev->type = &namespace_pmem_device_type;
1818         dev->parent = &nd_region->dev;
1819         res = &nspm->nsio.res;
1820         res->name = dev_name(&nd_region->dev);
1821         res->flags = IORESOURCE_MEM;
1822
1823         nspm->id = ida_alloc(&nd_region->ns_ida, GFP_KERNEL);
1824         if (nspm->id < 0) {
1825                 kfree(nspm);
1826                 return NULL;
1827         }
1828         dev_set_name(dev, "namespace%d.%d", nd_region->id, nspm->id);
1829         nd_namespace_pmem_set_resource(nd_region, nspm, 0);
1830
1831         return dev;
1832 }
1833
1834 static struct lock_class_key nvdimm_namespace_key;
1835
1836 void nd_region_create_ns_seed(struct nd_region *nd_region)
1837 {
1838         WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1839
1840         if (nd_region_to_nstype(nd_region) == ND_DEVICE_NAMESPACE_IO)
1841                 return;
1842
1843         nd_region->ns_seed = nd_namespace_pmem_create(nd_region);
1844
1845         /*
1846          * Seed creation failures are not fatal, provisioning is simply
1847          * disabled until memory becomes available
1848          */
1849         if (!nd_region->ns_seed)
1850                 dev_err(&nd_region->dev, "failed to create namespace\n");
1851         else {
1852                 device_initialize(nd_region->ns_seed);
1853                 lockdep_set_class(&nd_region->ns_seed->mutex,
1854                                   &nvdimm_namespace_key);
1855                 nd_device_register(nd_region->ns_seed);
1856         }
1857 }
1858
1859 void nd_region_create_dax_seed(struct nd_region *nd_region)
1860 {
1861         WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1862         nd_region->dax_seed = nd_dax_create(nd_region);
1863         /*
1864          * Seed creation failures are not fatal, provisioning is simply
1865          * disabled until memory becomes available
1866          */
1867         if (!nd_region->dax_seed)
1868                 dev_err(&nd_region->dev, "failed to create dax namespace\n");
1869 }
1870
1871 void nd_region_create_pfn_seed(struct nd_region *nd_region)
1872 {
1873         WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1874         nd_region->pfn_seed = nd_pfn_create(nd_region);
1875         /*
1876          * Seed creation failures are not fatal, provisioning is simply
1877          * disabled until memory becomes available
1878          */
1879         if (!nd_region->pfn_seed)
1880                 dev_err(&nd_region->dev, "failed to create pfn namespace\n");
1881 }
1882
1883 void nd_region_create_btt_seed(struct nd_region *nd_region)
1884 {
1885         WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1886         nd_region->btt_seed = nd_btt_create(nd_region);
1887         /*
1888          * Seed creation failures are not fatal, provisioning is simply
1889          * disabled until memory becomes available
1890          */
1891         if (!nd_region->btt_seed)
1892                 dev_err(&nd_region->dev, "failed to create btt namespace\n");
1893 }
1894
1895 static int add_namespace_resource(struct nd_region *nd_region,
1896                 struct nd_namespace_label *nd_label, struct device **devs,
1897                 int count)
1898 {
1899         struct nd_mapping *nd_mapping = &nd_region->mapping[0];
1900         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1901         int i;
1902
1903         for (i = 0; i < count; i++) {
1904                 uuid_t *uuid = namespace_to_uuid(devs[i]);
1905
1906                 if (IS_ERR(uuid)) {
1907                         WARN_ON(1);
1908                         continue;
1909                 }
1910
1911                 if (!nsl_uuid_equal(ndd, nd_label, uuid))
1912                         continue;
1913                 dev_err(&nd_region->dev,
1914                         "error: conflicting extents for uuid: %pUb\n", uuid);
1915                 return -ENXIO;
1916         }
1917
1918         return i;
1919 }
1920
1921 static int cmp_dpa(const void *a, const void *b)
1922 {
1923         const struct device *dev_a = *(const struct device **) a;
1924         const struct device *dev_b = *(const struct device **) b;
1925         struct nd_namespace_pmem *nspm_a, *nspm_b;
1926
1927         if (is_namespace_io(dev_a))
1928                 return 0;
1929
1930         nspm_a = to_nd_namespace_pmem(dev_a);
1931         nspm_b = to_nd_namespace_pmem(dev_b);
1932
1933         return memcmp(&nspm_a->nsio.res.start, &nspm_b->nsio.res.start,
1934                         sizeof(resource_size_t));
1935 }
1936
1937 static struct device **scan_labels(struct nd_region *nd_region)
1938 {
1939         int i, count = 0;
1940         struct device *dev, **devs = NULL;
1941         struct nd_label_ent *label_ent, *e;
1942         struct nd_mapping *nd_mapping = &nd_region->mapping[0];
1943         struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1944         resource_size_t map_end = nd_mapping->start + nd_mapping->size - 1;
1945
1946         /* "safe" because create_namespace_pmem() might list_move() label_ent */
1947         list_for_each_entry_safe(label_ent, e, &nd_mapping->labels, list) {
1948                 struct nd_namespace_label *nd_label = label_ent->label;
1949                 struct device **__devs;
1950
1951                 if (!nd_label)
1952                         continue;
1953
1954                 /* skip labels that describe extents outside of the region */
1955                 if (nsl_get_dpa(ndd, nd_label) < nd_mapping->start ||
1956                     nsl_get_dpa(ndd, nd_label) > map_end)
1957                         continue;
1958
1959                 i = add_namespace_resource(nd_region, nd_label, devs, count);
1960                 if (i < 0)
1961                         goto err;
1962                 if (i < count)
1963                         continue;
1964                 __devs = kcalloc(count + 2, sizeof(dev), GFP_KERNEL);
1965                 if (!__devs)
1966                         goto err;
1967                 memcpy(__devs, devs, sizeof(dev) * count);
1968                 kfree(devs);
1969                 devs = __devs;
1970
1971                 dev = create_namespace_pmem(nd_region, nd_mapping, nd_label);
1972                 if (IS_ERR(dev)) {
1973                         switch (PTR_ERR(dev)) {
1974                         case -EAGAIN:
1975                                 /* skip invalid labels */
1976                                 continue;
1977                         case -ENODEV:
1978                                 /* fallthrough to seed creation */
1979                                 break;
1980                         default:
1981                                 goto err;
1982                         }
1983                 } else
1984                         devs[count++] = dev;
1985
1986         }
1987
1988         dev_dbg(&nd_region->dev, "discovered %d namespace%s\n", count,
1989                 count == 1 ? "" : "s");
1990
1991         if (count == 0) {
1992                 struct nd_namespace_pmem *nspm;
1993
1994                 /* Publish a zero-sized namespace for userspace to configure. */
1995                 nd_mapping_free_labels(nd_mapping);
1996
1997                 devs = kcalloc(2, sizeof(dev), GFP_KERNEL);
1998                 if (!devs)
1999                         goto err;
2000
2001                 nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
2002                 if (!nspm)
2003                         goto err;
2004                 dev = &nspm->nsio.common.dev;
2005                 dev->type = &namespace_pmem_device_type;
2006                 nd_namespace_pmem_set_resource(nd_region, nspm, 0);
2007                 dev->parent = &nd_region->dev;
2008                 devs[count++] = dev;
2009         } else if (is_memory(&nd_region->dev)) {
2010                 /* clean unselected labels */
2011                 for (i = 0; i < nd_region->ndr_mappings; i++) {
2012                         struct list_head *l, *e;
2013                         LIST_HEAD(list);
2014                         int j;
2015
2016                         nd_mapping = &nd_region->mapping[i];
2017                         if (list_empty(&nd_mapping->labels)) {
2018                                 WARN_ON(1);
2019                                 continue;
2020                         }
2021
2022                         j = count;
2023                         list_for_each_safe(l, e, &nd_mapping->labels) {
2024                                 if (!j--)
2025                                         break;
2026                                 list_move_tail(l, &list);
2027                         }
2028                         nd_mapping_free_labels(nd_mapping);
2029                         list_splice_init(&list, &nd_mapping->labels);
2030                 }
2031         }
2032
2033         if (count > 1)
2034                 sort(devs, count, sizeof(struct device *), cmp_dpa, NULL);
2035
2036         return devs;
2037
2038  err:
2039         if (devs) {
2040                 for (i = 0; devs[i]; i++)
2041                         namespace_pmem_release(devs[i]);
2042                 kfree(devs);
2043         }
2044         return NULL;
2045 }
2046
2047 static struct device **create_namespaces(struct nd_region *nd_region)
2048 {
2049         struct nd_mapping *nd_mapping;
2050         struct device **devs;
2051         int i;
2052
2053         if (nd_region->ndr_mappings == 0)
2054                 return NULL;
2055
2056         /* lock down all mappings while we scan labels */
2057         for (i = 0; i < nd_region->ndr_mappings; i++) {
2058                 nd_mapping = &nd_region->mapping[i];
2059                 mutex_lock_nested(&nd_mapping->lock, i);
2060         }
2061
2062         devs = scan_labels(nd_region);
2063
2064         for (i = 0; i < nd_region->ndr_mappings; i++) {
2065                 int reverse = nd_region->ndr_mappings - 1 - i;
2066
2067                 nd_mapping = &nd_region->mapping[reverse];
2068                 mutex_unlock(&nd_mapping->lock);
2069         }
2070
2071         return devs;
2072 }
2073
2074 static void deactivate_labels(void *region)
2075 {
2076         struct nd_region *nd_region = region;
2077         int i;
2078
2079         for (i = 0; i < nd_region->ndr_mappings; i++) {
2080                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
2081                 struct nvdimm_drvdata *ndd = nd_mapping->ndd;
2082                 struct nvdimm *nvdimm = nd_mapping->nvdimm;
2083
2084                 mutex_lock(&nd_mapping->lock);
2085                 nd_mapping_free_labels(nd_mapping);
2086                 mutex_unlock(&nd_mapping->lock);
2087
2088                 put_ndd(ndd);
2089                 nd_mapping->ndd = NULL;
2090                 if (ndd)
2091                         atomic_dec(&nvdimm->busy);
2092         }
2093 }
2094
2095 static int init_active_labels(struct nd_region *nd_region)
2096 {
2097         int i, rc = 0;
2098
2099         for (i = 0; i < nd_region->ndr_mappings; i++) {
2100                 struct nd_mapping *nd_mapping = &nd_region->mapping[i];
2101                 struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
2102                 struct nvdimm *nvdimm = nd_mapping->nvdimm;
2103                 struct nd_label_ent *label_ent;
2104                 int count, j;
2105
2106                 /*
2107                  * If the dimm is disabled then we may need to prevent
2108                  * the region from being activated.
2109                  */
2110                 if (!ndd) {
2111                         if (test_bit(NDD_LOCKED, &nvdimm->flags))
2112                                 /* fail, label data may be unreadable */;
2113                         else if (test_bit(NDD_LABELING, &nvdimm->flags))
2114                                 /* fail, labels needed to disambiguate dpa */;
2115                         else
2116                                 continue;
2117
2118                         dev_err(&nd_region->dev, "%s: is %s, failing probe\n",
2119                                         dev_name(&nd_mapping->nvdimm->dev),
2120                                         test_bit(NDD_LOCKED, &nvdimm->flags)
2121                                         ? "locked" : "disabled");
2122                         rc = -ENXIO;
2123                         goto out;
2124                 }
2125                 nd_mapping->ndd = ndd;
2126                 atomic_inc(&nvdimm->busy);
2127                 get_ndd(ndd);
2128
2129                 count = nd_label_active_count(ndd);
2130                 dev_dbg(ndd->dev, "count: %d\n", count);
2131                 if (!count)
2132                         continue;
2133                 for (j = 0; j < count; j++) {
2134                         struct nd_namespace_label *label;
2135
2136                         label_ent = kzalloc(sizeof(*label_ent), GFP_KERNEL);
2137                         if (!label_ent)
2138                                 break;
2139                         label = nd_label_active(ndd, j);
2140                         label_ent->label = label;
2141
2142                         mutex_lock(&nd_mapping->lock);
2143                         list_add_tail(&label_ent->list, &nd_mapping->labels);
2144                         mutex_unlock(&nd_mapping->lock);
2145                 }
2146
2147                 if (j < count)
2148                         break;
2149         }
2150
2151         if (i < nd_region->ndr_mappings)
2152                 rc = -ENOMEM;
2153
2154 out:
2155         if (rc) {
2156                 deactivate_labels(nd_region);
2157                 return rc;
2158         }
2159
2160         return devm_add_action_or_reset(&nd_region->dev, deactivate_labels,
2161                                         nd_region);
2162 }
2163
2164 int nd_region_register_namespaces(struct nd_region *nd_region, int *err)
2165 {
2166         struct device **devs = NULL;
2167         int i, rc = 0, type;
2168
2169         *err = 0;
2170         nvdimm_bus_lock(&nd_region->dev);
2171         rc = init_active_labels(nd_region);
2172         if (rc) {
2173                 nvdimm_bus_unlock(&nd_region->dev);
2174                 return rc;
2175         }
2176
2177         type = nd_region_to_nstype(nd_region);
2178         switch (type) {
2179         case ND_DEVICE_NAMESPACE_IO:
2180                 devs = create_namespace_io(nd_region);
2181                 break;
2182         case ND_DEVICE_NAMESPACE_PMEM:
2183                 devs = create_namespaces(nd_region);
2184                 break;
2185         default:
2186                 break;
2187         }
2188         nvdimm_bus_unlock(&nd_region->dev);
2189
2190         if (!devs)
2191                 return -ENODEV;
2192
2193         for (i = 0; devs[i]; i++) {
2194                 struct device *dev = devs[i];
2195                 int id;
2196
2197                 if (type == ND_DEVICE_NAMESPACE_PMEM) {
2198                         struct nd_namespace_pmem *nspm;
2199
2200                         nspm = to_nd_namespace_pmem(dev);
2201                         id = ida_alloc(&nd_region->ns_ida, GFP_KERNEL);
2202                         nspm->id = id;
2203                 } else
2204                         id = i;
2205
2206                 if (id < 0)
2207                         break;
2208                 dev_set_name(dev, "namespace%d.%d", nd_region->id, id);
2209                 device_initialize(dev);
2210                 lockdep_set_class(&dev->mutex, &nvdimm_namespace_key);
2211                 nd_device_register(dev);
2212         }
2213         if (i)
2214                 nd_region->ns_seed = devs[0];
2215
2216         if (devs[i]) {
2217                 int j;
2218
2219                 for (j = i; devs[j]; j++) {
2220                         struct device *dev = devs[j];
2221
2222                         device_initialize(dev);
2223                         put_device(dev);
2224                 }
2225                 *err = j - i;
2226                 /*
2227                  * All of the namespaces we tried to register failed, so
2228                  * fail region activation.
2229                  */
2230                 if (*err == 0)
2231                         rc = -ENODEV;
2232         }
2233         kfree(devs);
2234
2235         if (rc == -ENODEV)
2236                 return rc;
2237
2238         return i;
2239 }