Linux v6.13.7, drivers/nvdimm/namespace_devs.c
   1// SPDX-License-Identifier: GPL-2.0-only
   2/*
   3 * Copyright(c) 2013-2015 Intel Corporation. All rights reserved.
   4 */
   5#include <linux/kstrtox.h>
   6#include <linux/module.h>
   7#include <linux/device.h>
   8#include <linux/sort.h>
   9#include <linux/slab.h>
  10#include <linux/list.h>
  11#include <linux/nd.h>
  12#include "nd-core.h"
  13#include "pmem.h"
  14#include "pfn.h"
  15#include "nd.h"
  16
  17static void namespace_io_release(struct device *dev)
  18{
  19	struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
  20
  21	kfree(nsio);
  22}
  23
  24static void namespace_pmem_release(struct device *dev)
  25{
  26	struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
  27	struct nd_region *nd_region = to_nd_region(dev->parent);
  28
  29	if (nspm->id >= 0)
  30		ida_free(&nd_region->ns_ida, nspm->id);
  31	kfree(nspm->alt_name);
  32	kfree(nspm->uuid);
  33	kfree(nspm);
  34}
  35
  36static bool is_namespace_pmem(const struct device *dev);
  37static bool is_namespace_io(const struct device *dev);
  38
  39static int is_uuid_busy(struct device *dev, void *data)
  40{
  41	uuid_t *uuid1 = data, *uuid2 = NULL;
  42
  43	if (is_namespace_pmem(dev)) {
  44		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
  45
  46		uuid2 = nspm->uuid;
  47	} else if (is_nd_btt(dev)) {
  48		struct nd_btt *nd_btt = to_nd_btt(dev);
  49
  50		uuid2 = nd_btt->uuid;
  51	} else if (is_nd_pfn(dev)) {
  52		struct nd_pfn *nd_pfn = to_nd_pfn(dev);
  53
  54		uuid2 = nd_pfn->uuid;
  55	}
  56
  57	if (uuid2 && uuid_equal(uuid1, uuid2))
  58		return -EBUSY;
  59
  60	return 0;
  61}
  62
  63static int is_namespace_uuid_busy(struct device *dev, void *data)
  64{
  65	if (is_nd_region(dev))
  66		return device_for_each_child(dev, data, is_uuid_busy);
  67	return 0;
  68}
  69
  70/**
  71 * nd_is_uuid_unique - verify that no other namespace has @uuid
  72 * @dev: any device on a nvdimm_bus
  73 * @uuid: uuid to check
  74 *
  75 * Returns: %true if the uuid is unique, %false if not
  76 */
  77bool nd_is_uuid_unique(struct device *dev, uuid_t *uuid)
  78{
  79	struct nvdimm_bus *nvdimm_bus = walk_to_nvdimm_bus(dev);
  80
  81	if (!nvdimm_bus)
  82		return false;
  83	WARN_ON_ONCE(!is_nvdimm_bus_locked(&nvdimm_bus->dev));
  84	if (device_for_each_child(&nvdimm_bus->dev, uuid,
  85				is_namespace_uuid_busy) != 0)
  86		return false;
  87	return true;
  88}
  89
  90bool pmem_should_map_pages(struct device *dev)
  91{
  92	struct nd_region *nd_region = to_nd_region(dev->parent);
  93	struct nd_namespace_common *ndns = to_ndns(dev);
  94	struct nd_namespace_io *nsio;
  95
  96	if (!IS_ENABLED(CONFIG_ZONE_DEVICE))
  97		return false;
  98
  99	if (!test_bit(ND_REGION_PAGEMAP, &nd_region->flags))
 100		return false;
 101
 102	if (is_nd_pfn(dev) || is_nd_btt(dev))
 103		return false;
 104
 105	if (ndns->force_raw)
 106		return false;
 107
 108	nsio = to_nd_namespace_io(dev);
 109	if (region_intersects(nsio->res.start, resource_size(&nsio->res),
 110				IORESOURCE_SYSTEM_RAM,
 111				IORES_DESC_NONE) == REGION_MIXED)
 112		return false;
 113
 114	return ARCH_MEMREMAP_PMEM == MEMREMAP_WB;
 115}
 116EXPORT_SYMBOL(pmem_should_map_pages);
 117
 118unsigned int pmem_sector_size(struct nd_namespace_common *ndns)
 119{
 120	if (is_namespace_pmem(&ndns->dev)) {
 121		struct nd_namespace_pmem *nspm;
 122
 123		nspm = to_nd_namespace_pmem(&ndns->dev);
 124		if (nspm->lbasize == 0 || nspm->lbasize == 512)
 125			/* default */;
 126		else if (nspm->lbasize == 4096)
 127			return 4096;
 128		else
 129			dev_WARN(&ndns->dev, "unsupported sector size: %ld\n",
 130					nspm->lbasize);
 131	}
 132
 133	/*
 134	 * There is no namespace label (is_namespace_io()), or the label
 135	 * indicates the default sector size.
 136	 */
 137	return 512;
 138}
 139EXPORT_SYMBOL(pmem_sector_size);
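
/*
 * Example usage (illustrative sketch, not part of this file): a pmem
 * block driver would feed the result into its queue limits, e.g.:
 *
 *	lim.logical_block_size = pmem_sector_size(ndns);
 *
 * Only 512 and 4096 byte sectors are ever reported; any other lbasize
 * in the label trips the dev_WARN() above and falls back to 512.
 */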
 140
 141const char *nvdimm_namespace_disk_name(struct nd_namespace_common *ndns,
 142		char *name)
 143{
 144	struct nd_region *nd_region = to_nd_region(ndns->dev.parent);
 145	const char *suffix = NULL;
 146
 147	if (ndns->claim && is_nd_btt(ndns->claim))
 148		suffix = "s";
 149
 150	if (is_namespace_pmem(&ndns->dev) || is_namespace_io(&ndns->dev)) {
 151		int nsidx = 0;
 152
 153		if (is_namespace_pmem(&ndns->dev)) {
 154			struct nd_namespace_pmem *nspm;
 155
 156			nspm = to_nd_namespace_pmem(&ndns->dev);
 157			nsidx = nspm->id;
 158		}
 159
 160		if (nsidx)
 161			sprintf(name, "pmem%d.%d%s", nd_region->id, nsidx,
 162					suffix ? suffix : "");
 163		else
 164			sprintf(name, "pmem%d%s", nd_region->id,
 165					suffix ? suffix : "");
 166	} else {
 167		return NULL;
 168	}
 169
 170	return name;
 171}
 172EXPORT_SYMBOL(nvdimm_namespace_disk_name);
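
/*
 * Resulting names (illustrative): for region 3, namespace index 0 with
 * no claim this yields "pmem3", index 1 yields "pmem3.1", and the same
 * namespaces fronted by a BTT yield "pmem3s" and "pmem3.1s".
 */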
 173
 174const uuid_t *nd_dev_to_uuid(struct device *dev)
 175{
 176	if (dev && is_namespace_pmem(dev)) {
 177		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 178
 179		return nspm->uuid;
 180	}
 181	return &uuid_null;
 182}
 183EXPORT_SYMBOL(nd_dev_to_uuid);
 184
 185static ssize_t nstype_show(struct device *dev,
 186		struct device_attribute *attr, char *buf)
 187{
 188	struct nd_region *nd_region = to_nd_region(dev->parent);
 189
 190	return sprintf(buf, "%d\n", nd_region_to_nstype(nd_region));
 191}
 192static DEVICE_ATTR_RO(nstype);
 193
 194static ssize_t __alt_name_store(struct device *dev, const char *buf,
 195		const size_t len)
 196{
 197	char *input, *pos, *alt_name, **ns_altname;
 198	ssize_t rc;
 199
 200	if (is_namespace_pmem(dev)) {
 201		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 202
 203		ns_altname = &nspm->alt_name;
 204	} else
 205		return -ENXIO;
 206
 207	if (dev->driver || to_ndns(dev)->claim)
 208		return -EBUSY;
 209
 210	input = kstrndup(buf, len, GFP_KERNEL);
 211	if (!input)
 212		return -ENOMEM;
 213
 214	pos = strim(input);
 215	if (strlen(pos) + 1 > NSLABEL_NAME_LEN) {
 216		rc = -EINVAL;
 217		goto out;
 218	}
 219
 220	alt_name = kzalloc(NSLABEL_NAME_LEN, GFP_KERNEL);
 221	if (!alt_name) {
 222		rc = -ENOMEM;
 223		goto out;
 224	}
 225	kfree(*ns_altname);
 226	*ns_altname = alt_name;
 227	sprintf(*ns_altname, "%s", pos);
 228	rc = len;
 229
 230out:
 231	kfree(input);
 232	return rc;
 233}
 234
 235static int nd_namespace_label_update(struct nd_region *nd_region,
 236		struct device *dev)
 237{
 238	dev_WARN_ONCE(dev, dev->driver || to_ndns(dev)->claim,
 239			"namespace must be idle during label update\n");
 240	if (dev->driver || to_ndns(dev)->claim)
 241		return 0;
 242
 243	/*
 244	 * Only allow label writes that will result in a valid namespace
 245	 * or deletion of an existing namespace.
 246	 */
 247	if (is_namespace_pmem(dev)) {
 248		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 249		resource_size_t size = resource_size(&nspm->nsio.res);
 250
 251		if (size == 0 && nspm->uuid)
 252			/* delete allocation */;
 253		else if (!nspm->uuid)
 254			return 0;
 255
 256		return nd_pmem_namespace_label_update(nd_region, nspm, size);
 257	} else
 258		return -ENXIO;
 259}
 260
 261static ssize_t alt_name_store(struct device *dev,
 262		struct device_attribute *attr, const char *buf, size_t len)
 263{
 264	struct nd_region *nd_region = to_nd_region(dev->parent);
 265	ssize_t rc;
 266
 267	device_lock(dev);
 268	nvdimm_bus_lock(dev);
 269	wait_nvdimm_bus_probe_idle(dev);
 270	rc = __alt_name_store(dev, buf, len);
 271	if (rc >= 0)
 272		rc = nd_namespace_label_update(nd_region, dev);
 273	dev_dbg(dev, "%s(%zd)\n", rc < 0 ? "fail " : "", rc);
 274	nvdimm_bus_unlock(dev);
 275	device_unlock(dev);
 276
 277	return rc < 0 ? rc : len;
 278}
 279
 280static ssize_t alt_name_show(struct device *dev,
 281		struct device_attribute *attr, char *buf)
 282{
 283	char *ns_altname;
 284
 285	if (is_namespace_pmem(dev)) {
 286		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 287
 288		ns_altname = nspm->alt_name;
 289	} else
 290		return -ENXIO;
 291
 292	return sprintf(buf, "%s\n", ns_altname ? ns_altname : "");
 293}
 294static DEVICE_ATTR_RW(alt_name);
 295
 296static int scan_free(struct nd_region *nd_region,
 297		struct nd_mapping *nd_mapping, struct nd_label_id *label_id,
 298		resource_size_t n)
 299{
 300	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 301	int rc = 0;
 302
 303	while (n) {
 304		struct resource *res, *last;
 305
 306		last = NULL;
 307		for_each_dpa_resource(ndd, res)
 308			if (strcmp(res->name, label_id->id) == 0)
 309				last = res;
 310		res = last;
 311		if (!res)
 312			return 0;
 313
 314		if (n >= resource_size(res)) {
 315			n -= resource_size(res);
 316			nd_dbg_dpa(nd_region, ndd, res, "delete %d\n", rc);
 317			nvdimm_free_dpa(ndd, res);
 318			/* retry with last resource deleted */
 319			continue;
 320		}
 321
 322		rc = adjust_resource(res, res->start, resource_size(res) - n);
 323		if (rc == 0)
 324			res->flags |= DPA_RESOURCE_ADJUSTED;
 325		nd_dbg_dpa(nd_region, ndd, res, "shrink %d\n", rc);
 326		break;
 327	}
 328
 329	return rc;
 330}
 331
 332/**
 333 * shrink_dpa_allocation - for each dimm in region free n bytes for label_id
 334 * @nd_region: the set of dimms to reclaim @n bytes from
 335 * @label_id: unique identifier for the namespace consuming this dpa range
 336 * @n: number of bytes per-dimm to release
 337 *
 338 * Assumes resources are ordered.  Starting from the end try to
 339 * adjust_resource() the allocation to @n, but if @n is larger than the
 340 * allocation delete it and find the 'new' last allocation in the label
 341 * set.
 342 *
  343 * Returns: %0 on success or -errno on error
 344 */
 345static int shrink_dpa_allocation(struct nd_region *nd_region,
 346		struct nd_label_id *label_id, resource_size_t n)
 347{
 348	int i;
 349
 350	for (i = 0; i < nd_region->ndr_mappings; i++) {
 351		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 352		int rc;
 353
 354		rc = scan_free(nd_region, nd_mapping, label_id, n);
 355		if (rc)
 356			return rc;
 357	}
 358
 359	return 0;
 360}
 361
 362static resource_size_t init_dpa_allocation(struct nd_label_id *label_id,
 363		struct nd_region *nd_region, struct nd_mapping *nd_mapping,
 364		resource_size_t n)
 365{
 366	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 367	struct resource *res;
 368	int rc = 0;
 369
 370	/* first resource allocation for this label-id or dimm */
 371	res = nvdimm_allocate_dpa(ndd, label_id, nd_mapping->start, n);
 372	if (!res)
 373		rc = -EBUSY;
 374
 375	nd_dbg_dpa(nd_region, ndd, res, "init %d\n", rc);
 376	return rc ? n : 0;
 377}
 378
 379
 380/**
 381 * space_valid() - validate free dpa space against constraints
 382 * @nd_region: hosting region of the free space
 383 * @ndd: dimm device data for debug
 384 * @label_id: namespace id to allocate space
 385 * @prev: potential allocation that precedes free space
 386 * @next: allocation that follows the given free space range
 387 * @exist: first allocation with same id in the mapping
  388 * @n: range that must be satisfied for pmem allocations
 389 * @valid: free space range to validate
 390 *
 391 * BLK-space is valid as long as it does not precede a PMEM
 392 * allocation in a given region. PMEM-space must be contiguous
 393 * and adjacent to an existing allocation (if one
 394 * exists).  If reserving PMEM any space is valid.
 395 */
 396static void space_valid(struct nd_region *nd_region, struct nvdimm_drvdata *ndd,
 397		struct nd_label_id *label_id, struct resource *prev,
 398		struct resource *next, struct resource *exist,
 399		resource_size_t n, struct resource *valid)
 400{
 401	bool is_reserve = strcmp(label_id->id, "pmem-reserve") == 0;
 402	unsigned long align;
 403
 404	align = nd_region->align / nd_region->ndr_mappings;
 405	valid->start = ALIGN(valid->start, align);
 406	valid->end = ALIGN_DOWN(valid->end + 1, align) - 1;
 407
 408	if (valid->start >= valid->end)
 409		goto invalid;
 410
 411	if (is_reserve)
 412		return;
 413
 414	/* allocation needs to be contiguous, so this is all or nothing */
 415	if (resource_size(valid) < n)
 416		goto invalid;
 417
 418	/* we've got all the space we need and no existing allocation */
 419	if (!exist)
 420		return;
 421
 422	/* allocation needs to be contiguous with the existing namespace */
 423	if (valid->start == exist->end + 1
 424			|| valid->end == exist->start - 1)
 425		return;
 426
 427 invalid:
 428	/* truncate @valid size to 0 */
 429	valid->end = valid->start - 1;
 430}
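
/*
 * Worked example of the alignment above (illustrative numbers): with
 * nd_region->align = 16M interleaved across 4 mappings, the per-dimm
 * align is 4M.  A free range of [0x500000, 0xbfffff] (7M) is clamped
 * to [0x800000, 0xbfffff] (4M): the start rounds up to a 4M boundary
 * and end + 1 rounds down to one.
 */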
 431
 432enum alloc_loc {
 433	ALLOC_ERR = 0, ALLOC_BEFORE, ALLOC_MID, ALLOC_AFTER,
 434};
 435
 436static resource_size_t scan_allocate(struct nd_region *nd_region,
 437		struct nd_mapping *nd_mapping, struct nd_label_id *label_id,
 438		resource_size_t n)
 439{
 440	resource_size_t mapping_end = nd_mapping->start + nd_mapping->size - 1;
 441	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 442	struct resource *res, *exist = NULL, valid;
 443	const resource_size_t to_allocate = n;
 444	int first;
 445
 446	for_each_dpa_resource(ndd, res)
 447		if (strcmp(label_id->id, res->name) == 0)
 448			exist = res;
 449
 450	valid.start = nd_mapping->start;
 451	valid.end = mapping_end;
 452	valid.name = "free space";
 453 retry:
 454	first = 0;
 455	for_each_dpa_resource(ndd, res) {
 456		struct resource *next = res->sibling, *new_res = NULL;
 457		resource_size_t allocate, available = 0;
 458		enum alloc_loc loc = ALLOC_ERR;
 459		const char *action;
 460		int rc = 0;
 461
 462		/* ignore resources outside this nd_mapping */
 463		if (res->start > mapping_end)
 464			continue;
 465		if (res->end < nd_mapping->start)
 466			continue;
 467
 468		/* space at the beginning of the mapping */
 469		if (!first++ && res->start > nd_mapping->start) {
 470			valid.start = nd_mapping->start;
 471			valid.end = res->start - 1;
 472			space_valid(nd_region, ndd, label_id, NULL, next, exist,
 473					to_allocate, &valid);
 474			available = resource_size(&valid);
 475			if (available)
 476				loc = ALLOC_BEFORE;
 477		}
 478
 479		/* space between allocations */
 480		if (!loc && next) {
 481			valid.start = res->start + resource_size(res);
 482			valid.end = min(mapping_end, next->start - 1);
 483			space_valid(nd_region, ndd, label_id, res, next, exist,
 484					to_allocate, &valid);
 485			available = resource_size(&valid);
 486			if (available)
 487				loc = ALLOC_MID;
 488		}
 489
 490		/* space at the end of the mapping */
 491		if (!loc && !next) {
 492			valid.start = res->start + resource_size(res);
 493			valid.end = mapping_end;
 494			space_valid(nd_region, ndd, label_id, res, next, exist,
 495					to_allocate, &valid);
 496			available = resource_size(&valid);
 497			if (available)
 498				loc = ALLOC_AFTER;
 499		}
 500
 501		if (!loc || !available)
 502			continue;
 503		allocate = min(available, n);
 504		switch (loc) {
 505		case ALLOC_BEFORE:
 506			if (strcmp(res->name, label_id->id) == 0) {
 507				/* adjust current resource up */
 508				rc = adjust_resource(res, res->start - allocate,
 509						resource_size(res) + allocate);
 510				action = "cur grow up";
 511			} else
 512				action = "allocate";
 513			break;
 514		case ALLOC_MID:
 515			if (strcmp(next->name, label_id->id) == 0) {
 516				/* adjust next resource up */
 517				rc = adjust_resource(next, next->start
 518						- allocate, resource_size(next)
 519						+ allocate);
 520				new_res = next;
 521				action = "next grow up";
 522			} else if (strcmp(res->name, label_id->id) == 0) {
 523				action = "grow down";
 524			} else
 525				action = "allocate";
 526			break;
 527		case ALLOC_AFTER:
 528			if (strcmp(res->name, label_id->id) == 0)
 529				action = "grow down";
 530			else
 531				action = "allocate";
 532			break;
 533		default:
 534			return n;
 535		}
 536
 537		if (strcmp(action, "allocate") == 0) {
 538			new_res = nvdimm_allocate_dpa(ndd, label_id,
 539					valid.start, allocate);
 540			if (!new_res)
 541				rc = -EBUSY;
 542		} else if (strcmp(action, "grow down") == 0) {
 543			/* adjust current resource down */
 544			rc = adjust_resource(res, res->start, resource_size(res)
 545					+ allocate);
 546			if (rc == 0)
 547				res->flags |= DPA_RESOURCE_ADJUSTED;
 548		}
 549
 550		if (!new_res)
 551			new_res = res;
 552
 553		nd_dbg_dpa(nd_region, ndd, new_res, "%s(%d) %d\n",
 554				action, loc, rc);
 555
 556		if (rc)
 557			return n;
 558
 559		n -= allocate;
 560		if (n) {
 561			/*
 562			 * Retry scan with newly inserted resources.
 563			 * For example, if we did an ALLOC_BEFORE
 564			 * insertion there may also have been space
 565			 * available for an ALLOC_AFTER insertion, so we
 566			 * need to check this same resource again
 567			 */
 568			goto retry;
 569		} else
 570			return 0;
 571	}
 572
 573	if (n == to_allocate)
 574		return init_dpa_allocation(label_id, nd_region, nd_mapping, n);
 575	return n;
 576}
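
/*
 * Sketch of the three windows probed per visited resource (BEFORE is
 * only considered for the first resource in the mapping, AFTER only
 * when the visited resource has no sibling):
 *
 *	mapping:  |<--------------- nd_mapping --------------->|
 *	existing:           |## res ##|        |## next ##|
 *	windows:  [BEFORE]            [  MID  ]            [AFTER]
 *
 * A window becomes an allocation only if space_valid() leaves it
 * non-empty, and growing an adjacent same-label resource is preferred
 * over inserting a new extent.
 */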
 577
 578static int merge_dpa(struct nd_region *nd_region,
 579		struct nd_mapping *nd_mapping, struct nd_label_id *label_id)
 580{
 581	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 582	struct resource *res;
 583
 584	if (strncmp("pmem", label_id->id, 4) == 0)
 585		return 0;
 586 retry:
 587	for_each_dpa_resource(ndd, res) {
 588		int rc;
 589		struct resource *next = res->sibling;
 590		resource_size_t end = res->start + resource_size(res);
 591
 592		if (!next || strcmp(res->name, label_id->id) != 0
 593				|| strcmp(next->name, label_id->id) != 0
 594				|| end != next->start)
 595			continue;
 596		end += resource_size(next);
 597		nvdimm_free_dpa(ndd, next);
 598		rc = adjust_resource(res, res->start, end - res->start);
 599		nd_dbg_dpa(nd_region, ndd, res, "merge %d\n", rc);
 600		if (rc)
 601			return rc;
 602		res->flags |= DPA_RESOURCE_ADJUSTED;
 603		goto retry;
 604	}
 605
 606	return 0;
 607}
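
/*
 * Note: nd_label_gen_id() formats pmem label ids as "pmem-<uuid>" and
 * the reservation id is "pmem-reserve", so current callers always take
 * the early return above; the merge loop is effectively a leftover
 * from the removed BLK mode, where discontiguous extents sharing a
 * label id had to be coalesced.
 */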
 608
 609int __reserve_free_pmem(struct device *dev, void *data)
 610{
 611	struct nvdimm *nvdimm = data;
 612	struct nd_region *nd_region;
 613	struct nd_label_id label_id;
 614	int i;
 615
 616	if (!is_memory(dev))
 617		return 0;
 618
 619	nd_region = to_nd_region(dev);
 620	if (nd_region->ndr_mappings == 0)
 621		return 0;
 622
 623	memset(&label_id, 0, sizeof(label_id));
 624	strcat(label_id.id, "pmem-reserve");
 625	for (i = 0; i < nd_region->ndr_mappings; i++) {
 626		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 627		resource_size_t n, rem = 0;
 628
 629		if (nd_mapping->nvdimm != nvdimm)
 630			continue;
 631
 632		n = nd_pmem_available_dpa(nd_region, nd_mapping);
 633		if (n == 0)
 634			return 0;
 635		rem = scan_allocate(nd_region, nd_mapping, &label_id, n);
 636		dev_WARN_ONCE(&nd_region->dev, rem,
 637				"pmem reserve underrun: %#llx of %#llx bytes\n",
 638				(unsigned long long) n - rem,
 639				(unsigned long long) n);
 640		return rem ? -ENXIO : 0;
 641	}
 642
 643	return 0;
 644}
 645
 646void release_free_pmem(struct nvdimm_bus *nvdimm_bus,
 647		struct nd_mapping *nd_mapping)
 648{
 649	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 650	struct resource *res, *_res;
 651
 652	for_each_dpa_resource_safe(ndd, res, _res)
 653		if (strcmp(res->name, "pmem-reserve") == 0)
 654			nvdimm_free_dpa(ndd, res);
 655}
 656
 657/**
 658 * grow_dpa_allocation - for each dimm allocate n bytes for @label_id
 659 * @nd_region: the set of dimms to allocate @n more bytes from
 660 * @label_id: unique identifier for the namespace consuming this dpa range
 661 * @n: number of bytes per-dimm to add to the existing allocation
 662 *
 663 * Assumes resources are ordered.  For BLK regions, first consume
 664 * BLK-only available DPA free space, then consume PMEM-aliased DPA
 665 * space starting at the highest DPA.  For PMEM regions start
 666 * allocations from the start of an interleave set and end at the first
 667 * BLK allocation or the end of the interleave set, whichever comes
 668 * first.
 669 *
 670 * Returns: %0 on success or -errno on error
 671 */
 672static int grow_dpa_allocation(struct nd_region *nd_region,
 673		struct nd_label_id *label_id, resource_size_t n)
 674{
 675	int i;
 676
 677	for (i = 0; i < nd_region->ndr_mappings; i++) {
 678		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 679		resource_size_t rem = n;
 680		int rc;
 681
 682		rem = scan_allocate(nd_region, nd_mapping, label_id, rem);
 683		dev_WARN_ONCE(&nd_region->dev, rem,
 684				"allocation underrun: %#llx of %#llx bytes\n",
 685				(unsigned long long) n - rem,
 686				(unsigned long long) n);
 687		if (rem)
 688			return -ENXIO;
 689
 690		rc = merge_dpa(nd_region, nd_mapping, label_id);
 691		if (rc)
 692			return rc;
 693	}
 694
 695	return 0;
 696}
 697
 698static void nd_namespace_pmem_set_resource(struct nd_region *nd_region,
 699		struct nd_namespace_pmem *nspm, resource_size_t size)
 700{
 701	struct resource *res = &nspm->nsio.res;
 702	resource_size_t offset = 0;
 703
 704	if (size && !nspm->uuid) {
 705		WARN_ON_ONCE(1);
 706		size = 0;
 707	}
 708
 709	if (size && nspm->uuid) {
 710		struct nd_mapping *nd_mapping = &nd_region->mapping[0];
 711		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 712		struct nd_label_id label_id;
 713		struct resource *res;
 714
 715		if (!ndd) {
 716			size = 0;
 717			goto out;
 718		}
 719
 720		nd_label_gen_id(&label_id, nspm->uuid, 0);
 721
 722		/* calculate a spa offset from the dpa allocation offset */
 723		for_each_dpa_resource(ndd, res)
 724			if (strcmp(res->name, label_id.id) == 0) {
 725				offset = (res->start - nd_mapping->start)
 726					* nd_region->ndr_mappings;
 727				goto out;
 728			}
 729
 730		WARN_ON_ONCE(1);
 731		size = 0;
 732	}
 733
 734 out:
 735	res->start = nd_region->ndr_start + offset;
 736	res->end = res->start + size - 1;
 737}
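
/*
 * Worked example of the offset math above (illustrative numbers): with
 * 4 interleaved mappings and the namespace's dpa extent starting
 * 0x1000000 bytes into each dimm, the namespace begins at
 * ndr_start + 0x1000000 * 4 = ndr_start + 0x4000000 in system physical
 * address space.
 */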
 738
 739static bool uuid_not_set(const uuid_t *uuid, struct device *dev,
 740			 const char *where)
 741{
 742	if (!uuid) {
 743		dev_dbg(dev, "%s: uuid not set\n", where);
 744		return true;
 745	}
 746	return false;
 747}
 748
 749static ssize_t __size_store(struct device *dev, unsigned long long val)
 750{
 751	resource_size_t allocated = 0, available = 0;
 752	struct nd_region *nd_region = to_nd_region(dev->parent);
 753	struct nd_namespace_common *ndns = to_ndns(dev);
 754	struct nd_mapping *nd_mapping;
 755	struct nvdimm_drvdata *ndd;
 756	struct nd_label_id label_id;
 757	u32 flags = 0, remainder;
 758	int rc, i, id = -1;
 759	uuid_t *uuid = NULL;
 760
 761	if (dev->driver || ndns->claim)
 762		return -EBUSY;
 763
 764	if (is_namespace_pmem(dev)) {
 765		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 766
 767		uuid = nspm->uuid;
 768		id = nspm->id;
 769	}
 770
 771	/*
 772	 * We need a uuid for the allocation-label and dimm(s) on which
 773	 * to store the label.
 774	 */
 775	if (uuid_not_set(uuid, dev, __func__))
 776		return -ENXIO;
 777	if (nd_region->ndr_mappings == 0) {
 778		dev_dbg(dev, "not associated with dimm(s)\n");
 779		return -ENXIO;
 780	}
 781
 782	div_u64_rem(val, nd_region->align, &remainder);
 783	if (remainder) {
 784		dev_dbg(dev, "%llu is not %ldK aligned\n", val,
 785				nd_region->align / SZ_1K);
 786		return -EINVAL;
 787	}
 788
 789	nd_label_gen_id(&label_id, uuid, flags);
 790	for (i = 0; i < nd_region->ndr_mappings; i++) {
 791		nd_mapping = &nd_region->mapping[i];
 792		ndd = to_ndd(nd_mapping);
 793
 794		/*
 795		 * All dimms in an interleave set need to be enabled
 796		 * for the size to be changed.
 797		 */
 798		if (!ndd)
 799			return -ENXIO;
 800
 801		allocated += nvdimm_allocated_dpa(ndd, &label_id);
 802	}
 803	available = nd_region_allocatable_dpa(nd_region);
 804
 805	if (val > available + allocated)
 806		return -ENOSPC;
 807
 808	if (val == allocated)
 809		return 0;
 810
 811	val = div_u64(val, nd_region->ndr_mappings);
 812	allocated = div_u64(allocated, nd_region->ndr_mappings);
 813	if (val < allocated)
 814		rc = shrink_dpa_allocation(nd_region, &label_id,
 815				allocated - val);
 816	else
 817		rc = grow_dpa_allocation(nd_region, &label_id, val - allocated);
 818
 819	if (rc)
 820		return rc;
 821
 822	if (is_namespace_pmem(dev)) {
 823		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 824
 825		nd_namespace_pmem_set_resource(nd_region, nspm,
 826				val * nd_region->ndr_mappings);
 827	}
 828
 829	/*
 830	 * Try to delete the namespace if we deleted all of its
 831	 * allocation, this is not the seed or 0th device for the
 832	 * region, and it is not actively claimed by a btt, pfn, or dax
 833	 * instance.
 834	 */
 835	if (val == 0 && id != 0 && nd_region->ns_seed != dev && !ndns->claim)
 836		nd_device_unregister(dev, ND_ASYNC);
 837
 838	return rc;
 839}
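
/*
 * Example of the per-dimm accounting above (illustrative numbers):
 * writing 2G to 'size' on a 2-way interleaved region provisions 1G on
 * each dimm; later shrinking the namespace to 1G calls
 * shrink_dpa_allocation() with n = 512M per dimm.
 */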
 840
 841static ssize_t size_store(struct device *dev,
 842		struct device_attribute *attr, const char *buf, size_t len)
 843{
 844	struct nd_region *nd_region = to_nd_region(dev->parent);
 845	unsigned long long val;
 846	int rc;
 847
 848	rc = kstrtoull(buf, 0, &val);
 849	if (rc)
 850		return rc;
 851
 852	device_lock(dev);
 853	nvdimm_bus_lock(dev);
 854	wait_nvdimm_bus_probe_idle(dev);
 855	rc = __size_store(dev, val);
 856	if (rc >= 0)
 857		rc = nd_namespace_label_update(nd_region, dev);
 858
 859	/* setting size zero == 'delete namespace' */
 860	if (rc == 0 && val == 0 && is_namespace_pmem(dev)) {
 861		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 862
 863		kfree(nspm->uuid);
 864		nspm->uuid = NULL;
 865	}
 866
 867	dev_dbg(dev, "%llx %s (%d)\n", val, rc < 0 ? "fail" : "success", rc);
 868
 869	nvdimm_bus_unlock(dev);
 870	device_unlock(dev);
 871
 872	return rc < 0 ? rc : len;
 873}
 874
 875resource_size_t __nvdimm_namespace_capacity(struct nd_namespace_common *ndns)
 876{
 877	struct device *dev = &ndns->dev;
 878
 879	if (is_namespace_pmem(dev)) {
 880		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 881
 882		return resource_size(&nspm->nsio.res);
 883	} else if (is_namespace_io(dev)) {
 884		struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
 885
 886		return resource_size(&nsio->res);
 887	} else
 888		WARN_ONCE(1, "unknown namespace type\n");
 889	return 0;
 890}
 891
 892resource_size_t nvdimm_namespace_capacity(struct nd_namespace_common *ndns)
 893{
 894	resource_size_t size;
 895
 896	nvdimm_bus_lock(&ndns->dev);
 897	size = __nvdimm_namespace_capacity(ndns);
 898	nvdimm_bus_unlock(&ndns->dev);
 899
 900	return size;
 901}
 902EXPORT_SYMBOL(nvdimm_namespace_capacity);
 903
 904bool nvdimm_namespace_locked(struct nd_namespace_common *ndns)
 905{
 906	int i;
 907	bool locked = false;
 908	struct device *dev = &ndns->dev;
 909	struct nd_region *nd_region = to_nd_region(dev->parent);
 910
 911	for (i = 0; i < nd_region->ndr_mappings; i++) {
 912		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 913		struct nvdimm *nvdimm = nd_mapping->nvdimm;
 914
 915		if (test_bit(NDD_LOCKED, &nvdimm->flags)) {
 916			dev_dbg(dev, "%s locked\n", nvdimm_name(nvdimm));
 917			locked = true;
 918		}
 919	}
 920	return locked;
 921}
 922EXPORT_SYMBOL(nvdimm_namespace_locked);
 923
 924static ssize_t size_show(struct device *dev,
 925		struct device_attribute *attr, char *buf)
 926{
 927	return sprintf(buf, "%llu\n", (unsigned long long)
 928			nvdimm_namespace_capacity(to_ndns(dev)));
 929}
 930static DEVICE_ATTR(size, 0444, size_show, size_store);
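
/*
 * Note: 'size' is declared 0444 here, but namespace_visible() below
 * promotes it to 0644 for pmem namespaces, so only provisionable
 * namespace types accept writes.
 */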
 931
 932static uuid_t *namespace_to_uuid(struct device *dev)
 933{
 934	if (is_namespace_pmem(dev)) {
 935		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 936
 937		return nspm->uuid;
 938	}
 939	return ERR_PTR(-ENXIO);
 940}
 941
 942static ssize_t uuid_show(struct device *dev, struct device_attribute *attr,
 943			 char *buf)
 944{
 945	uuid_t *uuid = namespace_to_uuid(dev);
 946
 947	if (IS_ERR(uuid))
 948		return PTR_ERR(uuid);
 949	if (uuid)
 950		return sprintf(buf, "%pUb\n", uuid);
 951	return sprintf(buf, "\n");
 952}
 953
 954/**
 955 * namespace_update_uuid - check for a unique uuid and whether we're "renaming"
 956 * @nd_region: parent region so we can update all dimms in the set
 957 * @dev: namespace type for generating label_id
 958 * @new_uuid: incoming uuid
 959 * @old_uuid: reference to the uuid storage location in the namespace object
 960 *
 961 * Returns: %0 on success or -errno on error
 962 */
 963static int namespace_update_uuid(struct nd_region *nd_region,
 964				 struct device *dev, uuid_t *new_uuid,
 965				 uuid_t **old_uuid)
 966{
 967	struct nd_label_id old_label_id;
 968	struct nd_label_id new_label_id;
 969	int i;
 970
 971	if (!nd_is_uuid_unique(dev, new_uuid))
 972		return -EINVAL;
 973
 974	if (*old_uuid == NULL)
 975		goto out;
 976
 977	/*
 978	 * If we've already written a label with this uuid, then it's
 979	 * too late to rename because we can't reliably update the uuid
 980	 * without losing the old namespace.  Userspace must delete this
 981	 * namespace to abandon the old uuid.
 982	 */
 983	for (i = 0; i < nd_region->ndr_mappings; i++) {
 984		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 985
 986		/*
 987		 * This check by itself is sufficient because old_uuid
 988		 * would be NULL above if this uuid did not exist in the
 989		 * currently written set.
 990		 *
 991		 * FIXME: can we delete uuid with zero dpa allocated?
 992		 */
 993		if (list_empty(&nd_mapping->labels))
 994			return -EBUSY;
 995	}
 996
 997	nd_label_gen_id(&old_label_id, *old_uuid, 0);
 998	nd_label_gen_id(&new_label_id, new_uuid, 0);
 999	for (i = 0; i < nd_region->ndr_mappings; i++) {
1000		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1001		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1002		struct nd_label_ent *label_ent;
1003		struct resource *res;
1004
1005		for_each_dpa_resource(ndd, res)
1006			if (strcmp(res->name, old_label_id.id) == 0)
1007				sprintf((void *) res->name, "%s",
1008						new_label_id.id);
1009
1010		mutex_lock(&nd_mapping->lock);
1011		list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1012			struct nd_namespace_label *nd_label = label_ent->label;
1013			struct nd_label_id label_id;
1014			uuid_t uuid;
1015
1016			if (!nd_label)
1017				continue;
1018			nsl_get_uuid(ndd, nd_label, &uuid);
1019			nd_label_gen_id(&label_id, &uuid,
1020					nsl_get_flags(ndd, nd_label));
1021			if (strcmp(old_label_id.id, label_id.id) == 0)
1022				set_bit(ND_LABEL_REAP, &label_ent->flags);
1023		}
1024		mutex_unlock(&nd_mapping->lock);
1025	}
1026	kfree(*old_uuid);
1027 out:
1028	*old_uuid = new_uuid;
1029	return 0;
1030}
1031
1032static ssize_t uuid_store(struct device *dev,
1033		struct device_attribute *attr, const char *buf, size_t len)
1034{
1035	struct nd_region *nd_region = to_nd_region(dev->parent);
1036	uuid_t *uuid = NULL;
1037	uuid_t **ns_uuid;
1038	ssize_t rc = 0;
1039
1040	if (is_namespace_pmem(dev)) {
1041		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1042
1043		ns_uuid = &nspm->uuid;
1044	} else
1045		return -ENXIO;
1046
1047	device_lock(dev);
1048	nvdimm_bus_lock(dev);
1049	wait_nvdimm_bus_probe_idle(dev);
1050	if (to_ndns(dev)->claim)
1051		rc = -EBUSY;
1052	if (rc >= 0)
1053		rc = nd_uuid_store(dev, &uuid, buf, len);
1054	if (rc >= 0)
1055		rc = namespace_update_uuid(nd_region, dev, uuid, ns_uuid);
1056	if (rc >= 0)
1057		rc = nd_namespace_label_update(nd_region, dev);
1058	else
1059		kfree(uuid);
1060	dev_dbg(dev, "result: %zd wrote: %s%s", rc, buf,
1061			buf[len - 1] == '\n' ? "" : "\n");
1062	nvdimm_bus_unlock(dev);
1063	device_unlock(dev);
1064
1065	return rc < 0 ? rc : len;
1066}
1067static DEVICE_ATTR_RW(uuid);
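
/*
 * Example (hypothetical device and uuid): a namespace can only be
 * "renamed" while no label with the old uuid has been written, e.g.
 *
 *	echo 11111111-2222-3333-4444-555555555555 > \
 *		/sys/bus/nd/devices/namespace0.0/uuid
 *
 * Otherwise namespace_update_uuid() above refuses the write and the
 * namespace must be deleted instead.
 */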
1068
1069static ssize_t resource_show(struct device *dev,
1070		struct device_attribute *attr, char *buf)
1071{
1072	struct resource *res;
1073
1074	if (is_namespace_pmem(dev)) {
1075		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1076
1077		res = &nspm->nsio.res;
1078	} else if (is_namespace_io(dev)) {
1079		struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
1080
1081		res = &nsio->res;
1082	} else
1083		return -ENXIO;
1084
1085	/* no address to convey if the namespace has no allocation */
1086	if (resource_size(res) == 0)
1087		return -ENXIO;
1088	return sprintf(buf, "%#llx\n", (unsigned long long) res->start);
1089}
1090static DEVICE_ATTR_ADMIN_RO(resource);
1091
1092static const unsigned long pmem_lbasize_supported[] = { 512, 4096, 0 };
1093
1094static ssize_t sector_size_show(struct device *dev,
1095		struct device_attribute *attr, char *buf)
1096{
1097	if (is_namespace_pmem(dev)) {
1098		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1099
1100		return nd_size_select_show(nspm->lbasize,
1101				pmem_lbasize_supported, buf);
1102	}
1103	return -ENXIO;
1104}
1105
1106static ssize_t sector_size_store(struct device *dev,
1107		struct device_attribute *attr, const char *buf, size_t len)
1108{
1109	struct nd_region *nd_region = to_nd_region(dev->parent);
1110	const unsigned long *supported;
1111	unsigned long *lbasize;
1112	ssize_t rc = 0;
1113
1114	if (is_namespace_pmem(dev)) {
1115		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1116
1117		lbasize = &nspm->lbasize;
1118		supported = pmem_lbasize_supported;
1119	} else
1120		return -ENXIO;
1121
1122	device_lock(dev);
1123	nvdimm_bus_lock(dev);
1124	if (to_ndns(dev)->claim)
1125		rc = -EBUSY;
1126	if (rc >= 0)
1127		rc = nd_size_select_store(dev, buf, lbasize, supported);
1128	if (rc >= 0)
1129		rc = nd_namespace_label_update(nd_region, dev);
1130	dev_dbg(dev, "result: %zd %s: %s%s", rc, rc < 0 ? "tried" : "wrote",
1131			buf, buf[len - 1] == '\n' ? "" : "\n");
1132	nvdimm_bus_unlock(dev);
1133	device_unlock(dev);
1134
1135	return rc ? rc : len;
1136}
1137static DEVICE_ATTR_RW(sector_size);
1138
1139static ssize_t dpa_extents_show(struct device *dev,
1140		struct device_attribute *attr, char *buf)
1141{
1142	struct nd_region *nd_region = to_nd_region(dev->parent);
1143	struct nd_label_id label_id;
1144	uuid_t *uuid = NULL;
1145	int count = 0, i;
1146	u32 flags = 0;
1147
1148	nvdimm_bus_lock(dev);
1149	if (is_namespace_pmem(dev)) {
1150		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1151
1152		uuid = nspm->uuid;
1153		flags = 0;
1154	}
1155
1156	if (!uuid)
1157		goto out;
1158
1159	nd_label_gen_id(&label_id, uuid, flags);
1160	for (i = 0; i < nd_region->ndr_mappings; i++) {
1161		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1162		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1163		struct resource *res;
1164
1165		for_each_dpa_resource(ndd, res)
1166			if (strcmp(res->name, label_id.id) == 0)
1167				count++;
1168	}
1169 out:
1170	nvdimm_bus_unlock(dev);
1171
1172	return sprintf(buf, "%d\n", count);
1173}
1174static DEVICE_ATTR_RO(dpa_extents);
1175
1176static int btt_claim_class(struct device *dev)
1177{
1178	struct nd_region *nd_region = to_nd_region(dev->parent);
1179	int i, loop_bitmask = 0;
1180
1181	for (i = 0; i < nd_region->ndr_mappings; i++) {
1182		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1183		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1184		struct nd_namespace_index *nsindex;
1185
1186		/*
1187		 * If any of the DIMMs do not support labels, the only
1188		 * possible BTT format is v1.
1189		 */
1190		if (!ndd) {
1191			loop_bitmask = 0;
1192			break;
1193		}
1194
1195		nsindex = to_namespace_index(ndd, ndd->ns_current);
1196		if (nsindex == NULL)
1197			loop_bitmask |= 1;
1198		else {
1199			/* check whether existing labels are v1.1 or v1.2 */
1200			if (__le16_to_cpu(nsindex->major) == 1
1201					&& __le16_to_cpu(nsindex->minor) == 1)
1202				loop_bitmask |= 2;
1203			else
1204				loop_bitmask |= 4;
1205		}
1206	}
1207	/*
1208	 * If nsindex is null loop_bitmask's bit 0 will be set, and if an index
1209	 * block is found, a v1.1 label for any mapping will set bit 1, and a
1210	 * v1.2 label will set bit 2.
1211	 *
1212	 * At the end of the loop, at most one of the three bits must be set.
1213	 * If multiple bits were set, it means the different mappings disagree
1214	 * about their labels, and this must be cleaned up first.
1215	 *
1216	 * If all the label index blocks are found to agree, nsindex of NULL
1217	 * implies labels haven't been initialized yet, and when they will,
1218	 * they will be of the 1.2 format, so we can assume BTT2.0
1219	 *
1220	 * If 1.1 labels are found, we enforce BTT1.1, and if 1.2 labels are
1221	 * found, we enforce BTT2.0
1222	 *
1223	 * If the loop was never entered, default to BTT1.1 (legacy namespaces)
1224	 */
1225	switch (loop_bitmask) {
1226	case 0:
1227	case 2:
1228		return NVDIMM_CCLASS_BTT;
1229	case 1:
1230	case 4:
1231		return NVDIMM_CCLASS_BTT2;
1232	default:
1233		return -ENXIO;
1234	}
1235}
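
/*
 * Summary of the cases above: loop_bitmask 0 or 2 (no labels, or v1.1
 * labels) selects BTT1.1; 1 or 4 (uninitialized label index blocks, or
 * v1.2 labels) selects BTT2.0; any other combination means the
 * mappings disagree and -ENXIO is returned.
 */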
1236
1237static ssize_t holder_show(struct device *dev,
1238		struct device_attribute *attr, char *buf)
1239{
1240	struct nd_namespace_common *ndns = to_ndns(dev);
1241	ssize_t rc;
1242
1243	device_lock(dev);
1244	rc = sprintf(buf, "%s\n", ndns->claim ? dev_name(ndns->claim) : "");
1245	device_unlock(dev);
1246
1247	return rc;
1248}
1249static DEVICE_ATTR_RO(holder);
1250
1251static int __holder_class_store(struct device *dev, const char *buf)
1252{
1253	struct nd_namespace_common *ndns = to_ndns(dev);
1254
1255	if (dev->driver || ndns->claim)
1256		return -EBUSY;
1257
1258	if (sysfs_streq(buf, "btt")) {
1259		int rc = btt_claim_class(dev);
1260
1261		if (rc < NVDIMM_CCLASS_NONE)
1262			return rc;
1263		ndns->claim_class = rc;
1264	} else if (sysfs_streq(buf, "pfn"))
1265		ndns->claim_class = NVDIMM_CCLASS_PFN;
1266	else if (sysfs_streq(buf, "dax"))
1267		ndns->claim_class = NVDIMM_CCLASS_DAX;
1268	else if (sysfs_streq(buf, ""))
1269		ndns->claim_class = NVDIMM_CCLASS_NONE;
1270	else
1271		return -EINVAL;
1272
1273	return 0;
1274}
1275
1276static ssize_t holder_class_store(struct device *dev,
1277		struct device_attribute *attr, const char *buf, size_t len)
1278{
1279	struct nd_region *nd_region = to_nd_region(dev->parent);
1280	int rc;
1281
1282	device_lock(dev);
1283	nvdimm_bus_lock(dev);
1284	wait_nvdimm_bus_probe_idle(dev);
1285	rc = __holder_class_store(dev, buf);
1286	if (rc >= 0)
1287		rc = nd_namespace_label_update(nd_region, dev);
1288	dev_dbg(dev, "%s(%d)\n", rc < 0 ? "fail " : "", rc);
1289	nvdimm_bus_unlock(dev);
1290	device_unlock(dev);
1291
1292	return rc < 0 ? rc : len;
1293}
1294
1295static ssize_t holder_class_show(struct device *dev,
1296		struct device_attribute *attr, char *buf)
1297{
1298	struct nd_namespace_common *ndns = to_ndns(dev);
1299	ssize_t rc;
1300
1301	device_lock(dev);
1302	if (ndns->claim_class == NVDIMM_CCLASS_NONE)
1303		rc = sprintf(buf, "\n");
1304	else if ((ndns->claim_class == NVDIMM_CCLASS_BTT) ||
1305			(ndns->claim_class == NVDIMM_CCLASS_BTT2))
1306		rc = sprintf(buf, "btt\n");
1307	else if (ndns->claim_class == NVDIMM_CCLASS_PFN)
1308		rc = sprintf(buf, "pfn\n");
1309	else if (ndns->claim_class == NVDIMM_CCLASS_DAX)
1310		rc = sprintf(buf, "dax\n");
1311	else
1312		rc = sprintf(buf, "<unknown>\n");
1313	device_unlock(dev);
1314
1315	return rc;
1316}
1317static DEVICE_ATTR_RW(holder_class);
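
/*
 * Example usage (hypothetical device path): the claim class is chosen
 * before a claiming device attaches, e.g.
 *
 *	echo btt > /sys/bus/nd/devices/namespace0.0/holder_class
 *
 * Reads report "btt" for either BTT class; the v1.1 vs v2.0 format
 * choice made by btt_claim_class() stays internal.
 */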
1318
1319static ssize_t mode_show(struct device *dev,
1320		struct device_attribute *attr, char *buf)
1321{
1322	struct nd_namespace_common *ndns = to_ndns(dev);
1323	struct device *claim;
1324	char *mode;
1325	ssize_t rc;
1326
1327	device_lock(dev);
1328	claim = ndns->claim;
1329	if (claim && is_nd_btt(claim))
1330		mode = "safe";
1331	else if (claim && is_nd_pfn(claim))
1332		mode = "memory";
1333	else if (claim && is_nd_dax(claim))
1334		mode = "dax";
1335	else if (!claim && pmem_should_map_pages(dev))
1336		mode = "memory";
1337	else
1338		mode = "raw";
1339	rc = sprintf(buf, "%s\n", mode);
1340	device_unlock(dev);
1341
1342	return rc;
1343}
1344static DEVICE_ATTR_RO(mode);
1345
1346static ssize_t force_raw_store(struct device *dev,
1347		struct device_attribute *attr, const char *buf, size_t len)
1348{
1349	bool force_raw;
1350	int rc = kstrtobool(buf, &force_raw);
1351
1352	if (rc)
1353		return rc;
1354
1355	to_ndns(dev)->force_raw = force_raw;
1356	return len;
1357}
1358
1359static ssize_t force_raw_show(struct device *dev,
1360		struct device_attribute *attr, char *buf)
1361{
1362	return sprintf(buf, "%d\n", to_ndns(dev)->force_raw);
1363}
1364static DEVICE_ATTR_RW(force_raw);
1365
1366static struct attribute *nd_namespace_attributes[] = {
1367	&dev_attr_nstype.attr,
1368	&dev_attr_size.attr,
1369	&dev_attr_mode.attr,
1370	&dev_attr_uuid.attr,
1371	&dev_attr_holder.attr,
1372	&dev_attr_resource.attr,
1373	&dev_attr_alt_name.attr,
1374	&dev_attr_force_raw.attr,
1375	&dev_attr_sector_size.attr,
1376	&dev_attr_dpa_extents.attr,
1377	&dev_attr_holder_class.attr,
1378	NULL,
1379};
1380
1381static umode_t namespace_visible(struct kobject *kobj,
1382		struct attribute *a, int n)
1383{
1384	struct device *dev = container_of(kobj, struct device, kobj);
1385
1386	if (is_namespace_pmem(dev)) {
1387		if (a == &dev_attr_size.attr)
1388			return 0644;
1389
1390		return a->mode;
1391	}
1392
1393	/* base is_namespace_io() attributes */
1394	if (a == &dev_attr_nstype.attr || a == &dev_attr_size.attr ||
1395	    a == &dev_attr_holder.attr || a == &dev_attr_holder_class.attr ||
1396	    a == &dev_attr_force_raw.attr || a == &dev_attr_mode.attr ||
1397	    a == &dev_attr_resource.attr)
1398		return a->mode;
1399
1400	return 0;
1401}
1402
1403static struct attribute_group nd_namespace_attribute_group = {
1404	.attrs = nd_namespace_attributes,
1405	.is_visible = namespace_visible,
1406};
1407
1408static const struct attribute_group *nd_namespace_attribute_groups[] = {
1409	&nd_device_attribute_group,
1410	&nd_namespace_attribute_group,
1411	&nd_numa_attribute_group,
1412	NULL,
1413};
1414
1415static const struct device_type namespace_io_device_type = {
1416	.name = "nd_namespace_io",
1417	.release = namespace_io_release,
1418	.groups = nd_namespace_attribute_groups,
1419};
1420
1421static const struct device_type namespace_pmem_device_type = {
1422	.name = "nd_namespace_pmem",
1423	.release = namespace_pmem_release,
1424	.groups = nd_namespace_attribute_groups,
1425};
1426
1427static bool is_namespace_pmem(const struct device *dev)
1428{
1429	return dev ? dev->type == &namespace_pmem_device_type : false;
1430}
1431
1432static bool is_namespace_io(const struct device *dev)
1433{
1434	return dev ? dev->type == &namespace_io_device_type : false;
1435}
1436
1437struct nd_namespace_common *nvdimm_namespace_common_probe(struct device *dev)
1438{
1439	struct nd_btt *nd_btt = is_nd_btt(dev) ? to_nd_btt(dev) : NULL;
1440	struct nd_pfn *nd_pfn = is_nd_pfn(dev) ? to_nd_pfn(dev) : NULL;
1441	struct nd_dax *nd_dax = is_nd_dax(dev) ? to_nd_dax(dev) : NULL;
1442	struct nd_namespace_common *ndns = NULL;
1443	resource_size_t size;
1444
1445	if (nd_btt || nd_pfn || nd_dax) {
1446		if (nd_btt)
1447			ndns = nd_btt->ndns;
1448		else if (nd_pfn)
1449			ndns = nd_pfn->ndns;
1450		else if (nd_dax)
1451			ndns = nd_dax->nd_pfn.ndns;
1452
1453		if (!ndns)
1454			return ERR_PTR(-ENODEV);
1455
1456		/*
1457		 * Flush any in-progress probes / removals in the driver
1458		 * for the raw personality of this namespace.
1459		 */
1460		device_lock(&ndns->dev);
1461		device_unlock(&ndns->dev);
1462		if (ndns->dev.driver) {
1463			dev_dbg(&ndns->dev, "is active, can't bind %s\n",
1464					dev_name(dev));
1465			return ERR_PTR(-EBUSY);
1466		}
1467		if (dev_WARN_ONCE(&ndns->dev, ndns->claim != dev,
1468					"host (%s) vs claim (%s) mismatch\n",
1469					dev_name(dev),
1470					dev_name(ndns->claim)))
1471			return ERR_PTR(-ENXIO);
1472	} else {
1473		ndns = to_ndns(dev);
1474		if (ndns->claim) {
1475			dev_dbg(dev, "claimed by %s, failing probe\n",
1476				dev_name(ndns->claim));
1477
1478			return ERR_PTR(-ENXIO);
1479		}
1480	}
1481
1482	if (nvdimm_namespace_locked(ndns))
1483		return ERR_PTR(-EACCES);
1484
1485	size = nvdimm_namespace_capacity(ndns);
1486	if (size < ND_MIN_NAMESPACE_SIZE) {
1487		dev_dbg(&ndns->dev, "%pa, too small must be at least %#x\n",
1488				&size, ND_MIN_NAMESPACE_SIZE);
1489		return ERR_PTR(-ENODEV);
1490	}
1491
1492	/*
1493	 * Note, alignment validation for fsdax and devdax mode
1494	 * namespaces happens in nd_pfn_validate() where infoblock
1495	 * padding parameters can be applied.
1496	 */
1497	if (pmem_should_map_pages(dev)) {
1498		struct nd_namespace_io *nsio = to_nd_namespace_io(&ndns->dev);
1499		struct resource *res = &nsio->res;
1500
1501		if (!IS_ALIGNED(res->start | (res->end + 1),
1502					memremap_compat_align())) {
1503			dev_err(&ndns->dev, "%pr misaligned, unable to map\n", res);
1504			return ERR_PTR(-EOPNOTSUPP);
1505		}
1506	}
1507
1508	if (is_namespace_pmem(&ndns->dev)) {
1509		struct nd_namespace_pmem *nspm;
1510
1511		nspm = to_nd_namespace_pmem(&ndns->dev);
1512		if (uuid_not_set(nspm->uuid, &ndns->dev, __func__))
1513			return ERR_PTR(-ENODEV);
1514	}
1515
1516	return ndns;
1517}
1518EXPORT_SYMBOL(nvdimm_namespace_common_probe);
1519
1520int devm_namespace_enable(struct device *dev, struct nd_namespace_common *ndns,
1521		resource_size_t size)
1522{
1523	return devm_nsio_enable(dev, to_nd_namespace_io(&ndns->dev), size);
1524}
1525EXPORT_SYMBOL_GPL(devm_namespace_enable);
1526
1527void devm_namespace_disable(struct device *dev, struct nd_namespace_common *ndns)
1528{
1529	devm_nsio_disable(dev, to_nd_namespace_io(&ndns->dev));
1530}
1531EXPORT_SYMBOL_GPL(devm_namespace_disable);
1532
1533static struct device **create_namespace_io(struct nd_region *nd_region)
1534{
1535	struct nd_namespace_io *nsio;
1536	struct device *dev, **devs;
1537	struct resource *res;
1538
1539	nsio = kzalloc(sizeof(*nsio), GFP_KERNEL);
1540	if (!nsio)
1541		return NULL;
1542
1543	devs = kcalloc(2, sizeof(struct device *), GFP_KERNEL);
1544	if (!devs) {
1545		kfree(nsio);
1546		return NULL;
1547	}
1548
1549	dev = &nsio->common.dev;
1550	dev->type = &namespace_io_device_type;
1551	dev->parent = &nd_region->dev;
1552	res = &nsio->res;
1553	res->name = dev_name(&nd_region->dev);
1554	res->flags = IORESOURCE_MEM;
1555	res->start = nd_region->ndr_start;
1556	res->end = res->start + nd_region->ndr_size - 1;
1557
1558	devs[0] = dev;
1559	return devs;
1560}
1561
1562static bool has_uuid_at_pos(struct nd_region *nd_region, const uuid_t *uuid,
1563			    u64 cookie, u16 pos)
1564{
1565	struct nd_namespace_label *found = NULL;
1566	int i;
1567
1568	for (i = 0; i < nd_region->ndr_mappings; i++) {
1569		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1570		struct nd_interleave_set *nd_set = nd_region->nd_set;
1571		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1572		struct nd_label_ent *label_ent;
1573		bool found_uuid = false;
1574
1575		list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1576			struct nd_namespace_label *nd_label = label_ent->label;
1577			u16 position;
1578
1579			if (!nd_label)
1580				continue;
1581			position = nsl_get_position(ndd, nd_label);
1582
1583			if (!nsl_validate_isetcookie(ndd, nd_label, cookie))
1584				continue;
1585
1586			if (!nsl_uuid_equal(ndd, nd_label, uuid))
1587				continue;
1588
1589			if (!nsl_validate_type_guid(ndd, nd_label,
1590						    &nd_set->type_guid))
1591				continue;
1592
1593			if (found_uuid) {
1594				dev_dbg(ndd->dev, "duplicate entry for uuid\n");
1595				return false;
1596			}
1597			found_uuid = true;
1598			if (!nsl_validate_nlabel(nd_region, ndd, nd_label))
1599				continue;
1600			if (position != pos)
1601				continue;
1602			found = nd_label;
1603			break;
1604		}
1605		if (found)
1606			break;
1607	}
1608	return found != NULL;
1609}
1610
1611static int select_pmem_id(struct nd_region *nd_region, const uuid_t *pmem_id)
1612{
1613	int i;
1614

	if (!pmem_id)
		return -ENODEV;
1615	for (i = 0; i < nd_region->ndr_mappings; i++) {
1616		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1617		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1618		struct nd_namespace_label *nd_label = NULL;
1619		u64 hw_start, hw_end, pmem_start, pmem_end;
1620		struct nd_label_ent *label_ent;
1621
1622		lockdep_assert_held(&nd_mapping->lock);
1623		list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1624			nd_label = label_ent->label;
1625			if (!nd_label)
1626				continue;
1627			if (nsl_uuid_equal(ndd, nd_label, pmem_id))
1628				break;
1629			nd_label = NULL;
1630		}
1631
1632		if (!nd_label) {
1633			WARN_ON(1);
1634			return -EINVAL;
1635		}
1636
1637		/*
1638		 * Check that this label is compliant with the dpa
1639		 * range published in NFIT
1640		 */
1641		hw_start = nd_mapping->start;
1642		hw_end = hw_start + nd_mapping->size;
1643		pmem_start = nsl_get_dpa(ndd, nd_label);
1644		pmem_end = pmem_start + nsl_get_rawsize(ndd, nd_label);
1645		if (pmem_start >= hw_start && pmem_start < hw_end
1646				&& pmem_end <= hw_end && pmem_end > hw_start)
1647			/* pass */;
1648		else {
1649			dev_dbg(&nd_region->dev, "%s invalid label for %pUb\n",
1650				dev_name(ndd->dev),
1651				nsl_uuid_raw(ndd, nd_label));
1652			return -EINVAL;
1653		}
1654
1655		/* move recently validated label to the front of the list */
1656		list_move(&label_ent->list, &nd_mapping->labels);
1657	}
1658	return 0;
1659}
1660
1661/**
1662 * create_namespace_pmem - validate interleave set labelling, retrieve label0
1663 * @nd_region: region with mappings to validate
1664 * @nd_mapping: container of dpa-resource-root + labels
1665 * @nd_label: target pmem namespace label to evaluate
1666 *
1667 * Returns: the created &struct device on success or ERR_PTR(-errno) on error
1668 */
1669static struct device *create_namespace_pmem(struct nd_region *nd_region,
1670					    struct nd_mapping *nd_mapping,
1671					    struct nd_namespace_label *nd_label)
1672{
1673	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1674	struct nd_namespace_index *nsindex =
1675		to_namespace_index(ndd, ndd->ns_current);
1676	u64 cookie = nd_region_interleave_set_cookie(nd_region, nsindex);
1677	u64 altcookie = nd_region_interleave_set_altcookie(nd_region);
1678	struct nd_label_ent *label_ent;
1679	struct nd_namespace_pmem *nspm;
1680	resource_size_t size = 0;
1681	struct resource *res;
1682	struct device *dev;
1683	uuid_t uuid;
1684	int rc = 0;
1685	u16 i;
1686
1687	if (cookie == 0) {
1688		dev_dbg(&nd_region->dev, "invalid interleave-set-cookie\n");
1689		return ERR_PTR(-ENXIO);
1690	}
1691
1692	if (!nsl_validate_isetcookie(ndd, nd_label, cookie)) {
1693		dev_dbg(&nd_region->dev, "invalid cookie in label: %pUb\n",
1694			nsl_uuid_raw(ndd, nd_label));
1695		if (!nsl_validate_isetcookie(ndd, nd_label, altcookie))
1696			return ERR_PTR(-EAGAIN);
1697
1698		dev_dbg(&nd_region->dev, "valid altcookie in label: %pUb\n",
1699			nsl_uuid_raw(ndd, nd_label));
1700	}
1701
1702	nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
1703	if (!nspm)
1704		return ERR_PTR(-ENOMEM);
1705
1706	nspm->id = -1;
1707	dev = &nspm->nsio.common.dev;
1708	dev->type = &namespace_pmem_device_type;
1709	dev->parent = &nd_region->dev;
1710	res = &nspm->nsio.res;
1711	res->name = dev_name(&nd_region->dev);
1712	res->flags = IORESOURCE_MEM;
1713
1714	for (i = 0; i < nd_region->ndr_mappings; i++) {
1715		nsl_get_uuid(ndd, nd_label, &uuid);
1716		if (has_uuid_at_pos(nd_region, &uuid, cookie, i))
1717			continue;
1718		if (has_uuid_at_pos(nd_region, &uuid, altcookie, i))
1719			continue;
1720		break;
1721	}
1722
1723	if (i < nd_region->ndr_mappings) {
1724		struct nvdimm *nvdimm = nd_region->mapping[i].nvdimm;
1725
1726		/*
1727		 * Give up if we don't find an instance of a uuid at each
1728		 * position (from 0 to nd_region->ndr_mappings - 1), or if we
1729		 * find a dimm with two instances of the same uuid.
1730		 */
1731		dev_err(&nd_region->dev, "%s missing label for %pUb\n",
1732			nvdimm_name(nvdimm), nsl_uuid_raw(ndd, nd_label));
1733		rc = -EINVAL;
1734		goto err;
1735	}
1736
1737	/*
1738	 * Fix up each mapping's 'labels' to have the validated pmem label for
1739	 * that position at labels[0], and NULL at labels[1].  In the process,
1740	 * check that the namespace aligns with interleave-set.
1741	 */
1742	nsl_get_uuid(ndd, nd_label, &uuid);
1743	rc = select_pmem_id(nd_region, &uuid);
1744	if (rc)
1745		goto err;
1746
1747	/* Calculate total size and populate namespace properties from label0 */
1748	for (i = 0; i < nd_region->ndr_mappings; i++) {
1749		struct nd_namespace_label *label0;
1750		struct nvdimm_drvdata *ndd;
1751
1752		nd_mapping = &nd_region->mapping[i];
1753		label_ent = list_first_entry_or_null(&nd_mapping->labels,
1754				typeof(*label_ent), list);
1755		label0 = label_ent ? label_ent->label : NULL;
1756
1757		if (!label0) {
1758			WARN_ON(1);
1759			continue;
1760		}
1761
1762		ndd = to_ndd(nd_mapping);
1763		size += nsl_get_rawsize(ndd, label0);
1764		if (nsl_get_position(ndd, label0) != 0)
1765			continue;
1766		WARN_ON(nspm->alt_name || nspm->uuid);
1767		nspm->alt_name = kmemdup(nsl_ref_name(ndd, label0),
1768					 NSLABEL_NAME_LEN, GFP_KERNEL);
1769		nsl_get_uuid(ndd, label0, &uuid);
1770		nspm->uuid = kmemdup(&uuid, sizeof(uuid_t), GFP_KERNEL);
1771		nspm->lbasize = nsl_get_lbasize(ndd, label0);
1772		nspm->nsio.common.claim_class =
1773			nsl_get_claim_class(ndd, label0);
1774	}
1775
1776	if (!nspm->alt_name || !nspm->uuid) {
1777		rc = -ENOMEM;
1778		goto err;
1779	}
1780
1781	nd_namespace_pmem_set_resource(nd_region, nspm, size);
1782
1783	return dev;
1784 err:
1785	namespace_pmem_release(dev);
1786	switch (rc) {
1787	case -EINVAL:
1788		dev_dbg(&nd_region->dev, "invalid label(s)\n");
1789		break;
	case -ENODEV:
		dev_dbg(&nd_region->dev, "label not found\n");
		break;
1790	default:
1791		dev_dbg(&nd_region->dev, "unexpected err: %d\n", rc);
1792		break;
1793	}
1794	return ERR_PTR(rc);
1795}
1796
1797static struct device *nd_namespace_pmem_create(struct nd_region *nd_region)
1798{
1799	struct nd_namespace_pmem *nspm;
1800	struct resource *res;
1801	struct device *dev;
1802
1803	if (!is_memory(&nd_region->dev))
1804		return NULL;
1805
1806	nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
1807	if (!nspm)
1808		return NULL;
1809
1810	dev = &nspm->nsio.common.dev;
1811	dev->type = &namespace_pmem_device_type;
1812	dev->parent = &nd_region->dev;
1813	res = &nspm->nsio.res;
1814	res->name = dev_name(&nd_region->dev);
1815	res->flags = IORESOURCE_MEM;
1816
1817	nspm->id = ida_alloc(&nd_region->ns_ida, GFP_KERNEL);
1818	if (nspm->id < 0) {
1819		kfree(nspm);
1820		return NULL;
1821	}
1822	dev_set_name(dev, "namespace%d.%d", nd_region->id, nspm->id);
1823	nd_namespace_pmem_set_resource(nd_region, nspm, 0);
1824
1825	return dev;
1826}
1827
1828static struct lock_class_key nvdimm_namespace_key;
1829
1830void nd_region_create_ns_seed(struct nd_region *nd_region)
1831{
1832	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1833
1834	if (nd_region_to_nstype(nd_region) == ND_DEVICE_NAMESPACE_IO)
1835		return;
1836
1837	nd_region->ns_seed = nd_namespace_pmem_create(nd_region);
1838
1839	/*
1840	 * Seed creation failures are not fatal; provisioning is simply
1841	 * disabled until memory becomes available
1842	 */
1843	if (!nd_region->ns_seed)
1844		dev_err(&nd_region->dev, "failed to create namespace\n");
1845	else {
1846		device_initialize(nd_region->ns_seed);
1847		lockdep_set_class(&nd_region->ns_seed->mutex,
1848				  &nvdimm_namespace_key);
1849		nd_device_register(nd_region->ns_seed);
1850	}
1851}
1852
1853void nd_region_create_dax_seed(struct nd_region *nd_region)
1854{
1855	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1856	nd_region->dax_seed = nd_dax_create(nd_region);
1857	/*
1858	 * Seed creation failures are not fatal; provisioning is simply
1859	 * disabled until memory becomes available
1860	 */
1861	if (!nd_region->dax_seed)
1862		dev_err(&nd_region->dev, "failed to create dax namespace\n");
1863}
1864
1865void nd_region_create_pfn_seed(struct nd_region *nd_region)
1866{
1867	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1868	nd_region->pfn_seed = nd_pfn_create(nd_region);
1869	/*
1870	 * Seed creation failures are not fatal; provisioning is simply
1871	 * disabled until memory becomes available
1872	 */
1873	if (!nd_region->pfn_seed)
1874		dev_err(&nd_region->dev, "failed to create pfn namespace\n");
1875}
1876
1877void nd_region_create_btt_seed(struct nd_region *nd_region)
1878{
1879	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1880	nd_region->btt_seed = nd_btt_create(nd_region);
1881	/*
1882	 * Seed creation failures are not fatal; provisioning is simply
1883	 * disabled until memory becomes available
1884	 */
1885	if (!nd_region->btt_seed)
1886		dev_err(&nd_region->dev, "failed to create btt namespace\n");
1887}

static int add_namespace_resource(struct nd_region *nd_region,
		struct nd_namespace_label *nd_label, struct device **devs,
		int count)
{
	struct nd_mapping *nd_mapping = &nd_region->mapping[0];
	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
	int i;

	for (i = 0; i < count; i++) {
		uuid_t *uuid = namespace_to_uuid(devs[i]);

		if (IS_ERR(uuid)) {
			WARN_ON(1);
			continue;
		}

		if (!nsl_uuid_equal(ndd, nd_label, uuid))
			continue;
		dev_err(&nd_region->dev,
			"error: conflicting extents for uuid: %pUb\n", uuid);
		return -ENXIO;
	}

	return i;
}

static int cmp_dpa(const void *a, const void *b)
{
	const struct device *dev_a = *(const struct device **) a;
	const struct device *dev_b = *(const struct device **) b;
	struct nd_namespace_pmem *nspm_a, *nspm_b;

	if (is_namespace_io(dev_a))
		return 0;

	nspm_a = to_nd_namespace_pmem(dev_a);
	nspm_b = to_nd_namespace_pmem(dev_b);

	return memcmp(&nspm_a->nsio.res.start, &nspm_b->nsio.res.start,
			sizeof(resource_size_t));
}
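
/*
 * Note: the memcmp() above compares the raw bytes of two
 * resource_size_t values, so the resulting order is numeric only on
 * big-endian hosts; on little-endian it is still a stable, consistent
 * ordering, which appears to be all the sort in scan_labels() needs.
 */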

static struct device **scan_labels(struct nd_region *nd_region)
{
	int i, count = 0;
	struct device *dev, **devs;
	struct nd_label_ent *label_ent, *e;
	struct nd_mapping *nd_mapping = &nd_region->mapping[0];
	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
	resource_size_t map_end = nd_mapping->start + nd_mapping->size - 1;

	devs = kcalloc(2, sizeof(dev), GFP_KERNEL);
	if (!devs)
		return NULL;

	/* "safe" because create_namespace_pmem() might list_move() label_ent */
	list_for_each_entry_safe(label_ent, e, &nd_mapping->labels, list) {
		struct nd_namespace_label *nd_label = label_ent->label;
		struct device **__devs;

		if (!nd_label)
			continue;

		/* skip labels that describe extents outside of the region */
		if (nsl_get_dpa(ndd, nd_label) < nd_mapping->start ||
		    nsl_get_dpa(ndd, nd_label) > map_end)
			continue;

		i = add_namespace_resource(nd_region, nd_label, devs, count);
		if (i < 0)
			goto err;
		if (i < count)
			continue;
		if (count) {
			__devs = kcalloc(count + 2, sizeof(dev), GFP_KERNEL);
			if (!__devs)
				goto err;
			memcpy(__devs, devs, sizeof(dev) * count);
			kfree(devs);
			devs = __devs;
		}

		dev = create_namespace_pmem(nd_region, nd_mapping, nd_label);
		if (IS_ERR(dev)) {
			switch (PTR_ERR(dev)) {
			case -EAGAIN:
				/* skip invalid labels */
				continue;
			default:
				goto err;
			}
		} else
			devs[count++] = dev;

	}

	dev_dbg(&nd_region->dev, "discovered %d namespace%s\n", count,
		count == 1 ? "" : "s");

	if (count == 0) {
		struct nd_namespace_pmem *nspm;

		/* Publish a zero-sized namespace for userspace to configure. */
		nd_mapping_free_labels(nd_mapping);
		nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
		if (!nspm)
			goto err;
		dev = &nspm->nsio.common.dev;
		dev->type = &namespace_pmem_device_type;
		nd_namespace_pmem_set_resource(nd_region, nspm, 0);
		dev->parent = &nd_region->dev;
		devs[count++] = dev;
	} else if (is_memory(&nd_region->dev)) {
		/* clean unselected labels */
		for (i = 0; i < nd_region->ndr_mappings; i++) {
			struct list_head *l, *e;
			LIST_HEAD(list);
			int j;

			nd_mapping = &nd_region->mapping[i];
			if (list_empty(&nd_mapping->labels)) {
				WARN_ON(1);
				continue;
			}

			j = count;
			list_for_each_safe(l, e, &nd_mapping->labels) {
				if (!j--)
					break;
				list_move_tail(l, &list);
			}
			nd_mapping_free_labels(nd_mapping);
			list_splice_init(&list, &nd_mapping->labels);
		}
	}

	if (count > 1)
		sort(devs, count, sizeof(struct device *), cmp_dpa, NULL);

	return devs;

 err:
	for (i = 0; devs[i]; i++)
		namespace_pmem_release(devs[i]);
	kfree(devs);

	return NULL;
}
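
/*
 * The shape of scan_labels()'s NULL-terminated result, as a sketch:
 *
 *	labels found:	{ ns, ns, ..., NULL }	ordered by cmp_dpa()
 *	no labels:	{ zero-sized seed namespace, NULL }
 *	error:		NULL, with any partially created namespaces released
 */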

static struct device **create_namespaces(struct nd_region *nd_region)
{
	struct nd_mapping *nd_mapping;
	struct device **devs;
	int i;

	if (nd_region->ndr_mappings == 0)
		return NULL;

	/* lock down all mappings while we scan labels */
	for (i = 0; i < nd_region->ndr_mappings; i++) {
		nd_mapping = &nd_region->mapping[i];
		mutex_lock_nested(&nd_mapping->lock, i);
	}

	devs = scan_labels(nd_region);

	for (i = 0; i < nd_region->ndr_mappings; i++) {
		int reverse = nd_region->ndr_mappings - 1 - i;

		nd_mapping = &nd_region->mapping[reverse];
		mutex_unlock(&nd_mapping->lock);
	}

	return devs;
}
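
/*
 * The mapping locks are taken in index order with distinct lockdep
 * subclasses via mutex_lock_nested(..., i) and released in reverse,
 * so holding mapping[0].lock while acquiring mapping[1].lock does not
 * trigger a false lockdep report for these same-class mutexes.
 */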

static void deactivate_labels(void *region)
{
	struct nd_region *nd_region = region;
	int i;

	for (i = 0; i < nd_region->ndr_mappings; i++) {
		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
		struct nvdimm_drvdata *ndd = nd_mapping->ndd;
		struct nvdimm *nvdimm = nd_mapping->nvdimm;

		mutex_lock(&nd_mapping->lock);
		nd_mapping_free_labels(nd_mapping);
		mutex_unlock(&nd_mapping->lock);

		put_ndd(ndd);
		nd_mapping->ndd = NULL;
		if (ndd)
			atomic_dec(&nvdimm->busy);
	}
}
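
/*
 * The ndd check above is what keeps the busy count balanced:
 * nd_mapping->ndd is only non-NULL for mappings that
 * init_active_labels() fully activated, so nvdimm->busy is
 * decremented exactly once per successful activation.
 */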

static int init_active_labels(struct nd_region *nd_region)
{
	int i, rc = 0;

	for (i = 0; i < nd_region->ndr_mappings; i++) {
		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
		struct nvdimm *nvdimm = nd_mapping->nvdimm;
		struct nd_label_ent *label_ent;
		int count, j;

		/*
		 * If the dimm is disabled then we may need to prevent
		 * the region from being activated.
		 */
		if (!ndd) {
			if (test_bit(NDD_LOCKED, &nvdimm->flags))
				/* fail, label data may be unreadable */;
			else if (test_bit(NDD_LABELING, &nvdimm->flags))
				/* fail, labels needed to disambiguate dpa */;
			else
				continue;

			dev_err(&nd_region->dev, "%s: is %s, failing probe\n",
					dev_name(&nd_mapping->nvdimm->dev),
					test_bit(NDD_LOCKED, &nvdimm->flags)
					? "locked" : "disabled");
			rc = -ENXIO;
			goto out;
		}
		nd_mapping->ndd = ndd;
		atomic_inc(&nvdimm->busy);
		get_ndd(ndd);

		count = nd_label_active_count(ndd);
		dev_dbg(ndd->dev, "count: %d\n", count);
		if (!count)
			continue;
		for (j = 0; j < count; j++) {
			struct nd_namespace_label *label;

			label_ent = kzalloc(sizeof(*label_ent), GFP_KERNEL);
			if (!label_ent)
				break;
			label = nd_label_active(ndd, j);
			label_ent->label = label;

			mutex_lock(&nd_mapping->lock);
			list_add_tail(&label_ent->list, &nd_mapping->labels);
			mutex_unlock(&nd_mapping->lock);
		}

		if (j < count)
			break;
	}

	if (i < nd_region->ndr_mappings)
		rc = -ENOMEM;

out:
	if (rc) {
		deactivate_labels(nd_region);
		return rc;
	}

	return devm_add_action_or_reset(&nd_region->dev, deactivate_labels,
					nd_region);
}
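
/*
 * Registering deactivate_labels() with devm_add_action_or_reset()
 * ties label teardown to the region device: the action runs on driver
 * unbind, and if registration itself fails the action is invoked
 * immediately.  A hypothetical driver-local sketch of the pattern:
 *
 *	rc = devm_add_action_or_reset(dev, cleanup_fn, ctx);
 *	if (rc)
 *		return rc;	(cleanup_fn(ctx) has already run)
 */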

int nd_region_register_namespaces(struct nd_region *nd_region, int *err)
{
	struct device **devs = NULL;
	int i, rc = 0, type;

	*err = 0;
	nvdimm_bus_lock(&nd_region->dev);
	rc = init_active_labels(nd_region);
	if (rc) {
		nvdimm_bus_unlock(&nd_region->dev);
		return rc;
	}

	type = nd_region_to_nstype(nd_region);
	switch (type) {
	case ND_DEVICE_NAMESPACE_IO:
		devs = create_namespace_io(nd_region);
		break;
	case ND_DEVICE_NAMESPACE_PMEM:
		devs = create_namespaces(nd_region);
		break;
	default:
		break;
	}
	nvdimm_bus_unlock(&nd_region->dev);

	if (!devs)
		return -ENODEV;

	for (i = 0; devs[i]; i++) {
		struct device *dev = devs[i];
		int id;

		if (type == ND_DEVICE_NAMESPACE_PMEM) {
			struct nd_namespace_pmem *nspm;

			nspm = to_nd_namespace_pmem(dev);
			id = ida_alloc(&nd_region->ns_ida, GFP_KERNEL);
			nspm->id = id;
		} else
			id = i;

		if (id < 0)
			break;
		dev_set_name(dev, "namespace%d.%d", nd_region->id, id);
		device_initialize(dev);
		lockdep_set_class(&dev->mutex, &nvdimm_namespace_key);
		nd_device_register(dev);
	}
	if (i)
		nd_region->ns_seed = devs[0];

	if (devs[i]) {
		int j;

		for (j = i; devs[j]; j++) {
			struct device *dev = devs[j];

			device_initialize(dev);
			put_device(dev);
		}
		*err = j - i;
		/*
		 * All of the namespaces we tried to register failed, so
		 * fail region activation.
		 */
		if (*err == 0)
			rc = -ENODEV;
	}
	kfree(devs);

	if (rc == -ENODEV)
		return rc;

	return i;
}
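
/*
 * Contract for the function above: the return value is the number of
 * namespace devices registered and *err the number that failed; for
 * example, registering two namespaces and then failing an ida_alloc()
 * on the third returns 2 with *err set to 1.  A return of -ENODEV
 * means no namespace devices could be produced for the region at all.
 */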
v6.2
   1// SPDX-License-Identifier: GPL-2.0-only
   2/*
   3 * Copyright(c) 2013-2015 Intel Corporation. All rights reserved.
   4 */
 
   5#include <linux/module.h>
   6#include <linux/device.h>
   7#include <linux/sort.h>
   8#include <linux/slab.h>
   9#include <linux/list.h>
  10#include <linux/nd.h>
  11#include "nd-core.h"
  12#include "pmem.h"
  13#include "pfn.h"
  14#include "nd.h"
  15
  16static void namespace_io_release(struct device *dev)
  17{
  18	struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
  19
  20	kfree(nsio);
  21}
  22
  23static void namespace_pmem_release(struct device *dev)
  24{
  25	struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
  26	struct nd_region *nd_region = to_nd_region(dev->parent);
  27
  28	if (nspm->id >= 0)
  29		ida_simple_remove(&nd_region->ns_ida, nspm->id);
  30	kfree(nspm->alt_name);
  31	kfree(nspm->uuid);
  32	kfree(nspm);
  33}
  34
  35static bool is_namespace_pmem(const struct device *dev);
  36static bool is_namespace_io(const struct device *dev);
  37
  38static int is_uuid_busy(struct device *dev, void *data)
  39{
  40	uuid_t *uuid1 = data, *uuid2 = NULL;
  41
  42	if (is_namespace_pmem(dev)) {
  43		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
  44
  45		uuid2 = nspm->uuid;
  46	} else if (is_nd_btt(dev)) {
  47		struct nd_btt *nd_btt = to_nd_btt(dev);
  48
  49		uuid2 = nd_btt->uuid;
  50	} else if (is_nd_pfn(dev)) {
  51		struct nd_pfn *nd_pfn = to_nd_pfn(dev);
  52
  53		uuid2 = nd_pfn->uuid;
  54	}
  55
  56	if (uuid2 && uuid_equal(uuid1, uuid2))
  57		return -EBUSY;
  58
  59	return 0;
  60}
  61
  62static int is_namespace_uuid_busy(struct device *dev, void *data)
  63{
  64	if (is_nd_region(dev))
  65		return device_for_each_child(dev, data, is_uuid_busy);
  66	return 0;
  67}
  68
  69/**
  70 * nd_is_uuid_unique - verify that no other namespace has @uuid
  71 * @dev: any device on a nvdimm_bus
  72 * @uuid: uuid to check
 
 
  73 */
  74bool nd_is_uuid_unique(struct device *dev, uuid_t *uuid)
  75{
  76	struct nvdimm_bus *nvdimm_bus = walk_to_nvdimm_bus(dev);
  77
  78	if (!nvdimm_bus)
  79		return false;
  80	WARN_ON_ONCE(!is_nvdimm_bus_locked(&nvdimm_bus->dev));
  81	if (device_for_each_child(&nvdimm_bus->dev, uuid,
  82				is_namespace_uuid_busy) != 0)
  83		return false;
  84	return true;
  85}
  86
  87bool pmem_should_map_pages(struct device *dev)
  88{
  89	struct nd_region *nd_region = to_nd_region(dev->parent);
  90	struct nd_namespace_common *ndns = to_ndns(dev);
  91	struct nd_namespace_io *nsio;
  92
  93	if (!IS_ENABLED(CONFIG_ZONE_DEVICE))
  94		return false;
  95
  96	if (!test_bit(ND_REGION_PAGEMAP, &nd_region->flags))
  97		return false;
  98
  99	if (is_nd_pfn(dev) || is_nd_btt(dev))
 100		return false;
 101
 102	if (ndns->force_raw)
 103		return false;
 104
 105	nsio = to_nd_namespace_io(dev);
 106	if (region_intersects(nsio->res.start, resource_size(&nsio->res),
 107				IORESOURCE_SYSTEM_RAM,
 108				IORES_DESC_NONE) == REGION_MIXED)
 109		return false;
 110
 111	return ARCH_MEMREMAP_PMEM == MEMREMAP_WB;
 112}
 113EXPORT_SYMBOL(pmem_should_map_pages);
 114
 115unsigned int pmem_sector_size(struct nd_namespace_common *ndns)
 116{
 117	if (is_namespace_pmem(&ndns->dev)) {
 118		struct nd_namespace_pmem *nspm;
 119
 120		nspm = to_nd_namespace_pmem(&ndns->dev);
 121		if (nspm->lbasize == 0 || nspm->lbasize == 512)
 122			/* default */;
 123		else if (nspm->lbasize == 4096)
 124			return 4096;
 125		else
 126			dev_WARN(&ndns->dev, "unsupported sector size: %ld\n",
 127					nspm->lbasize);
 128	}
 129
 130	/*
 131	 * There is no namespace label (is_namespace_io()), or the label
 132	 * indicates the default sector size.
 133	 */
 134	return 512;
 135}
 136EXPORT_SYMBOL(pmem_sector_size);
 137
 138const char *nvdimm_namespace_disk_name(struct nd_namespace_common *ndns,
 139		char *name)
 140{
 141	struct nd_region *nd_region = to_nd_region(ndns->dev.parent);
 142	const char *suffix = NULL;
 143
 144	if (ndns->claim && is_nd_btt(ndns->claim))
 145		suffix = "s";
 146
 147	if (is_namespace_pmem(&ndns->dev) || is_namespace_io(&ndns->dev)) {
 148		int nsidx = 0;
 149
 150		if (is_namespace_pmem(&ndns->dev)) {
 151			struct nd_namespace_pmem *nspm;
 152
 153			nspm = to_nd_namespace_pmem(&ndns->dev);
 154			nsidx = nspm->id;
 155		}
 156
 157		if (nsidx)
 158			sprintf(name, "pmem%d.%d%s", nd_region->id, nsidx,
 159					suffix ? suffix : "");
 160		else
 161			sprintf(name, "pmem%d%s", nd_region->id,
 162					suffix ? suffix : "");
 163	} else {
 164		return NULL;
 165	}
 166
 167	return name;
 168}
 169EXPORT_SYMBOL(nvdimm_namespace_disk_name);
 170
 171const uuid_t *nd_dev_to_uuid(struct device *dev)
 172{
 173	if (dev && is_namespace_pmem(dev)) {
 174		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 175
 176		return nspm->uuid;
 177	}
 178	return &uuid_null;
 179}
 180EXPORT_SYMBOL(nd_dev_to_uuid);
 181
 182static ssize_t nstype_show(struct device *dev,
 183		struct device_attribute *attr, char *buf)
 184{
 185	struct nd_region *nd_region = to_nd_region(dev->parent);
 186
 187	return sprintf(buf, "%d\n", nd_region_to_nstype(nd_region));
 188}
 189static DEVICE_ATTR_RO(nstype);
 190
 191static ssize_t __alt_name_store(struct device *dev, const char *buf,
 192		const size_t len)
 193{
 194	char *input, *pos, *alt_name, **ns_altname;
 195	ssize_t rc;
 196
 197	if (is_namespace_pmem(dev)) {
 198		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 199
 200		ns_altname = &nspm->alt_name;
 201	} else
 202		return -ENXIO;
 203
 204	if (dev->driver || to_ndns(dev)->claim)
 205		return -EBUSY;
 206
 207	input = kstrndup(buf, len, GFP_KERNEL);
 208	if (!input)
 209		return -ENOMEM;
 210
 211	pos = strim(input);
 212	if (strlen(pos) + 1 > NSLABEL_NAME_LEN) {
 213		rc = -EINVAL;
 214		goto out;
 215	}
 216
 217	alt_name = kzalloc(NSLABEL_NAME_LEN, GFP_KERNEL);
 218	if (!alt_name) {
 219		rc = -ENOMEM;
 220		goto out;
 221	}
 222	kfree(*ns_altname);
 223	*ns_altname = alt_name;
 224	sprintf(*ns_altname, "%s", pos);
 225	rc = len;
 226
 227out:
 228	kfree(input);
 229	return rc;
 230}
 231
 232static int nd_namespace_label_update(struct nd_region *nd_region,
 233		struct device *dev)
 234{
 235	dev_WARN_ONCE(dev, dev->driver || to_ndns(dev)->claim,
 236			"namespace must be idle during label update\n");
 237	if (dev->driver || to_ndns(dev)->claim)
 238		return 0;
 239
 240	/*
 241	 * Only allow label writes that will result in a valid namespace
 242	 * or deletion of an existing namespace.
 243	 */
 244	if (is_namespace_pmem(dev)) {
 245		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 246		resource_size_t size = resource_size(&nspm->nsio.res);
 247
 248		if (size == 0 && nspm->uuid)
 249			/* delete allocation */;
 250		else if (!nspm->uuid)
 251			return 0;
 252
 253		return nd_pmem_namespace_label_update(nd_region, nspm, size);
 254	} else
 255		return -ENXIO;
 256}
 257
 258static ssize_t alt_name_store(struct device *dev,
 259		struct device_attribute *attr, const char *buf, size_t len)
 260{
 261	struct nd_region *nd_region = to_nd_region(dev->parent);
 262	ssize_t rc;
 263
 264	device_lock(dev);
 265	nvdimm_bus_lock(dev);
 266	wait_nvdimm_bus_probe_idle(dev);
 267	rc = __alt_name_store(dev, buf, len);
 268	if (rc >= 0)
 269		rc = nd_namespace_label_update(nd_region, dev);
 270	dev_dbg(dev, "%s(%zd)\n", rc < 0 ? "fail " : "", rc);
 271	nvdimm_bus_unlock(dev);
 272	device_unlock(dev);
 273
 274	return rc < 0 ? rc : len;
 275}
 276
 277static ssize_t alt_name_show(struct device *dev,
 278		struct device_attribute *attr, char *buf)
 279{
 280	char *ns_altname;
 281
 282	if (is_namespace_pmem(dev)) {
 283		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 284
 285		ns_altname = nspm->alt_name;
 286	} else
 287		return -ENXIO;
 288
 289	return sprintf(buf, "%s\n", ns_altname ? ns_altname : "");
 290}
 291static DEVICE_ATTR_RW(alt_name);
 292
 293static int scan_free(struct nd_region *nd_region,
 294		struct nd_mapping *nd_mapping, struct nd_label_id *label_id,
 295		resource_size_t n)
 296{
 297	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 298	int rc = 0;
 299
 300	while (n) {
 301		struct resource *res, *last;
 302
 303		last = NULL;
 304		for_each_dpa_resource(ndd, res)
 305			if (strcmp(res->name, label_id->id) == 0)
 306				last = res;
 307		res = last;
 308		if (!res)
 309			return 0;
 310
 311		if (n >= resource_size(res)) {
 312			n -= resource_size(res);
 313			nd_dbg_dpa(nd_region, ndd, res, "delete %d\n", rc);
 314			nvdimm_free_dpa(ndd, res);
 315			/* retry with last resource deleted */
 316			continue;
 317		}
 318
 319		rc = adjust_resource(res, res->start, resource_size(res) - n);
 320		if (rc == 0)
 321			res->flags |= DPA_RESOURCE_ADJUSTED;
 322		nd_dbg_dpa(nd_region, ndd, res, "shrink %d\n", rc);
 323		break;
 324	}
 325
 326	return rc;
 327}
 328
 329/**
 330 * shrink_dpa_allocation - for each dimm in region free n bytes for label_id
 331 * @nd_region: the set of dimms to reclaim @n bytes from
 332 * @label_id: unique identifier for the namespace consuming this dpa range
 333 * @n: number of bytes per-dimm to release
 334 *
 335 * Assumes resources are ordered.  Starting from the end try to
 336 * adjust_resource() the allocation to @n, but if @n is larger than the
 337 * allocation delete it and find the 'new' last allocation in the label
 338 * set.
 
 
 339 */
 340static int shrink_dpa_allocation(struct nd_region *nd_region,
 341		struct nd_label_id *label_id, resource_size_t n)
 342{
 343	int i;
 344
 345	for (i = 0; i < nd_region->ndr_mappings; i++) {
 346		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 347		int rc;
 348
 349		rc = scan_free(nd_region, nd_mapping, label_id, n);
 350		if (rc)
 351			return rc;
 352	}
 353
 354	return 0;
 355}
 356
 357static resource_size_t init_dpa_allocation(struct nd_label_id *label_id,
 358		struct nd_region *nd_region, struct nd_mapping *nd_mapping,
 359		resource_size_t n)
 360{
 361	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 362	struct resource *res;
 363	int rc = 0;
 364
 365	/* first resource allocation for this label-id or dimm */
 366	res = nvdimm_allocate_dpa(ndd, label_id, nd_mapping->start, n);
 367	if (!res)
 368		rc = -EBUSY;
 369
 370	nd_dbg_dpa(nd_region, ndd, res, "init %d\n", rc);
 371	return rc ? n : 0;
 372}
 373
 374
 375/**
 376 * space_valid() - validate free dpa space against constraints
 377 * @nd_region: hosting region of the free space
 378 * @ndd: dimm device data for debug
 379 * @label_id: namespace id to allocate space
 380 * @prev: potential allocation that precedes free space
 381 * @next: allocation that follows the given free space range
 382 * @exist: first allocation with same id in the mapping
 383 * @n: range that must satisfied for pmem allocations
 384 * @valid: free space range to validate
 385 *
 386 * BLK-space is valid as long as it does not precede a PMEM
 387 * allocation in a given region. PMEM-space must be contiguous
 388 * and adjacent to an existing allocation (if one
 389 * exists).  If reserving PMEM any space is valid.
 390 */
 391static void space_valid(struct nd_region *nd_region, struct nvdimm_drvdata *ndd,
 392		struct nd_label_id *label_id, struct resource *prev,
 393		struct resource *next, struct resource *exist,
 394		resource_size_t n, struct resource *valid)
 395{
 396	bool is_reserve = strcmp(label_id->id, "pmem-reserve") == 0;
 397	unsigned long align;
 398
 399	align = nd_region->align / nd_region->ndr_mappings;
 400	valid->start = ALIGN(valid->start, align);
 401	valid->end = ALIGN_DOWN(valid->end + 1, align) - 1;
 402
 403	if (valid->start >= valid->end)
 404		goto invalid;
 405
 406	if (is_reserve)
 407		return;
 408
 409	/* allocation needs to be contiguous, so this is all or nothing */
 410	if (resource_size(valid) < n)
 411		goto invalid;
 412
 413	/* we've got all the space we need and no existing allocation */
 414	if (!exist)
 415		return;
 416
 417	/* allocation needs to be contiguous with the existing namespace */
 418	if (valid->start == exist->end + 1
 419			|| valid->end == exist->start - 1)
 420		return;
 421
 422 invalid:
 423	/* truncate @valid size to 0 */
 424	valid->end = valid->start - 1;
 425}
 426
 427enum alloc_loc {
 428	ALLOC_ERR = 0, ALLOC_BEFORE, ALLOC_MID, ALLOC_AFTER,
 429};
 430
 431static resource_size_t scan_allocate(struct nd_region *nd_region,
 432		struct nd_mapping *nd_mapping, struct nd_label_id *label_id,
 433		resource_size_t n)
 434{
 435	resource_size_t mapping_end = nd_mapping->start + nd_mapping->size - 1;
 436	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 437	struct resource *res, *exist = NULL, valid;
 438	const resource_size_t to_allocate = n;
 439	int first;
 440
 441	for_each_dpa_resource(ndd, res)
 442		if (strcmp(label_id->id, res->name) == 0)
 443			exist = res;
 444
 445	valid.start = nd_mapping->start;
 446	valid.end = mapping_end;
 447	valid.name = "free space";
 448 retry:
 449	first = 0;
 450	for_each_dpa_resource(ndd, res) {
 451		struct resource *next = res->sibling, *new_res = NULL;
 452		resource_size_t allocate, available = 0;
 453		enum alloc_loc loc = ALLOC_ERR;
 454		const char *action;
 455		int rc = 0;
 456
 457		/* ignore resources outside this nd_mapping */
 458		if (res->start > mapping_end)
 459			continue;
 460		if (res->end < nd_mapping->start)
 461			continue;
 462
 463		/* space at the beginning of the mapping */
 464		if (!first++ && res->start > nd_mapping->start) {
 465			valid.start = nd_mapping->start;
 466			valid.end = res->start - 1;
 467			space_valid(nd_region, ndd, label_id, NULL, next, exist,
 468					to_allocate, &valid);
 469			available = resource_size(&valid);
 470			if (available)
 471				loc = ALLOC_BEFORE;
 472		}
 473
 474		/* space between allocations */
 475		if (!loc && next) {
 476			valid.start = res->start + resource_size(res);
 477			valid.end = min(mapping_end, next->start - 1);
 478			space_valid(nd_region, ndd, label_id, res, next, exist,
 479					to_allocate, &valid);
 480			available = resource_size(&valid);
 481			if (available)
 482				loc = ALLOC_MID;
 483		}
 484
 485		/* space at the end of the mapping */
 486		if (!loc && !next) {
 487			valid.start = res->start + resource_size(res);
 488			valid.end = mapping_end;
 489			space_valid(nd_region, ndd, label_id, res, next, exist,
 490					to_allocate, &valid);
 491			available = resource_size(&valid);
 492			if (available)
 493				loc = ALLOC_AFTER;
 494		}
 495
 496		if (!loc || !available)
 497			continue;
 498		allocate = min(available, n);
 499		switch (loc) {
 500		case ALLOC_BEFORE:
 501			if (strcmp(res->name, label_id->id) == 0) {
 502				/* adjust current resource up */
 503				rc = adjust_resource(res, res->start - allocate,
 504						resource_size(res) + allocate);
 505				action = "cur grow up";
 506			} else
 507				action = "allocate";
 508			break;
 509		case ALLOC_MID:
 510			if (strcmp(next->name, label_id->id) == 0) {
 511				/* adjust next resource up */
 512				rc = adjust_resource(next, next->start
 513						- allocate, resource_size(next)
 514						+ allocate);
 515				new_res = next;
 516				action = "next grow up";
 517			} else if (strcmp(res->name, label_id->id) == 0) {
 518				action = "grow down";
 519			} else
 520				action = "allocate";
 521			break;
 522		case ALLOC_AFTER:
 523			if (strcmp(res->name, label_id->id) == 0)
 524				action = "grow down";
 525			else
 526				action = "allocate";
 527			break;
 528		default:
 529			return n;
 530		}
 531
 532		if (strcmp(action, "allocate") == 0) {
 533			new_res = nvdimm_allocate_dpa(ndd, label_id,
 534					valid.start, allocate);
 535			if (!new_res)
 536				rc = -EBUSY;
 537		} else if (strcmp(action, "grow down") == 0) {
 538			/* adjust current resource down */
 539			rc = adjust_resource(res, res->start, resource_size(res)
 540					+ allocate);
 541			if (rc == 0)
 542				res->flags |= DPA_RESOURCE_ADJUSTED;
 543		}
 544
 545		if (!new_res)
 546			new_res = res;
 547
 548		nd_dbg_dpa(nd_region, ndd, new_res, "%s(%d) %d\n",
 549				action, loc, rc);
 550
 551		if (rc)
 552			return n;
 553
 554		n -= allocate;
 555		if (n) {
 556			/*
 557			 * Retry scan with newly inserted resources.
 558			 * For example, if we did an ALLOC_BEFORE
 559			 * insertion there may also have been space
 560			 * available for an ALLOC_AFTER insertion, so we
 561			 * need to check this same resource again
 562			 */
 563			goto retry;
 564		} else
 565			return 0;
 566	}
 567
 568	if (n == to_allocate)
 569		return init_dpa_allocation(label_id, nd_region, nd_mapping, n);
 570	return n;
 571}
 572
 573static int merge_dpa(struct nd_region *nd_region,
 574		struct nd_mapping *nd_mapping, struct nd_label_id *label_id)
 575{
 576	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 577	struct resource *res;
 578
 579	if (strncmp("pmem", label_id->id, 4) == 0)
 580		return 0;
 581 retry:
 582	for_each_dpa_resource(ndd, res) {
 583		int rc;
 584		struct resource *next = res->sibling;
 585		resource_size_t end = res->start + resource_size(res);
 586
 587		if (!next || strcmp(res->name, label_id->id) != 0
 588				|| strcmp(next->name, label_id->id) != 0
 589				|| end != next->start)
 590			continue;
 591		end += resource_size(next);
 592		nvdimm_free_dpa(ndd, next);
 593		rc = adjust_resource(res, res->start, end - res->start);
 594		nd_dbg_dpa(nd_region, ndd, res, "merge %d\n", rc);
 595		if (rc)
 596			return rc;
 597		res->flags |= DPA_RESOURCE_ADJUSTED;
 598		goto retry;
 599	}
 600
 601	return 0;
 602}
 603
 604int __reserve_free_pmem(struct device *dev, void *data)
 605{
 606	struct nvdimm *nvdimm = data;
 607	struct nd_region *nd_region;
 608	struct nd_label_id label_id;
 609	int i;
 610
 611	if (!is_memory(dev))
 612		return 0;
 613
 614	nd_region = to_nd_region(dev);
 615	if (nd_region->ndr_mappings == 0)
 616		return 0;
 617
 618	memset(&label_id, 0, sizeof(label_id));
 619	strcat(label_id.id, "pmem-reserve");
 620	for (i = 0; i < nd_region->ndr_mappings; i++) {
 621		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 622		resource_size_t n, rem = 0;
 623
 624		if (nd_mapping->nvdimm != nvdimm)
 625			continue;
 626
 627		n = nd_pmem_available_dpa(nd_region, nd_mapping);
 628		if (n == 0)
 629			return 0;
 630		rem = scan_allocate(nd_region, nd_mapping, &label_id, n);
 631		dev_WARN_ONCE(&nd_region->dev, rem,
 632				"pmem reserve underrun: %#llx of %#llx bytes\n",
 633				(unsigned long long) n - rem,
 634				(unsigned long long) n);
 635		return rem ? -ENXIO : 0;
 636	}
 637
 638	return 0;
 639}
 640
 641void release_free_pmem(struct nvdimm_bus *nvdimm_bus,
 642		struct nd_mapping *nd_mapping)
 643{
 644	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 645	struct resource *res, *_res;
 646
 647	for_each_dpa_resource_safe(ndd, res, _res)
 648		if (strcmp(res->name, "pmem-reserve") == 0)
 649			nvdimm_free_dpa(ndd, res);
 650}
 651
 652/**
 653 * grow_dpa_allocation - for each dimm allocate n bytes for @label_id
 654 * @nd_region: the set of dimms to allocate @n more bytes from
 655 * @label_id: unique identifier for the namespace consuming this dpa range
 656 * @n: number of bytes per-dimm to add to the existing allocation
 657 *
 658 * Assumes resources are ordered.  For BLK regions, first consume
 659 * BLK-only available DPA free space, then consume PMEM-aliased DPA
 660 * space starting at the highest DPA.  For PMEM regions start
 661 * allocations from the start of an interleave set and end at the first
 662 * BLK allocation or the end of the interleave set, whichever comes
 663 * first.
 
 
 664 */
 665static int grow_dpa_allocation(struct nd_region *nd_region,
 666		struct nd_label_id *label_id, resource_size_t n)
 667{
 668	int i;
 669
 670	for (i = 0; i < nd_region->ndr_mappings; i++) {
 671		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 672		resource_size_t rem = n;
 673		int rc;
 674
 675		rem = scan_allocate(nd_region, nd_mapping, label_id, rem);
 676		dev_WARN_ONCE(&nd_region->dev, rem,
 677				"allocation underrun: %#llx of %#llx bytes\n",
 678				(unsigned long long) n - rem,
 679				(unsigned long long) n);
 680		if (rem)
 681			return -ENXIO;
 682
 683		rc = merge_dpa(nd_region, nd_mapping, label_id);
 684		if (rc)
 685			return rc;
 686	}
 687
 688	return 0;
 689}
 690
 691static void nd_namespace_pmem_set_resource(struct nd_region *nd_region,
 692		struct nd_namespace_pmem *nspm, resource_size_t size)
 693{
 694	struct resource *res = &nspm->nsio.res;
 695	resource_size_t offset = 0;
 696
 697	if (size && !nspm->uuid) {
 698		WARN_ON_ONCE(1);
 699		size = 0;
 700	}
 701
 702	if (size && nspm->uuid) {
 703		struct nd_mapping *nd_mapping = &nd_region->mapping[0];
 704		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 705		struct nd_label_id label_id;
 706		struct resource *res;
 707
 708		if (!ndd) {
 709			size = 0;
 710			goto out;
 711		}
 712
 713		nd_label_gen_id(&label_id, nspm->uuid, 0);
 714
 715		/* calculate a spa offset from the dpa allocation offset */
 716		for_each_dpa_resource(ndd, res)
 717			if (strcmp(res->name, label_id.id) == 0) {
 718				offset = (res->start - nd_mapping->start)
 719					* nd_region->ndr_mappings;
 720				goto out;
 721			}
 722
 723		WARN_ON_ONCE(1);
 724		size = 0;
 725	}
 726
 727 out:
 728	res->start = nd_region->ndr_start + offset;
 729	res->end = res->start + size - 1;
 730}
 731
 732static bool uuid_not_set(const uuid_t *uuid, struct device *dev,
 733			 const char *where)
 734{
 735	if (!uuid) {
 736		dev_dbg(dev, "%s: uuid not set\n", where);
 737		return true;
 738	}
 739	return false;
 740}
 741
 742static ssize_t __size_store(struct device *dev, unsigned long long val)
 743{
 744	resource_size_t allocated = 0, available = 0;
 745	struct nd_region *nd_region = to_nd_region(dev->parent);
 746	struct nd_namespace_common *ndns = to_ndns(dev);
 747	struct nd_mapping *nd_mapping;
 748	struct nvdimm_drvdata *ndd;
 749	struct nd_label_id label_id;
 750	u32 flags = 0, remainder;
 751	int rc, i, id = -1;
 752	uuid_t *uuid = NULL;
 753
 754	if (dev->driver || ndns->claim)
 755		return -EBUSY;
 756
 757	if (is_namespace_pmem(dev)) {
 758		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 759
 760		uuid = nspm->uuid;
 761		id = nspm->id;
 762	}
 763
 764	/*
 765	 * We need a uuid for the allocation-label and dimm(s) on which
 766	 * to store the label.
 767	 */
 768	if (uuid_not_set(uuid, dev, __func__))
 769		return -ENXIO;
 770	if (nd_region->ndr_mappings == 0) {
 771		dev_dbg(dev, "not associated with dimm(s)\n");
 772		return -ENXIO;
 773	}
 774
 775	div_u64_rem(val, nd_region->align, &remainder);
 776	if (remainder) {
 777		dev_dbg(dev, "%llu is not %ldK aligned\n", val,
 778				nd_region->align / SZ_1K);
 779		return -EINVAL;
 780	}
 781
 782	nd_label_gen_id(&label_id, uuid, flags);
 783	for (i = 0; i < nd_region->ndr_mappings; i++) {
 784		nd_mapping = &nd_region->mapping[i];
 785		ndd = to_ndd(nd_mapping);
 786
 787		/*
 788		 * All dimms in an interleave set, need to be enabled
 789		 * for the size to be changed.
 790		 */
 791		if (!ndd)
 792			return -ENXIO;
 793
 794		allocated += nvdimm_allocated_dpa(ndd, &label_id);
 795	}
 796	available = nd_region_allocatable_dpa(nd_region);
 797
 798	if (val > available + allocated)
 799		return -ENOSPC;
 800
 801	if (val == allocated)
 802		return 0;
 803
 804	val = div_u64(val, nd_region->ndr_mappings);
 805	allocated = div_u64(allocated, nd_region->ndr_mappings);
 806	if (val < allocated)
 807		rc = shrink_dpa_allocation(nd_region, &label_id,
 808				allocated - val);
 809	else
 810		rc = grow_dpa_allocation(nd_region, &label_id, val - allocated);
 811
 812	if (rc)
 813		return rc;
 814
 815	if (is_namespace_pmem(dev)) {
 816		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 817
 818		nd_namespace_pmem_set_resource(nd_region, nspm,
 819				val * nd_region->ndr_mappings);
 820	}
 821
 822	/*
 823	 * Try to delete the namespace if we deleted all of its
 824	 * allocation, this is not the seed or 0th device for the
 825	 * region, and it is not actively claimed by a btt, pfn, or dax
 826	 * instance.
 827	 */
 828	if (val == 0 && id != 0 && nd_region->ns_seed != dev && !ndns->claim)
 829		nd_device_unregister(dev, ND_ASYNC);
 830
 831	return rc;
 832}
 833
 834static ssize_t size_store(struct device *dev,
 835		struct device_attribute *attr, const char *buf, size_t len)
 836{
 837	struct nd_region *nd_region = to_nd_region(dev->parent);
 838	unsigned long long val;
 839	int rc;
 840
 841	rc = kstrtoull(buf, 0, &val);
 842	if (rc)
 843		return rc;
 844
 845	device_lock(dev);
 846	nvdimm_bus_lock(dev);
 847	wait_nvdimm_bus_probe_idle(dev);
 848	rc = __size_store(dev, val);
 849	if (rc >= 0)
 850		rc = nd_namespace_label_update(nd_region, dev);
 851
 852	/* setting size zero == 'delete namespace' */
 853	if (rc == 0 && val == 0 && is_namespace_pmem(dev)) {
 854		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 855
 856		kfree(nspm->uuid);
 857		nspm->uuid = NULL;
 858	}
 859
 860	dev_dbg(dev, "%llx %s (%d)\n", val, rc < 0 ? "fail" : "success", rc);
 861
 862	nvdimm_bus_unlock(dev);
 863	device_unlock(dev);
 864
 865	return rc < 0 ? rc : len;
 866}
 867
 868resource_size_t __nvdimm_namespace_capacity(struct nd_namespace_common *ndns)
 869{
 870	struct device *dev = &ndns->dev;
 871
 872	if (is_namespace_pmem(dev)) {
 873		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 874
 875		return resource_size(&nspm->nsio.res);
 876	} else if (is_namespace_io(dev)) {
 877		struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
 878
 879		return resource_size(&nsio->res);
 880	} else
 881		WARN_ONCE(1, "unknown namespace type\n");
 882	return 0;
 883}
 884
 885resource_size_t nvdimm_namespace_capacity(struct nd_namespace_common *ndns)
 886{
 887	resource_size_t size;
 888
 889	nvdimm_bus_lock(&ndns->dev);
 890	size = __nvdimm_namespace_capacity(ndns);
 891	nvdimm_bus_unlock(&ndns->dev);
 892
 893	return size;
 894}
 895EXPORT_SYMBOL(nvdimm_namespace_capacity);
 896
 897bool nvdimm_namespace_locked(struct nd_namespace_common *ndns)
 898{
 899	int i;
 900	bool locked = false;
 901	struct device *dev = &ndns->dev;
 902	struct nd_region *nd_region = to_nd_region(dev->parent);
 903
 904	for (i = 0; i < nd_region->ndr_mappings; i++) {
 905		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 906		struct nvdimm *nvdimm = nd_mapping->nvdimm;
 907
 908		if (test_bit(NDD_LOCKED, &nvdimm->flags)) {
 909			dev_dbg(dev, "%s locked\n", nvdimm_name(nvdimm));
 910			locked = true;
 911		}
 912	}
 913	return locked;
 914}
 915EXPORT_SYMBOL(nvdimm_namespace_locked);
 916
 917static ssize_t size_show(struct device *dev,
 918		struct device_attribute *attr, char *buf)
 919{
 920	return sprintf(buf, "%llu\n", (unsigned long long)
 921			nvdimm_namespace_capacity(to_ndns(dev)));
 922}
 923static DEVICE_ATTR(size, 0444, size_show, size_store);
 924
 925static uuid_t *namespace_to_uuid(struct device *dev)
 926{
 927	if (is_namespace_pmem(dev)) {
 928		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
 929
 930		return nspm->uuid;
 931	}
 932	return ERR_PTR(-ENXIO);
 933}
 934
 935static ssize_t uuid_show(struct device *dev, struct device_attribute *attr,
 936			 char *buf)
 937{
 938	uuid_t *uuid = namespace_to_uuid(dev);
 939
 940	if (IS_ERR(uuid))
 941		return PTR_ERR(uuid);
 942	if (uuid)
 943		return sprintf(buf, "%pUb\n", uuid);
 944	return sprintf(buf, "\n");
 945}
 946
 947/**
 948 * namespace_update_uuid - check for a unique uuid and whether we're "renaming"
 949 * @nd_region: parent region so we can updates all dimms in the set
 950 * @dev: namespace type for generating label_id
 951 * @new_uuid: incoming uuid
 952 * @old_uuid: reference to the uuid storage location in the namespace object
 
 
 953 */
 954static int namespace_update_uuid(struct nd_region *nd_region,
 955				 struct device *dev, uuid_t *new_uuid,
 956				 uuid_t **old_uuid)
 957{
 958	struct nd_label_id old_label_id;
 959	struct nd_label_id new_label_id;
 960	int i;
 961
 962	if (!nd_is_uuid_unique(dev, new_uuid))
 963		return -EINVAL;
 964
 965	if (*old_uuid == NULL)
 966		goto out;
 967
 968	/*
 969	 * If we've already written a label with this uuid, then it's
 970	 * too late to rename because we can't reliably update the uuid
 971	 * without losing the old namespace.  Userspace must delete this
 972	 * namespace to abandon the old uuid.
 973	 */
 974	for (i = 0; i < nd_region->ndr_mappings; i++) {
 975		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 976
 977		/*
 978		 * This check by itself is sufficient because old_uuid
 979		 * would be NULL above if this uuid did not exist in the
 980		 * currently written set.
 981		 *
 982		 * FIXME: can we delete uuid with zero dpa allocated?
 983		 */
 984		if (list_empty(&nd_mapping->labels))
 985			return -EBUSY;
 986	}
 987
 988	nd_label_gen_id(&old_label_id, *old_uuid, 0);
 989	nd_label_gen_id(&new_label_id, new_uuid, 0);
 990	for (i = 0; i < nd_region->ndr_mappings; i++) {
 991		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
 992		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
 993		struct nd_label_ent *label_ent;
 994		struct resource *res;
 995
 996		for_each_dpa_resource(ndd, res)
 997			if (strcmp(res->name, old_label_id.id) == 0)
 998				sprintf((void *) res->name, "%s",
 999						new_label_id.id);
1000
1001		mutex_lock(&nd_mapping->lock);
1002		list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1003			struct nd_namespace_label *nd_label = label_ent->label;
1004			struct nd_label_id label_id;
1005			uuid_t uuid;
1006
1007			if (!nd_label)
1008				continue;
1009			nsl_get_uuid(ndd, nd_label, &uuid);
1010			nd_label_gen_id(&label_id, &uuid,
1011					nsl_get_flags(ndd, nd_label));
1012			if (strcmp(old_label_id.id, label_id.id) == 0)
1013				set_bit(ND_LABEL_REAP, &label_ent->flags);
1014		}
1015		mutex_unlock(&nd_mapping->lock);
1016	}
1017	kfree(*old_uuid);
1018 out:
1019	*old_uuid = new_uuid;
1020	return 0;
1021}
1022
1023static ssize_t uuid_store(struct device *dev,
1024		struct device_attribute *attr, const char *buf, size_t len)
1025{
1026	struct nd_region *nd_region = to_nd_region(dev->parent);
1027	uuid_t *uuid = NULL;
1028	uuid_t **ns_uuid;
1029	ssize_t rc = 0;
1030
1031	if (is_namespace_pmem(dev)) {
1032		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1033
1034		ns_uuid = &nspm->uuid;
1035	} else
1036		return -ENXIO;
1037
1038	device_lock(dev);
1039	nvdimm_bus_lock(dev);
1040	wait_nvdimm_bus_probe_idle(dev);
1041	if (to_ndns(dev)->claim)
1042		rc = -EBUSY;
1043	if (rc >= 0)
1044		rc = nd_uuid_store(dev, &uuid, buf, len);
1045	if (rc >= 0)
1046		rc = namespace_update_uuid(nd_region, dev, uuid, ns_uuid);
1047	if (rc >= 0)
1048		rc = nd_namespace_label_update(nd_region, dev);
1049	else
1050		kfree(uuid);
1051	dev_dbg(dev, "result: %zd wrote: %s%s", rc, buf,
1052			buf[len - 1] == '\n' ? "" : "\n");
1053	nvdimm_bus_unlock(dev);
1054	device_unlock(dev);
1055
1056	return rc < 0 ? rc : len;
1057}
1058static DEVICE_ATTR_RW(uuid);
1059
1060static ssize_t resource_show(struct device *dev,
1061		struct device_attribute *attr, char *buf)
1062{
1063	struct resource *res;
1064
1065	if (is_namespace_pmem(dev)) {
1066		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1067
1068		res = &nspm->nsio.res;
1069	} else if (is_namespace_io(dev)) {
1070		struct nd_namespace_io *nsio = to_nd_namespace_io(dev);
1071
1072		res = &nsio->res;
1073	} else
1074		return -ENXIO;
1075
1076	/* no address to convey if the namespace has no allocation */
1077	if (resource_size(res) == 0)
1078		return -ENXIO;
1079	return sprintf(buf, "%#llx\n", (unsigned long long) res->start);
1080}
1081static DEVICE_ATTR_ADMIN_RO(resource);
1082
1083static const unsigned long pmem_lbasize_supported[] = { 512, 4096, 0 };
1084
1085static ssize_t sector_size_show(struct device *dev,
1086		struct device_attribute *attr, char *buf)
1087{
1088	if (is_namespace_pmem(dev)) {
1089		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1090
1091		return nd_size_select_show(nspm->lbasize,
1092				pmem_lbasize_supported, buf);
1093	}
1094	return -ENXIO;
1095}
1096
1097static ssize_t sector_size_store(struct device *dev,
1098		struct device_attribute *attr, const char *buf, size_t len)
1099{
1100	struct nd_region *nd_region = to_nd_region(dev->parent);
1101	const unsigned long *supported;
1102	unsigned long *lbasize;
1103	ssize_t rc = 0;
1104
1105	if (is_namespace_pmem(dev)) {
1106		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1107
1108		lbasize = &nspm->lbasize;
1109		supported = pmem_lbasize_supported;
1110	} else
1111		return -ENXIO;
1112
1113	device_lock(dev);
1114	nvdimm_bus_lock(dev);
1115	if (to_ndns(dev)->claim)
1116		rc = -EBUSY;
1117	if (rc >= 0)
1118		rc = nd_size_select_store(dev, buf, lbasize, supported);
1119	if (rc >= 0)
1120		rc = nd_namespace_label_update(nd_region, dev);
1121	dev_dbg(dev, "result: %zd %s: %s%s", rc, rc < 0 ? "tried" : "wrote",
1122			buf, buf[len - 1] == '\n' ? "" : "\n");
1123	nvdimm_bus_unlock(dev);
1124	device_unlock(dev);
1125
1126	return rc ? rc : len;
1127}
1128static DEVICE_ATTR_RW(sector_size);
1129
1130static ssize_t dpa_extents_show(struct device *dev,
1131		struct device_attribute *attr, char *buf)
1132{
1133	struct nd_region *nd_region = to_nd_region(dev->parent);
1134	struct nd_label_id label_id;
1135	uuid_t *uuid = NULL;
1136	int count = 0, i;
1137	u32 flags = 0;
1138
1139	nvdimm_bus_lock(dev);
1140	if (is_namespace_pmem(dev)) {
1141		struct nd_namespace_pmem *nspm = to_nd_namespace_pmem(dev);
1142
1143		uuid = nspm->uuid;
1144		flags = 0;
1145	}
1146
1147	if (!uuid)
1148		goto out;
1149
1150	nd_label_gen_id(&label_id, uuid, flags);
1151	for (i = 0; i < nd_region->ndr_mappings; i++) {
1152		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1153		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1154		struct resource *res;
1155
1156		for_each_dpa_resource(ndd, res)
1157			if (strcmp(res->name, label_id.id) == 0)
1158				count++;
1159	}
1160 out:
1161	nvdimm_bus_unlock(dev);
1162
1163	return sprintf(buf, "%d\n", count);
1164}
1165static DEVICE_ATTR_RO(dpa_extents);
1166
1167static int btt_claim_class(struct device *dev)
1168{
1169	struct nd_region *nd_region = to_nd_region(dev->parent);
1170	int i, loop_bitmask = 0;
1171
1172	for (i = 0; i < nd_region->ndr_mappings; i++) {
1173		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1174		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1175		struct nd_namespace_index *nsindex;
1176
1177		/*
1178		 * If any of the DIMMs do not support labels the only
1179		 * possible BTT format is v1.
1180		 */
1181		if (!ndd) {
1182			loop_bitmask = 0;
1183			break;
1184		}
1185
1186		nsindex = to_namespace_index(ndd, ndd->ns_current);
1187		if (nsindex == NULL)
1188			loop_bitmask |= 1;
1189		else {
1190			/* check whether existing labels are v1.1 or v1.2 */
1191			if (__le16_to_cpu(nsindex->major) == 1
1192					&& __le16_to_cpu(nsindex->minor) == 1)
1193				loop_bitmask |= 2;
1194			else
1195				loop_bitmask |= 4;
1196		}
1197	}
1198	/*
1199	 * If nsindex is null loop_bitmask's bit 0 will be set, and if an index
1200	 * block is found, a v1.1 label for any mapping will set bit 1, and a
1201	 * v1.2 label will set bit 2.
1202	 *
1203	 * At the end of the loop, at most one of the three bits must be set.
1204	 * If multiple bits were set, it means the different mappings disagree
1205	 * about their labels, and this must be cleaned up first.
1206	 *
1207	 * If all the label index blocks are found to agree, nsindex of NULL
1208	 * implies labels haven't been initialized yet, and when they will,
1209	 * they will be of the 1.2 format, so we can assume BTT2.0
1210	 *
1211	 * If 1.1 labels are found, we enforce BTT1.1, and if 1.2 labels are
1212	 * found, we enforce BTT2.0
1213	 *
1214	 * If the loop was never entered, default to BTT1.1 (legacy namespaces)
1215	 */
1216	switch (loop_bitmask) {
1217	case 0:
1218	case 2:
1219		return NVDIMM_CCLASS_BTT;
1220	case 1:
1221	case 4:
1222		return NVDIMM_CCLASS_BTT2;
1223	default:
1224		return -ENXIO;
1225	}
1226}
1227
1228static ssize_t holder_show(struct device *dev,
1229		struct device_attribute *attr, char *buf)
1230{
1231	struct nd_namespace_common *ndns = to_ndns(dev);
1232	ssize_t rc;
1233
1234	device_lock(dev);
1235	rc = sprintf(buf, "%s\n", ndns->claim ? dev_name(ndns->claim) : "");
1236	device_unlock(dev);
1237
1238	return rc;
1239}
1240static DEVICE_ATTR_RO(holder);
1241
1242static int __holder_class_store(struct device *dev, const char *buf)
1243{
1244	struct nd_namespace_common *ndns = to_ndns(dev);
1245
1246	if (dev->driver || ndns->claim)
1247		return -EBUSY;
1248
1249	if (sysfs_streq(buf, "btt")) {
1250		int rc = btt_claim_class(dev);
1251
1252		if (rc < NVDIMM_CCLASS_NONE)
1253			return rc;
1254		ndns->claim_class = rc;
1255	} else if (sysfs_streq(buf, "pfn"))
1256		ndns->claim_class = NVDIMM_CCLASS_PFN;
1257	else if (sysfs_streq(buf, "dax"))
1258		ndns->claim_class = NVDIMM_CCLASS_DAX;
1259	else if (sysfs_streq(buf, ""))
1260		ndns->claim_class = NVDIMM_CCLASS_NONE;
1261	else
1262		return -EINVAL;
1263
1264	return 0;
1265}
1266
1267static ssize_t holder_class_store(struct device *dev,
1268		struct device_attribute *attr, const char *buf, size_t len)
1269{
1270	struct nd_region *nd_region = to_nd_region(dev->parent);
1271	int rc;
1272
1273	device_lock(dev);
1274	nvdimm_bus_lock(dev);
1275	wait_nvdimm_bus_probe_idle(dev);
1276	rc = __holder_class_store(dev, buf);
1277	if (rc >= 0)
1278		rc = nd_namespace_label_update(nd_region, dev);
1279	dev_dbg(dev, "%s(%d)\n", rc < 0 ? "fail " : "", rc);
1280	nvdimm_bus_unlock(dev);
1281	device_unlock(dev);
1282
1283	return rc < 0 ? rc : len;
1284}
1285
1286static ssize_t holder_class_show(struct device *dev,
1287		struct device_attribute *attr, char *buf)
1288{
1289	struct nd_namespace_common *ndns = to_ndns(dev);
1290	ssize_t rc;
1291
1292	device_lock(dev);
1293	if (ndns->claim_class == NVDIMM_CCLASS_NONE)
1294		rc = sprintf(buf, "\n");
1295	else if ((ndns->claim_class == NVDIMM_CCLASS_BTT) ||
1296			(ndns->claim_class == NVDIMM_CCLASS_BTT2))
1297		rc = sprintf(buf, "btt\n");
1298	else if (ndns->claim_class == NVDIMM_CCLASS_PFN)
1299		rc = sprintf(buf, "pfn\n");
1300	else if (ndns->claim_class == NVDIMM_CCLASS_DAX)
1301		rc = sprintf(buf, "dax\n");
1302	else
1303		rc = sprintf(buf, "<unknown>\n");
1304	device_unlock(dev);
1305
1306	return rc;
1307}
1308static DEVICE_ATTR_RW(holder_class);
1309
1310static ssize_t mode_show(struct device *dev,
1311		struct device_attribute *attr, char *buf)
1312{
1313	struct nd_namespace_common *ndns = to_ndns(dev);
1314	struct device *claim;
1315	char *mode;
1316	ssize_t rc;
1317
1318	device_lock(dev);
1319	claim = ndns->claim;
1320	if (claim && is_nd_btt(claim))
1321		mode = "safe";
1322	else if (claim && is_nd_pfn(claim))
1323		mode = "memory";
1324	else if (claim && is_nd_dax(claim))
1325		mode = "dax";
1326	else if (!claim && pmem_should_map_pages(dev))
1327		mode = "memory";
1328	else
1329		mode = "raw";
1330	rc = sprintf(buf, "%s\n", mode);
1331	device_unlock(dev);
1332
1333	return rc;
1334}
1335static DEVICE_ATTR_RO(mode);
1336
1337static ssize_t force_raw_store(struct device *dev,
1338		struct device_attribute *attr, const char *buf, size_t len)
1339{
1340	bool force_raw;
1341	int rc = strtobool(buf, &force_raw);
1342
1343	if (rc)
1344		return rc;
1345
1346	to_ndns(dev)->force_raw = force_raw;
1347	return len;
1348}
1349
1350static ssize_t force_raw_show(struct device *dev,
1351		struct device_attribute *attr, char *buf)
1352{
1353	return sprintf(buf, "%d\n", to_ndns(dev)->force_raw);
1354}
1355static DEVICE_ATTR_RW(force_raw);
1356
1357static struct attribute *nd_namespace_attributes[] = {
1358	&dev_attr_nstype.attr,
1359	&dev_attr_size.attr,
1360	&dev_attr_mode.attr,
1361	&dev_attr_uuid.attr,
1362	&dev_attr_holder.attr,
1363	&dev_attr_resource.attr,
1364	&dev_attr_alt_name.attr,
1365	&dev_attr_force_raw.attr,
1366	&dev_attr_sector_size.attr,
1367	&dev_attr_dpa_extents.attr,
1368	&dev_attr_holder_class.attr,
1369	NULL,
1370};
1371
1372static umode_t namespace_visible(struct kobject *kobj,
1373		struct attribute *a, int n)
1374{
1375	struct device *dev = container_of(kobj, struct device, kobj);
1376
1377	if (is_namespace_pmem(dev)) {
1378		if (a == &dev_attr_size.attr)
1379			return 0644;
1380
1381		return a->mode;
1382	}
1383
1384	/* base is_namespace_io() attributes */
1385	if (a == &dev_attr_nstype.attr || a == &dev_attr_size.attr ||
1386	    a == &dev_attr_holder.attr || a == &dev_attr_holder_class.attr ||
1387	    a == &dev_attr_force_raw.attr || a == &dev_attr_mode.attr ||
1388	    a == &dev_attr_resource.attr)
1389		return a->mode;
1390
1391	return 0;
1392}
1393
1394static struct attribute_group nd_namespace_attribute_group = {
1395	.attrs = nd_namespace_attributes,
1396	.is_visible = namespace_visible,
1397};
1398
1399static const struct attribute_group *nd_namespace_attribute_groups[] = {
1400	&nd_device_attribute_group,
1401	&nd_namespace_attribute_group,
1402	&nd_numa_attribute_group,
1403	NULL,
1404};
1405
1406static const struct device_type namespace_io_device_type = {
1407	.name = "nd_namespace_io",
1408	.release = namespace_io_release,
1409	.groups = nd_namespace_attribute_groups,
1410};
1411
1412static const struct device_type namespace_pmem_device_type = {
1413	.name = "nd_namespace_pmem",
1414	.release = namespace_pmem_release,
1415	.groups = nd_namespace_attribute_groups,
1416};
1417
1418static bool is_namespace_pmem(const struct device *dev)
1419{
1420	return dev ? dev->type == &namespace_pmem_device_type : false;
1421}
1422
1423static bool is_namespace_io(const struct device *dev)
1424{
1425	return dev ? dev->type == &namespace_io_device_type : false;
1426}
1427
1428struct nd_namespace_common *nvdimm_namespace_common_probe(struct device *dev)
1429{
1430	struct nd_btt *nd_btt = is_nd_btt(dev) ? to_nd_btt(dev) : NULL;
1431	struct nd_pfn *nd_pfn = is_nd_pfn(dev) ? to_nd_pfn(dev) : NULL;
1432	struct nd_dax *nd_dax = is_nd_dax(dev) ? to_nd_dax(dev) : NULL;
1433	struct nd_namespace_common *ndns = NULL;
1434	resource_size_t size;
1435
1436	if (nd_btt || nd_pfn || nd_dax) {
1437		if (nd_btt)
1438			ndns = nd_btt->ndns;
1439		else if (nd_pfn)
1440			ndns = nd_pfn->ndns;
1441		else if (nd_dax)
1442			ndns = nd_dax->nd_pfn.ndns;
1443
1444		if (!ndns)
1445			return ERR_PTR(-ENODEV);
1446
1447		/*
1448		 * Flush any in-progess probes / removals in the driver
1449		 * for the raw personality of this namespace.
1450		 */
1451		device_lock(&ndns->dev);
1452		device_unlock(&ndns->dev);
1453		if (ndns->dev.driver) {
1454			dev_dbg(&ndns->dev, "is active, can't bind %s\n",
1455					dev_name(dev));
1456			return ERR_PTR(-EBUSY);
1457		}
1458		if (dev_WARN_ONCE(&ndns->dev, ndns->claim != dev,
1459					"host (%s) vs claim (%s) mismatch\n",
1460					dev_name(dev),
1461					dev_name(ndns->claim)))
1462			return ERR_PTR(-ENXIO);
1463	} else {
1464		ndns = to_ndns(dev);
1465		if (ndns->claim) {
1466			dev_dbg(dev, "claimed by %s, failing probe\n",
1467				dev_name(ndns->claim));
1468
1469			return ERR_PTR(-ENXIO);
1470		}
1471	}
1472
1473	if (nvdimm_namespace_locked(ndns))
1474		return ERR_PTR(-EACCES);
1475
1476	size = nvdimm_namespace_capacity(ndns);
1477	if (size < ND_MIN_NAMESPACE_SIZE) {
1478		dev_dbg(&ndns->dev, "%pa, too small must be at least %#x\n",
1479				&size, ND_MIN_NAMESPACE_SIZE);
1480		return ERR_PTR(-ENODEV);
1481	}
1482
1483	/*
1484	 * Note, alignment validation for fsdax and devdax mode
1485	 * namespaces happens in nd_pfn_validate() where infoblock
1486	 * padding parameters can be applied.
1487	 */
1488	if (pmem_should_map_pages(dev)) {
1489		struct nd_namespace_io *nsio = to_nd_namespace_io(&ndns->dev);
1490		struct resource *res = &nsio->res;
1491
1492		if (!IS_ALIGNED(res->start | (res->end + 1),
1493					memremap_compat_align())) {
1494			dev_err(&ndns->dev, "%pr misaligned, unable to map\n", res);
1495			return ERR_PTR(-EOPNOTSUPP);
1496		}
1497	}
1498
1499	if (is_namespace_pmem(&ndns->dev)) {
1500		struct nd_namespace_pmem *nspm;
1501
1502		nspm = to_nd_namespace_pmem(&ndns->dev);
1503		if (uuid_not_set(nspm->uuid, &ndns->dev, __func__))
1504			return ERR_PTR(-ENODEV);
1505	}
1506
1507	return ndns;
1508}
1509EXPORT_SYMBOL(nvdimm_namespace_common_probe);
1510
1511int devm_namespace_enable(struct device *dev, struct nd_namespace_common *ndns,
1512		resource_size_t size)
1513{
1514	return devm_nsio_enable(dev, to_nd_namespace_io(&ndns->dev), size);
1515}
1516EXPORT_SYMBOL_GPL(devm_namespace_enable);
1517
1518void devm_namespace_disable(struct device *dev, struct nd_namespace_common *ndns)
1519{
1520	devm_nsio_disable(dev, to_nd_namespace_io(&ndns->dev));
1521}
1522EXPORT_SYMBOL_GPL(devm_namespace_disable);
1523
1524static struct device **create_namespace_io(struct nd_region *nd_region)
1525{
1526	struct nd_namespace_io *nsio;
1527	struct device *dev, **devs;
1528	struct resource *res;
1529
1530	nsio = kzalloc(sizeof(*nsio), GFP_KERNEL);
1531	if (!nsio)
1532		return NULL;
1533
1534	devs = kcalloc(2, sizeof(struct device *), GFP_KERNEL);
1535	if (!devs) {
1536		kfree(nsio);
1537		return NULL;
1538	}
1539
1540	dev = &nsio->common.dev;
1541	dev->type = &namespace_io_device_type;
1542	dev->parent = &nd_region->dev;
1543	res = &nsio->res;
1544	res->name = dev_name(&nd_region->dev);
1545	res->flags = IORESOURCE_MEM;
1546	res->start = nd_region->ndr_start;
1547	res->end = res->start + nd_region->ndr_size - 1;
1548
1549	devs[0] = dev;
1550	return devs;
1551}
1552
1553static bool has_uuid_at_pos(struct nd_region *nd_region, const uuid_t *uuid,
1554			    u64 cookie, u16 pos)
1555{
1556	struct nd_namespace_label *found = NULL;
1557	int i;
1558
1559	for (i = 0; i < nd_region->ndr_mappings; i++) {
1560		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1561		struct nd_interleave_set *nd_set = nd_region->nd_set;
1562		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1563		struct nd_label_ent *label_ent;
1564		bool found_uuid = false;
1565
1566		list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1567			struct nd_namespace_label *nd_label = label_ent->label;
1568			u16 position;
1569
1570			if (!nd_label)
1571				continue;
1572			position = nsl_get_position(ndd, nd_label);
1573
1574			if (!nsl_validate_isetcookie(ndd, nd_label, cookie))
1575				continue;
1576
1577			if (!nsl_uuid_equal(ndd, nd_label, uuid))
1578				continue;
1579
1580			if (!nsl_validate_type_guid(ndd, nd_label,
1581						    &nd_set->type_guid))
1582				continue;
1583
1584			if (found_uuid) {
1585				dev_dbg(ndd->dev, "duplicate entry for uuid\n");
1586				return false;
1587			}
1588			found_uuid = true;
1589			if (!nsl_validate_nlabel(nd_region, ndd, nd_label))
1590				continue;
1591			if (position != pos)
1592				continue;
1593			found = nd_label;
1594			break;
1595		}
1596		if (found)
1597			break;
1598	}
1599	return found != NULL;
1600}
1601
1602static int select_pmem_id(struct nd_region *nd_region, const uuid_t *pmem_id)
1603{
1604	int i;
1605
1606	if (!pmem_id)
1607		return -ENODEV;
1608
1609	for (i = 0; i < nd_region->ndr_mappings; i++) {
1610		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
1611		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1612		struct nd_namespace_label *nd_label = NULL;
1613		u64 hw_start, hw_end, pmem_start, pmem_end;
1614		struct nd_label_ent *label_ent;
1615
1616		lockdep_assert_held(&nd_mapping->lock);
1617		list_for_each_entry(label_ent, &nd_mapping->labels, list) {
1618			nd_label = label_ent->label;
1619			if (!nd_label)
1620				continue;
1621			if (nsl_uuid_equal(ndd, nd_label, pmem_id))
1622				break;
1623			nd_label = NULL;
1624		}
1625
1626		if (!nd_label) {
1627			WARN_ON(1);
1628			return -EINVAL;
1629		}
1630
1631		/*
1632		 * Check that this label is compliant with the dpa
1633		 * range published in NFIT
1634		 */
1635		hw_start = nd_mapping->start;
1636		hw_end = hw_start + nd_mapping->size;
1637		pmem_start = nsl_get_dpa(ndd, nd_label);
1638		pmem_end = pmem_start + nsl_get_rawsize(ndd, nd_label);
1639		if (pmem_start >= hw_start && pmem_start < hw_end
1640				&& pmem_end <= hw_end && pmem_end > hw_start)
1641			/* pass */;
1642		else {
1643			dev_dbg(&nd_region->dev, "%s invalid label for %pUb\n",
1644				dev_name(ndd->dev),
1645				nsl_uuid_raw(ndd, nd_label));
1646			return -EINVAL;
1647		}
1648
1649		/* move recently validated label to the front of the list */
1650		list_move(&label_ent->list, &nd_mapping->labels);
1651	}
1652	return 0;
1653}
1654
1655/**
1656 * create_namespace_pmem - validate interleave set labelling, retrieve label0
1657 * @nd_region: region with mappings to validate
1658 * @nd_mapping: container of dpa-resource-root + labels
1659 * @nd_label: target pmem namespace label to evaluate
 *
 * Returns: the created namespace device on success or ERR_PTR(-errno) on error
1660 */
1661static struct device *create_namespace_pmem(struct nd_region *nd_region,
1662					    struct nd_mapping *nd_mapping,
1663					    struct nd_namespace_label *nd_label)
1664{
1665	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1666	struct nd_namespace_index *nsindex =
1667		to_namespace_index(ndd, ndd->ns_current);
1668	u64 cookie = nd_region_interleave_set_cookie(nd_region, nsindex);
1669	u64 altcookie = nd_region_interleave_set_altcookie(nd_region);
1670	struct nd_label_ent *label_ent;
1671	struct nd_namespace_pmem *nspm;
1672	resource_size_t size = 0;
1673	struct resource *res;
1674	struct device *dev;
1675	uuid_t uuid;
1676	int rc = 0;
1677	u16 i;
1678
1679	if (cookie == 0) {
1680		dev_dbg(&nd_region->dev, "invalid interleave-set-cookie\n");
1681		return ERR_PTR(-ENXIO);
1682	}
1683
1684	if (!nsl_validate_isetcookie(ndd, nd_label, cookie)) {
1685		dev_dbg(&nd_region->dev, "invalid cookie in label: %pUb\n",
1686			nsl_uuid_raw(ndd, nd_label));
1687		if (!nsl_validate_isetcookie(ndd, nd_label, altcookie))
1688			return ERR_PTR(-EAGAIN);
1689
1690		dev_dbg(&nd_region->dev, "valid altcookie in label: %pUb\n",
1691			nsl_uuid_raw(ndd, nd_label));
1692	}
1693
1694	nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
1695	if (!nspm)
1696		return ERR_PTR(-ENOMEM);
1697
1698	nspm->id = -1;
1699	dev = &nspm->nsio.common.dev;
1700	dev->type = &namespace_pmem_device_type;
1701	dev->parent = &nd_region->dev;
1702	res = &nspm->nsio.res;
1703	res->name = dev_name(&nd_region->dev);
1704	res->flags = IORESOURCE_MEM;
1705
1706	for (i = 0; i < nd_region->ndr_mappings; i++) {
1707		nsl_get_uuid(ndd, nd_label, &uuid);
1708		if (has_uuid_at_pos(nd_region, &uuid, cookie, i))
1709			continue;
1710		if (has_uuid_at_pos(nd_region, &uuid, altcookie, i))
1711			continue;
1712		break;
1713	}
1714
1715	if (i < nd_region->ndr_mappings) {
1716		struct nvdimm *nvdimm = nd_region->mapping[i].nvdimm;
1717
1718		/*
1719		 * Give up if we don't find an instance of a uuid at each
1720		 * position (from 0 to nd_region->ndr_mappings - 1), or if we
1721		 * find a dimm with two instances of the same uuid.
1722		 */
1723		dev_err(&nd_region->dev, "%s missing label for %pUb\n",
1724			nvdimm_name(nvdimm), nsl_uuid_raw(ndd, nd_label));
1725		rc = -EINVAL;
1726		goto err;
1727	}
1728
1729	/*
1730	 * Fix up each mapping's 'labels' to have the validated pmem label for
1731	 * that position at labels[0], and NULL at labels[1].  In the process,
1732	 * check that the namespace aligns with the interleave set.
1733	 */
1734	nsl_get_uuid(ndd, nd_label, &uuid);
1735	rc = select_pmem_id(nd_region, &uuid);
1736	if (rc)
1737		goto err;
1738
1739	/* Calculate total size and populate namespace properties from label0 */
1740	for (i = 0; i < nd_region->ndr_mappings; i++) {
1741		struct nd_namespace_label *label0;
1742		struct nvdimm_drvdata *ndd;
1743
1744		nd_mapping = &nd_region->mapping[i];
1745		label_ent = list_first_entry_or_null(&nd_mapping->labels,
1746				typeof(*label_ent), list);
1747		label0 = label_ent ? label_ent->label : NULL;
1748
1749		if (!label0) {
1750			WARN_ON(1);
1751			continue;
1752		}
1753
1754		ndd = to_ndd(nd_mapping);
1755		size += nsl_get_rawsize(ndd, label0);
1756		if (nsl_get_position(ndd, label0) != 0)
1757			continue;
1758		WARN_ON(nspm->alt_name || nspm->uuid);
1759		nspm->alt_name = kmemdup(nsl_ref_name(ndd, label0),
1760					 NSLABEL_NAME_LEN, GFP_KERNEL);
1761		nsl_get_uuid(ndd, label0, &uuid);
1762		nspm->uuid = kmemdup(&uuid, sizeof(uuid_t), GFP_KERNEL);
1763		nspm->lbasize = nsl_get_lbasize(ndd, label0);
1764		nspm->nsio.common.claim_class =
1765			nsl_get_claim_class(ndd, label0);
1766	}
1767
1768	if (!nspm->alt_name || !nspm->uuid) {
1769		rc = -ENOMEM;
1770		goto err;
1771	}
1772
1773	nd_namespace_pmem_set_resource(nd_region, nspm, size);
1774
1775	return dev;
1776 err:
1777	namespace_pmem_release(dev);
1778	switch (rc) {
1779	case -EINVAL:
1780		dev_dbg(&nd_region->dev, "invalid label(s)\n");
1781		break;
1782	case -ENODEV:
1783		dev_dbg(&nd_region->dev, "label not found\n");
1784		break;
1785	default:
1786		dev_dbg(&nd_region->dev, "unexpected err: %d\n", rc);
1787		break;
1788	}
1789	return ERR_PTR(rc);
1790}
1791
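/*
 * Added commentary (not in the original source): allocate a zero-sized
 * pmem namespace to act as the region's provisioning seed; userspace
 * grows it into a usable namespace by configuring a uuid and size.
 */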
1792static struct device *nd_namespace_pmem_create(struct nd_region *nd_region)
1793{
1794	struct nd_namespace_pmem *nspm;
1795	struct resource *res;
1796	struct device *dev;
1797
1798	if (!is_memory(&nd_region->dev))
1799		return NULL;
1800
1801	nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
1802	if (!nspm)
1803		return NULL;
1804
1805	dev = &nspm->nsio.common.dev;
1806	dev->type = &namespace_pmem_device_type;
1807	dev->parent = &nd_region->dev;
1808	res = &nspm->nsio.res;
1809	res->name = dev_name(&nd_region->dev);
1810	res->flags = IORESOURCE_MEM;
1811
1812	nspm->id = ida_alloc(&nd_region->ns_ida, GFP_KERNEL);
1813	if (nspm->id < 0) {
1814		kfree(nspm);
1815		return NULL;
1816	}
1817	dev_set_name(dev, "namespace%d.%d", nd_region->id, nspm->id);
1818	nd_namespace_pmem_set_resource(nd_region, nspm, 0);
1819
1820	return dev;
1821}
1822
1823static struct lock_class_key nvdimm_namespace_key;
1824
1825void nd_region_create_ns_seed(struct nd_region *nd_region)
1826{
1827	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1828
1829	if (nd_region_to_nstype(nd_region) == ND_DEVICE_NAMESPACE_IO)
1830		return;
1831
1832	nd_region->ns_seed = nd_namespace_pmem_create(nd_region);
1833
1834	/*
1835	 * Seed creation failures are not fatal; provisioning is simply
1836	 * disabled until memory becomes available
1837	 */
1838	if (!nd_region->ns_seed)
1839		dev_err(&nd_region->dev, "failed to create namespace\n");
1840	else {
1841		device_initialize(nd_region->ns_seed);
1842		lockdep_set_class(&nd_region->ns_seed->mutex,
1843				  &nvdimm_namespace_key);
1844		nd_device_register(nd_region->ns_seed);
1845	}
1846}
1847
1848void nd_region_create_dax_seed(struct nd_region *nd_region)
1849{
1850	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1851	nd_region->dax_seed = nd_dax_create(nd_region);
1852	/*
1853	 * Seed creation failures are not fatal; provisioning is simply
1854	 * disabled until memory becomes available
1855	 */
1856	if (!nd_region->dax_seed)
1857		dev_err(&nd_region->dev, "failed to create dax namespace\n");
1858}
1859
1860void nd_region_create_pfn_seed(struct nd_region *nd_region)
1861{
1862	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1863	nd_region->pfn_seed = nd_pfn_create(nd_region);
1864	/*
1865	 * Seed creation failures are not fatal; provisioning is simply
1866	 * disabled until memory becomes available
1867	 */
1868	if (!nd_region->pfn_seed)
1869		dev_err(&nd_region->dev, "failed to create pfn namespace\n");
1870}
1871
1872void nd_region_create_btt_seed(struct nd_region *nd_region)
1873{
1874	WARN_ON(!is_nvdimm_bus_locked(&nd_region->dev));
1875	nd_region->btt_seed = nd_btt_create(nd_region);
1876	/*
1877	 * Seed creation failures are not fatal; provisioning is simply
1878	 * disabled until memory becomes available
1879	 */
1880	if (!nd_region->btt_seed)
1881		dev_err(&nd_region->dev, "failed to create btt namespace\n");
1882}
1883
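/*
 * Added commentary (not in the original source): reject @nd_label if
 * one of the namespaces already collected in @devs carries the same
 * uuid, since a pmem uuid may only claim a single extent.  Returns
 * @count when the uuid is new, or -ENXIO on a conflict.
 */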
1884static int add_namespace_resource(struct nd_region *nd_region,
1885		struct nd_namespace_label *nd_label, struct device **devs,
1886		int count)
1887{
1888	struct nd_mapping *nd_mapping = &nd_region->mapping[0];
1889	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1890	int i;
1891
1892	for (i = 0; i < count; i++) {
1893		uuid_t *uuid = namespace_to_uuid(devs[i]);
1894
1895		if (IS_ERR(uuid)) {
1896			WARN_ON(1);
1897			continue;
1898		}
1899
1900		if (!nsl_uuid_equal(ndd, nd_label, uuid))
1901			continue;
1902		dev_err(&nd_region->dev,
1903			"error: conflicting extents for uuid: %pUb\n", uuid);
1904		return -ENXIO;
1905	}
1906
1907	return i;
1908}
1909
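/* sort() comparator: order pmem namespaces by the start of their range */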
1910static int cmp_dpa(const void *a, const void *b)
1911{
1912	const struct device *dev_a = *(const struct device **) a;
1913	const struct device *dev_b = *(const struct device **) b;
1914	struct nd_namespace_pmem *nspm_a, *nspm_b;
1915
1916	if (is_namespace_io(dev_a))
1917		return 0;
1918
1919	nspm_a = to_nd_namespace_pmem(dev_a);
1920	nspm_b = to_nd_namespace_pmem(dev_b);
1921
1922	return memcmp(&nspm_a->nsio.res.start, &nspm_b->nsio.res.start,
1923			sizeof(resource_size_t));
1924}
1925
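/*
 * Added commentary (not in the original source): instantiate a
 * namespace device for each valid interleave-set label found in the
 * region's first mapping.  When no label validates, publish a single
 * zero-sized seed namespace instead.  Returns a NULL-terminated device
 * array, or NULL on allocation failure.
 */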
1926static struct device **scan_labels(struct nd_region *nd_region)
1927{
1928	int i, count = 0;
1929	struct device *dev, **devs = NULL;
1930	struct nd_label_ent *label_ent, *e;
1931	struct nd_mapping *nd_mapping = &nd_region->mapping[0];
1932	struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
1933	resource_size_t map_end = nd_mapping->start + nd_mapping->size - 1;
1934
1935	/* "safe" because create_namespace_pmem() might list_move() label_ent */
1936	list_for_each_entry_safe(label_ent, e, &nd_mapping->labels, list) {
1937		struct nd_namespace_label *nd_label = label_ent->label;
1938		struct device **__devs;
1939
1940		if (!nd_label)
1941			continue;
1942
1943		/* skip labels that describe extents outside of the region */
1944		if (nsl_get_dpa(ndd, nd_label) < nd_mapping->start ||
1945		    nsl_get_dpa(ndd, nd_label) > map_end)
1946			continue;
1947
1948		i = add_namespace_resource(nd_region, nd_label, devs, count);
1949		if (i < 0)
1950			goto err;
1951		if (i < count)
1952			continue;
1953		__devs = kcalloc(count + 2, sizeof(dev), GFP_KERNEL);
1954		if (!__devs)
1955			goto err;
1956		memcpy(__devs, devs, sizeof(dev) * count);
1957		kfree(devs);
1958		devs = __devs;
1959
1960		dev = create_namespace_pmem(nd_region, nd_mapping, nd_label);
1961		if (IS_ERR(dev)) {
1962			switch (PTR_ERR(dev)) {
1963			case -EAGAIN:
1964				/* skip invalid labels */
1965				continue;
1966			case -ENODEV:
1967				/* fallthrough to seed creation */
1968				break;
1969			default:
1970				goto err;
1971			}
1972		} else
1973			devs[count++] = dev;
1974
1975	}
1976
1977	dev_dbg(&nd_region->dev, "discovered %d namespace%s\n", count,
1978		count == 1 ? "" : "s");
1979
1980	if (count == 0) {
1981		struct nd_namespace_pmem *nspm;
1982
1983		/* Publish a zero-sized namespace for userspace to configure. */
1984		nd_mapping_free_labels(nd_mapping);
1985
1986		devs = kcalloc(2, sizeof(dev), GFP_KERNEL);
1987		if (!devs)
1988			goto err;
1989
1990		nspm = kzalloc(sizeof(*nspm), GFP_KERNEL);
1991		if (!nspm)
1992			goto err;
1993		dev = &nspm->nsio.common.dev;
1994		dev->type = &namespace_pmem_device_type;
1995		nd_namespace_pmem_set_resource(nd_region, nspm, 0);
1996		dev->parent = &nd_region->dev;
1997		devs[count++] = dev;
1998	} else if (is_memory(&nd_region->dev)) {
1999		/* clean unselected labels */
2000		for (i = 0; i < nd_region->ndr_mappings; i++) {
2001			struct list_head *l, *e;
2002			LIST_HEAD(list);
2003			int j;
2004
2005			nd_mapping = &nd_region->mapping[i];
2006			if (list_empty(&nd_mapping->labels)) {
2007				WARN_ON(1);
2008				continue;
2009			}
2010
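			/*
			 * Added commentary (not in the original source):
			 * select_pmem_id() moved each validated label to
			 * the head of its list; keep the first @count
			 * entries and free the rest as stale.
			 */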
2011			j = count;
2012			list_for_each_safe(l, e, &nd_mapping->labels) {
2013				if (!j--)
2014					break;
2015				list_move_tail(l, &list);
2016			}
2017			nd_mapping_free_labels(nd_mapping);
2018			list_splice_init(&list, &nd_mapping->labels);
2019		}
2020	}
2021
2022	if (count > 1)
2023		sort(devs, count, sizeof(struct device *), cmp_dpa, NULL);
2024
2025	return devs;
2026
2027 err:
2028	if (devs) {
2029		for (i = 0; devs[i]; i++)
2030			namespace_pmem_release(devs[i]);
2031		kfree(devs);
2032	}
2033	return NULL;
2034}
2035
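/*
 * Added commentary (not in the original source): take every mapping
 * lock in index order (annotated for lockdep), scan the labels, then
 * release the locks in reverse order.
 */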
2036static struct device **create_namespaces(struct nd_region *nd_region)
2037{
2038	struct nd_mapping *nd_mapping;
2039	struct device **devs;
2040	int i;
2041
2042	if (nd_region->ndr_mappings == 0)
2043		return NULL;
2044
2045	/* lock down all mappings while we scan labels */
2046	for (i = 0; i < nd_region->ndr_mappings; i++) {
2047		nd_mapping = &nd_region->mapping[i];
2048		mutex_lock_nested(&nd_mapping->lock, i);
2049	}
2050
2051	devs = scan_labels(nd_region);
2052
2053	for (i = 0; i < nd_region->ndr_mappings; i++) {
2054		int reverse = nd_region->ndr_mappings - 1 - i;
2055
2056		nd_mapping = &nd_region->mapping[reverse];
2057		mutex_unlock(&nd_mapping->lock);
2058	}
2059
2060	return devs;
2061}
2062
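/*
 * Added commentary (not in the original source): undo
 * init_active_labels() by freeing each mapping's label list, dropping
 * the reference on the DIMM's label data, and clearing the DIMM busy
 * count taken at activation.
 */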
2063static void deactivate_labels(void *region)
2064{
2065	struct nd_region *nd_region = region;
2066	int i;
2067
2068	for (i = 0; i < nd_region->ndr_mappings; i++) {
2069		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
2070		struct nvdimm_drvdata *ndd = nd_mapping->ndd;
2071		struct nvdimm *nvdimm = nd_mapping->nvdimm;
2072
2073		mutex_lock(&nd_mapping->lock);
2074		nd_mapping_free_labels(nd_mapping);
2075		mutex_unlock(&nd_mapping->lock);
2076
2077		put_ndd(ndd);
2078		nd_mapping->ndd = NULL;
2079		if (ndd)
2080			atomic_dec(&nvdimm->busy);
2081	}
2082}
2083
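/*
 * Added commentary (not in the original source): pin each DIMM's label
 * data and build the per-mapping lists of active labels.  Fails if a
 * DIMM is locked or requires labels that cannot be read; otherwise
 * deactivate_labels() is registered as a devm action to undo this on
 * region teardown.
 */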
2084static int init_active_labels(struct nd_region *nd_region)
2085{
2086	int i, rc = 0;
2087
2088	for (i = 0; i < nd_region->ndr_mappings; i++) {
2089		struct nd_mapping *nd_mapping = &nd_region->mapping[i];
2090		struct nvdimm_drvdata *ndd = to_ndd(nd_mapping);
2091		struct nvdimm *nvdimm = nd_mapping->nvdimm;
2092		struct nd_label_ent *label_ent;
2093		int count, j;
2094
2095		/*
2096		 * If the dimm is disabled then we may need to prevent
2097		 * the region from being activated.
2098		 */
2099		if (!ndd) {
2100			if (test_bit(NDD_LOCKED, &nvdimm->flags))
2101				/* fail, label data may be unreadable */;
2102			else if (test_bit(NDD_LABELING, &nvdimm->flags))
2103				/* fail, labels needed to disambiguate dpa */;
2104			else
2105				continue;
2106
2107			dev_err(&nd_region->dev, "%s: is %s, failing probe\n",
2108					dev_name(&nd_mapping->nvdimm->dev),
2109					test_bit(NDD_LOCKED, &nvdimm->flags)
2110					? "locked" : "disabled");
2111			rc = -ENXIO;
2112			goto out;
2113		}
2114		nd_mapping->ndd = ndd;
2115		atomic_inc(&nvdimm->busy);
2116		get_ndd(ndd);
2117
2118		count = nd_label_active_count(ndd);
2119		dev_dbg(ndd->dev, "count: %d\n", count);
2120		if (!count)
2121			continue;
2122		for (j = 0; j < count; j++) {
2123			struct nd_namespace_label *label;
2124
2125			label_ent = kzalloc(sizeof(*label_ent), GFP_KERNEL);
2126			if (!label_ent)
2127				break;
2128			label = nd_label_active(ndd, j);
2129			label_ent->label = label;
2130
2131			mutex_lock(&nd_mapping->lock);
2132			list_add_tail(&label_ent->list, &nd_mapping->labels);
2133			mutex_unlock(&nd_mapping->lock);
2134		}
2135
2136		if (j < count)
2137			break;
2138	}
2139
2140	if (i < nd_region->ndr_mappings)
2141		rc = -ENOMEM;
2142
2143out:
2144	if (rc) {
2145		deactivate_labels(nd_region);
2146		return rc;
2147	}
2148
2149	return devm_add_action_or_reset(&nd_region->dev, deactivate_labels,
2150					nd_region);
2151}
2152
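/*
 * Added commentary (not in the original source): discover and register
 * the namespace devices for @nd_region.  Returns the number of
 * namespaces registered, with @err set to the number that failed
 * registration, or a negative errno if the region cannot be activated.
 */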
2153int nd_region_register_namespaces(struct nd_region *nd_region, int *err)
2154{
2155	struct device **devs = NULL;
2156	int i, rc = 0, type;
2157
2158	*err = 0;
2159	nvdimm_bus_lock(&nd_region->dev);
2160	rc = init_active_labels(nd_region);
2161	if (rc) {
2162		nvdimm_bus_unlock(&nd_region->dev);
2163		return rc;
2164	}
2165
2166	type = nd_region_to_nstype(nd_region);
2167	switch (type) {
2168	case ND_DEVICE_NAMESPACE_IO:
2169		devs = create_namespace_io(nd_region);
2170		break;
2171	case ND_DEVICE_NAMESPACE_PMEM:
2172		devs = create_namespaces(nd_region);
2173		break;
2174	default:
2175		break;
2176	}
2177	nvdimm_bus_unlock(&nd_region->dev);
2178
2179	if (!devs)
2180		return -ENODEV;
2181
2182	for (i = 0; devs[i]; i++) {
2183		struct device *dev = devs[i];
2184		int id;
2185
2186		if (type == ND_DEVICE_NAMESPACE_PMEM) {
2187			struct nd_namespace_pmem *nspm;
2188
2189			nspm = to_nd_namespace_pmem(dev);
2190			id = ida_alloc(&nd_region->ns_ida, GFP_KERNEL);
2192			nspm->id = id;
2193		} else
2194			id = i;
2195
2196		if (id < 0)
2197			break;
2198		dev_set_name(dev, "namespace%d.%d", nd_region->id, id);
2199		device_initialize(dev);
2200		lockdep_set_class(&dev->mutex, &nvdimm_namespace_key);
2201		nd_device_register(dev);
2202	}
2203	if (i)
2204		nd_region->ns_seed = devs[0];
2205
2206	if (devs[i]) {
2207		int j;
2208
2209		for (j = i; devs[j]; j++) {
2210			struct device *dev = devs[j];
2211
2212			device_initialize(dev);
2213			put_device(dev);
2214		}
2215		*err = j - i;
2216		/*
2217		 * All of the namespaces we tried to register failed, so
2218		 * fail region activation.
2219		 */
2220		if (*err == 0)
2221			rc = -ENODEV;
2222	}
2223	kfree(devs);
2224
2225	if (rc == -ENODEV)
2226		return rc;
2227
2228	return i;
2229}