Linux Audio

Check our new training course

Loading...
v4.17
   1/* ds.c: Domain Services driver for Logical Domains
   2 *
   3 * Copyright (C) 2007, 2008 David S. Miller <davem@davemloft.net>
   4 */
   5
   6#include <linux/kernel.h>
   7#include <linux/module.h>
   8#include <linux/types.h>
   9#include <linux/string.h>
  10#include <linux/slab.h>
  11#include <linux/sched.h>
  12#include <linux/sched/clock.h>
  13#include <linux/delay.h>
  14#include <linux/mutex.h>
  15#include <linux/kthread.h>
  16#include <linux/reboot.h>
  17#include <linux/cpu.h>
  18
  19#include <asm/hypervisor.h>
  20#include <asm/ldc.h>
  21#include <asm/vio.h>
  22#include <asm/mdesc.h>
  23#include <asm/head.h>
  24#include <asm/irq.h>
  25
  26#include "kernel.h"
  27
  28#define DRV_MODULE_NAME		"ds"
  29#define PFX DRV_MODULE_NAME	": "
  30#define DRV_MODULE_VERSION	"1.0"
  31#define DRV_MODULE_RELDATE	"Jul 11, 2007"
  32
  33static char version[] =
  34	DRV_MODULE_NAME ".c:v" DRV_MODULE_VERSION " (" DRV_MODULE_RELDATE ")\n";
  35MODULE_AUTHOR("David S. Miller (davem@davemloft.net)");
  36MODULE_DESCRIPTION("Sun LDOM domain services driver");
  37MODULE_LICENSE("GPL");
  38MODULE_VERSION(DRV_MODULE_VERSION);
  39
  40struct ds_msg_tag {
  41	__u32			type;
  42#define DS_INIT_REQ		0x00
  43#define DS_INIT_ACK		0x01
  44#define DS_INIT_NACK		0x02
  45#define DS_REG_REQ		0x03
  46#define DS_REG_ACK		0x04
  47#define DS_REG_NACK		0x05
  48#define DS_UNREG_REQ		0x06
  49#define DS_UNREG_ACK		0x07
  50#define DS_UNREG_NACK		0x08
  51#define DS_DATA			0x09
  52#define DS_NACK			0x0a
  53
  54	__u32			len;
  55};
  56
  57/* Result codes */
  58#define DS_OK			0x00
  59#define DS_REG_VER_NACK		0x01
  60#define DS_REG_DUP		0x02
  61#define DS_INV_HDL		0x03
  62#define DS_TYPE_UNKNOWN		0x04
  63
  64struct ds_version {
  65	__u16			major;
  66	__u16			minor;
  67};
  68
  69struct ds_ver_req {
  70	struct ds_msg_tag	tag;
  71	struct ds_version	ver;
  72};
  73
  74struct ds_ver_ack {
  75	struct ds_msg_tag	tag;
  76	__u16			minor;
  77};
  78
  79struct ds_ver_nack {
  80	struct ds_msg_tag	tag;
  81	__u16			major;
  82};
  83
  84struct ds_reg_req {
  85	struct ds_msg_tag	tag;
  86	__u64			handle;
  87	__u16			major;
  88	__u16			minor;
  89	char			svc_id[0];
  90};
  91
  92struct ds_reg_ack {
  93	struct ds_msg_tag	tag;
  94	__u64			handle;
  95	__u16			minor;
  96};
  97
  98struct ds_reg_nack {
  99	struct ds_msg_tag	tag;
 100	__u64			handle;
 101	__u16			major;
 102};
 103
 104struct ds_unreg_req {
 105	struct ds_msg_tag	tag;
 106	__u64			handle;
 107};
 108
 109struct ds_unreg_ack {
 110	struct ds_msg_tag	tag;
 111	__u64			handle;
 112};
 113
 114struct ds_unreg_nack {
 115	struct ds_msg_tag	tag;
 116	__u64			handle;
 117};
 118
 119struct ds_data {
 120	struct ds_msg_tag	tag;
 121	__u64			handle;
 122};
 123
 124struct ds_data_nack {
 125	struct ds_msg_tag	tag;
 126	__u64			handle;
 127	__u64			result;
 128};
 129
 130struct ds_info;
 131struct ds_cap_state {
 132	__u64			handle;
 133
 134	void			(*data)(struct ds_info *dp,
 135					struct ds_cap_state *cp,
 136					void *buf, int len);
 137
 138	const char		*service_id;
 139
 140	u8			state;
 141#define CAP_STATE_UNKNOWN	0x00
 142#define CAP_STATE_REG_SENT	0x01
 143#define CAP_STATE_REGISTERED	0x02
 144};
 145
 146static void md_update_data(struct ds_info *dp, struct ds_cap_state *cp,
 147			   void *buf, int len);
 148static void domain_shutdown_data(struct ds_info *dp,
 149				 struct ds_cap_state *cp,
 150				 void *buf, int len);
 151static void domain_panic_data(struct ds_info *dp,
 152			      struct ds_cap_state *cp,
 153			      void *buf, int len);
 154#ifdef CONFIG_HOTPLUG_CPU
 155static void dr_cpu_data(struct ds_info *dp,
 156			struct ds_cap_state *cp,
 157			void *buf, int len);
 158#endif
 159static void ds_pri_data(struct ds_info *dp,
 160			struct ds_cap_state *cp,
 161			void *buf, int len);
 162static void ds_var_data(struct ds_info *dp,
 163			struct ds_cap_state *cp,
 164			void *buf, int len);
 165
 166static struct ds_cap_state ds_states_template[] = {
 167	{
 168		.service_id	= "md-update",
 169		.data		= md_update_data,
 170	},
 171	{
 172		.service_id	= "domain-shutdown",
 173		.data		= domain_shutdown_data,
 174	},
 175	{
 176		.service_id	= "domain-panic",
 177		.data		= domain_panic_data,
 178	},
 179#ifdef CONFIG_HOTPLUG_CPU
 180	{
 181		.service_id	= "dr-cpu",
 182		.data		= dr_cpu_data,
 183	},
 184#endif
 185	{
 186		.service_id	= "pri",
 187		.data		= ds_pri_data,
 188	},
 189	{
 190		.service_id	= "var-config",
 191		.data		= ds_var_data,
 192	},
 193	{
 194		.service_id	= "var-config-backup",
 195		.data		= ds_var_data,
 196	},
 197};
 198
 199static DEFINE_SPINLOCK(ds_lock);
 200
 201struct ds_info {
 202	struct ldc_channel	*lp;
 203	u8			hs_state;
 204#define DS_HS_START		0x01
 205#define DS_HS_DONE		0x02
 206
 207	u64			id;
 208
 209	void			*rcv_buf;
 210	int			rcv_buf_len;
 211
 212	struct ds_cap_state	*ds_states;
 213	int			num_ds_states;
 214
 215	struct ds_info		*next;
 216};
 217
 218static struct ds_info *ds_info_list;
 219
 220static struct ds_cap_state *find_cap(struct ds_info *dp, u64 handle)
 221{
 222	unsigned int index = handle >> 32;
 223
 224	if (index >= dp->num_ds_states)
 225		return NULL;
 226	return &dp->ds_states[index];
 227}
 228
 229static struct ds_cap_state *find_cap_by_string(struct ds_info *dp,
 230					       const char *name)
 231{
 232	int i;
 233
 234	for (i = 0; i < dp->num_ds_states; i++) {
 235		if (strcmp(dp->ds_states[i].service_id, name))
 236			continue;
 237
 238		return &dp->ds_states[i];
 239	}
 240	return NULL;
 241}
 242
 243static int __ds_send(struct ldc_channel *lp, void *data, int len)
 244{
 245	int err, limit = 1000;
 246
 247	err = -EINVAL;
 248	while (limit-- > 0) {
 249		err = ldc_write(lp, data, len);
 250		if (!err || (err != -EAGAIN))
 251			break;
 252		udelay(1);
 253	}
 254
 255	return err;
 256}
 257
 258static int ds_send(struct ldc_channel *lp, void *data, int len)
 259{
 260	unsigned long flags;
 261	int err;
 262
 263	spin_lock_irqsave(&ds_lock, flags);
 264	err = __ds_send(lp, data, len);
 265	spin_unlock_irqrestore(&ds_lock, flags);
 266
 267	return err;
 268}
 269
 270struct ds_md_update_req {
 271	__u64				req_num;
 272};
 273
 274struct ds_md_update_res {
 275	__u64				req_num;
 276	__u32				result;
 277};
 278
 279static void md_update_data(struct ds_info *dp,
 280			   struct ds_cap_state *cp,
 281			   void *buf, int len)
 282{
 283	struct ldc_channel *lp = dp->lp;
 284	struct ds_data *dpkt = buf;
 285	struct ds_md_update_req *rp;
 286	struct {
 287		struct ds_data		data;
 288		struct ds_md_update_res	res;
 289	} pkt;
 290
 291	rp = (struct ds_md_update_req *) (dpkt + 1);
 292
 293	printk(KERN_INFO "ds-%llu: Machine description update.\n", dp->id);
 294
 295	mdesc_update();
 296
 297	memset(&pkt, 0, sizeof(pkt));
 298	pkt.data.tag.type = DS_DATA;
 299	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
 300	pkt.data.handle = cp->handle;
 301	pkt.res.req_num = rp->req_num;
 302	pkt.res.result = DS_OK;
 303
 304	ds_send(lp, &pkt, sizeof(pkt));
 305}
 306
 307struct ds_shutdown_req {
 308	__u64				req_num;
 309	__u32				ms_delay;
 310};
 311
 312struct ds_shutdown_res {
 313	__u64				req_num;
 314	__u32				result;
 315	char				reason[1];
 316};
 317
 318static void domain_shutdown_data(struct ds_info *dp,
 319				 struct ds_cap_state *cp,
 320				 void *buf, int len)
 321{
 322	struct ldc_channel *lp = dp->lp;
 323	struct ds_data *dpkt = buf;
 324	struct ds_shutdown_req *rp;
 325	struct {
 326		struct ds_data		data;
 327		struct ds_shutdown_res	res;
 328	} pkt;
 329
 330	rp = (struct ds_shutdown_req *) (dpkt + 1);
 331
 332	printk(KERN_ALERT "ds-%llu: Shutdown request from "
 333	       "LDOM manager received.\n", dp->id);
 334
 335	memset(&pkt, 0, sizeof(pkt));
 336	pkt.data.tag.type = DS_DATA;
 337	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
 338	pkt.data.handle = cp->handle;
 339	pkt.res.req_num = rp->req_num;
 340	pkt.res.result = DS_OK;
 341	pkt.res.reason[0] = 0;
 342
 343	ds_send(lp, &pkt, sizeof(pkt));
 344
 345	orderly_poweroff(true);
 346}
 347
 348struct ds_panic_req {
 349	__u64				req_num;
 350};
 351
 352struct ds_panic_res {
 353	__u64				req_num;
 354	__u32				result;
 355	char				reason[1];
 356};
 357
 358static void domain_panic_data(struct ds_info *dp,
 359			      struct ds_cap_state *cp,
 360			      void *buf, int len)
 361{
 362	struct ldc_channel *lp = dp->lp;
 363	struct ds_data *dpkt = buf;
 364	struct ds_panic_req *rp;
 365	struct {
 366		struct ds_data		data;
 367		struct ds_panic_res	res;
 368	} pkt;
 369
 370	rp = (struct ds_panic_req *) (dpkt + 1);
 371
 372	printk(KERN_ALERT "ds-%llu: Panic request from "
 373	       "LDOM manager received.\n", dp->id);
 374
 375	memset(&pkt, 0, sizeof(pkt));
 376	pkt.data.tag.type = DS_DATA;
 377	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
 378	pkt.data.handle = cp->handle;
 379	pkt.res.req_num = rp->req_num;
 380	pkt.res.result = DS_OK;
 381	pkt.res.reason[0] = 0;
 382
 383	ds_send(lp, &pkt, sizeof(pkt));
 384
 385	panic("PANIC requested by LDOM manager.");
 386}
 387
 388#ifdef CONFIG_HOTPLUG_CPU
 389struct dr_cpu_tag {
 390	__u64				req_num;
 391	__u32				type;
 392#define DR_CPU_CONFIGURE		0x43
 393#define DR_CPU_UNCONFIGURE		0x55
 394#define DR_CPU_FORCE_UNCONFIGURE	0x46
 395#define DR_CPU_STATUS			0x53
 396
 397/* Responses */
 398#define DR_CPU_OK			0x6f
 399#define DR_CPU_ERROR			0x65
 400
 401	__u32				num_records;
 402};
 403
 404struct dr_cpu_resp_entry {
 405	__u32				cpu;
 406	__u32				result;
 407#define DR_CPU_RES_OK			0x00
 408#define DR_CPU_RES_FAILURE		0x01
 409#define DR_CPU_RES_BLOCKED		0x02
 410#define DR_CPU_RES_CPU_NOT_RESPONDING	0x03
 411#define DR_CPU_RES_NOT_IN_MD		0x04
 412
 413	__u32				stat;
 414#define DR_CPU_STAT_NOT_PRESENT		0x00
 415#define DR_CPU_STAT_UNCONFIGURED	0x01
 416#define DR_CPU_STAT_CONFIGURED		0x02
 417
 418	__u32				str_off;
 419};
 420
 421static void __dr_cpu_send_error(struct ds_info *dp,
 422				struct ds_cap_state *cp,
 423				struct ds_data *data)
 424{
 425	struct dr_cpu_tag *tag = (struct dr_cpu_tag *) (data + 1);
 426	struct {
 427		struct ds_data		data;
 428		struct dr_cpu_tag	tag;
 429	} pkt;
 430	int msg_len;
 431
 432	memset(&pkt, 0, sizeof(pkt));
 433	pkt.data.tag.type = DS_DATA;
 434	pkt.data.handle = cp->handle;
 435	pkt.tag.req_num = tag->req_num;
 436	pkt.tag.type = DR_CPU_ERROR;
 437	pkt.tag.num_records = 0;
 438
 439	msg_len = (sizeof(struct ds_data) +
 440		   sizeof(struct dr_cpu_tag));
 441
 442	pkt.data.tag.len = msg_len - sizeof(struct ds_msg_tag);
 443
 444	__ds_send(dp->lp, &pkt, msg_len);
 445}
 446
 447static void dr_cpu_send_error(struct ds_info *dp,
 448			      struct ds_cap_state *cp,
 449			      struct ds_data *data)
 450{
 451	unsigned long flags;
 452
 453	spin_lock_irqsave(&ds_lock, flags);
 454	__dr_cpu_send_error(dp, cp, data);
 455	spin_unlock_irqrestore(&ds_lock, flags);
 456}
 457
 458#define CPU_SENTINEL	0xffffffff
 459
 460static void purge_dups(u32 *list, u32 num_ents)
 461{
 462	unsigned int i;
 463
 464	for (i = 0; i < num_ents; i++) {
 465		u32 cpu = list[i];
 466		unsigned int j;
 467
 468		if (cpu == CPU_SENTINEL)
 469			continue;
 470
 471		for (j = i + 1; j < num_ents; j++) {
 472			if (list[j] == cpu)
 473				list[j] = CPU_SENTINEL;
 474		}
 475	}
 476}
 477
 478static int dr_cpu_size_response(int ncpus)
 479{
 480	return (sizeof(struct ds_data) +
 481		sizeof(struct dr_cpu_tag) +
 482		(sizeof(struct dr_cpu_resp_entry) * ncpus));
 483}
 484
 485static void dr_cpu_init_response(struct ds_data *resp, u64 req_num,
 486				 u64 handle, int resp_len, int ncpus,
 487				 cpumask_t *mask, u32 default_stat)
 488{
 489	struct dr_cpu_resp_entry *ent;
 490	struct dr_cpu_tag *tag;
 491	int i, cpu;
 492
 493	tag = (struct dr_cpu_tag *) (resp + 1);
 494	ent = (struct dr_cpu_resp_entry *) (tag + 1);
 495
 496	resp->tag.type = DS_DATA;
 497	resp->tag.len = resp_len - sizeof(struct ds_msg_tag);
 498	resp->handle = handle;
 499	tag->req_num = req_num;
 500	tag->type = DR_CPU_OK;
 501	tag->num_records = ncpus;
 502
 503	i = 0;
 504	for_each_cpu(cpu, mask) {
 505		ent[i].cpu = cpu;
 506		ent[i].result = DR_CPU_RES_OK;
 507		ent[i].stat = default_stat;
 508		i++;
 509	}
 510	BUG_ON(i != ncpus);
 511}
 512
 513static void dr_cpu_mark(struct ds_data *resp, int cpu, int ncpus,
 514			u32 res, u32 stat)
 515{
 516	struct dr_cpu_resp_entry *ent;
 517	struct dr_cpu_tag *tag;
 518	int i;
 519
 520	tag = (struct dr_cpu_tag *) (resp + 1);
 521	ent = (struct dr_cpu_resp_entry *) (tag + 1);
 522
 523	for (i = 0; i < ncpus; i++) {
 524		if (ent[i].cpu != cpu)
 525			continue;
 526		ent[i].result = res;
 527		ent[i].stat = stat;
 528		break;
 529	}
 530}
 531
 532static int dr_cpu_configure(struct ds_info *dp, struct ds_cap_state *cp,
 533			    u64 req_num, cpumask_t *mask)
 534{
 535	struct ds_data *resp;
 536	int resp_len, ncpus, cpu;
 537	unsigned long flags;
 538
 539	ncpus = cpumask_weight(mask);
 540	resp_len = dr_cpu_size_response(ncpus);
 541	resp = kzalloc(resp_len, GFP_KERNEL);
 542	if (!resp)
 543		return -ENOMEM;
 544
 545	dr_cpu_init_response(resp, req_num, cp->handle,
 546			     resp_len, ncpus, mask,
 547			     DR_CPU_STAT_CONFIGURED);
 548
 549	mdesc_populate_present_mask(mask);
 550	mdesc_fill_in_cpu_data(mask);
 551
 552	for_each_cpu(cpu, mask) {
 553		int err;
 554
 555		printk(KERN_INFO "ds-%llu: Starting cpu %d...\n",
 556		       dp->id, cpu);
 557		err = cpu_up(cpu);
 558		if (err) {
 559			__u32 res = DR_CPU_RES_FAILURE;
 560			__u32 stat = DR_CPU_STAT_UNCONFIGURED;
 561
 562			if (!cpu_present(cpu)) {
 563				/* CPU not present in MD */
 564				res = DR_CPU_RES_NOT_IN_MD;
 565				stat = DR_CPU_STAT_NOT_PRESENT;
 566			} else if (err == -ENODEV) {
 567				/* CPU did not call in successfully */
 568				res = DR_CPU_RES_CPU_NOT_RESPONDING;
 569			}
 570
 571			printk(KERN_INFO "ds-%llu: CPU startup failed err=%d\n",
 572			       dp->id, err);
 573			dr_cpu_mark(resp, cpu, ncpus, res, stat);
 574		}
 575	}
 576
 577	spin_lock_irqsave(&ds_lock, flags);
 578	__ds_send(dp->lp, resp, resp_len);
 579	spin_unlock_irqrestore(&ds_lock, flags);
 580
 581	kfree(resp);
 582
 583	/* Redistribute IRQs, taking into account the new cpus.  */
 584	fixup_irqs();
 585
 586	return 0;
 587}
 588
 589static int dr_cpu_unconfigure(struct ds_info *dp,
 590			      struct ds_cap_state *cp,
 591			      u64 req_num,
 592			      cpumask_t *mask)
 593{
 594	struct ds_data *resp;
 595	int resp_len, ncpus, cpu;
 596	unsigned long flags;
 597
 598	ncpus = cpumask_weight(mask);
 599	resp_len = dr_cpu_size_response(ncpus);
 600	resp = kzalloc(resp_len, GFP_KERNEL);
 601	if (!resp)
 602		return -ENOMEM;
 603
 604	dr_cpu_init_response(resp, req_num, cp->handle,
 605			     resp_len, ncpus, mask,
 606			     DR_CPU_STAT_UNCONFIGURED);
 607
 608	for_each_cpu(cpu, mask) {
 609		int err;
 610
 611		printk(KERN_INFO "ds-%llu: Shutting down cpu %d...\n",
 612		       dp->id, cpu);
 613		err = cpu_down(cpu);
 614		if (err)
 615			dr_cpu_mark(resp, cpu, ncpus,
 616				    DR_CPU_RES_FAILURE,
 617				    DR_CPU_STAT_CONFIGURED);
 618	}
 619
 620	spin_lock_irqsave(&ds_lock, flags);
 621	__ds_send(dp->lp, resp, resp_len);
 622	spin_unlock_irqrestore(&ds_lock, flags);
 623
 624	kfree(resp);
 625
 626	return 0;
 627}
 628
 629static void dr_cpu_data(struct ds_info *dp, struct ds_cap_state *cp, void *buf,
 630			int len)
 631{
 632	struct ds_data *data = buf;
 633	struct dr_cpu_tag *tag = (struct dr_cpu_tag *) (data + 1);
 634	u32 *cpu_list = (u32 *) (tag + 1);
 635	u64 req_num = tag->req_num;
 636	cpumask_t mask;
 637	unsigned int i;
 638	int err;
 639
 640	switch (tag->type) {
 641	case DR_CPU_CONFIGURE:
 642	case DR_CPU_UNCONFIGURE:
 643	case DR_CPU_FORCE_UNCONFIGURE:
 644		break;
 645
 646	default:
 647		dr_cpu_send_error(dp, cp, data);
 648		return;
 649	}
 650
 651	purge_dups(cpu_list, tag->num_records);
 652
 653	cpumask_clear(&mask);
 654	for (i = 0; i < tag->num_records; i++) {
 655		if (cpu_list[i] == CPU_SENTINEL)
 656			continue;
 657
 658		if (cpu_list[i] < nr_cpu_ids)
 659			cpumask_set_cpu(cpu_list[i], &mask);
 660	}
 661
 662	if (tag->type == DR_CPU_CONFIGURE)
 663		err = dr_cpu_configure(dp, cp, req_num, &mask);
 664	else
 665		err = dr_cpu_unconfigure(dp, cp, req_num, &mask);
 666
 667	if (err)
 668		dr_cpu_send_error(dp, cp, data);
 669}
 670#endif /* CONFIG_HOTPLUG_CPU */
 671
 672struct ds_pri_msg {
 673	__u64				req_num;
 674	__u64				type;
 675#define DS_PRI_REQUEST			0x00
 676#define DS_PRI_DATA			0x01
 677#define DS_PRI_UPDATE			0x02
 678};
 679
 680static void ds_pri_data(struct ds_info *dp,
 681			struct ds_cap_state *cp,
 682			void *buf, int len)
 683{
 684	struct ds_data *dpkt = buf;
 685	struct ds_pri_msg *rp;
 686
 687	rp = (struct ds_pri_msg *) (dpkt + 1);
 688
 689	printk(KERN_INFO "ds-%llu: PRI REQ [%llx:%llx], len=%d\n",
 690	       dp->id, rp->req_num, rp->type, len);
 691}
 692
 693struct ds_var_hdr {
 694	__u32				type;
 695#define DS_VAR_SET_REQ			0x00
 696#define DS_VAR_DELETE_REQ		0x01
 697#define DS_VAR_SET_RESP			0x02
 698#define DS_VAR_DELETE_RESP		0x03
 699};
 700
 701struct ds_var_set_msg {
 702	struct ds_var_hdr		hdr;
 703	char				name_and_value[0];
 704};
 705
 706struct ds_var_delete_msg {
 707	struct ds_var_hdr		hdr;
 708	char				name[0];
 709};
 710
 711struct ds_var_resp {
 712	struct ds_var_hdr		hdr;
 713	__u32				result;
 714#define DS_VAR_SUCCESS			0x00
 715#define DS_VAR_NO_SPACE			0x01
 716#define DS_VAR_INVALID_VAR		0x02
 717#define DS_VAR_INVALID_VAL		0x03
 718#define DS_VAR_NOT_PRESENT		0x04
 719};
 720
 721static DEFINE_MUTEX(ds_var_mutex);
 722static int ds_var_doorbell;
 723static int ds_var_response;
 724
 725static void ds_var_data(struct ds_info *dp,
 726			struct ds_cap_state *cp,
 727			void *buf, int len)
 728{
 729	struct ds_data *dpkt = buf;
 730	struct ds_var_resp *rp;
 731
 732	rp = (struct ds_var_resp *) (dpkt + 1);
 733
 734	if (rp->hdr.type != DS_VAR_SET_RESP &&
 735	    rp->hdr.type != DS_VAR_DELETE_RESP)
 736		return;
 737
 738	ds_var_response = rp->result;
 739	wmb();
 740	ds_var_doorbell = 1;
 741}
 742
 743void ldom_set_var(const char *var, const char *value)
 744{
 745	struct ds_cap_state *cp;
 746	struct ds_info *dp;
 747	unsigned long flags;
 748
 749	spin_lock_irqsave(&ds_lock, flags);
 750	cp = NULL;
 751	for (dp = ds_info_list; dp; dp = dp->next) {
 752		struct ds_cap_state *tmp;
 753
 754		tmp = find_cap_by_string(dp, "var-config");
 755		if (tmp && tmp->state == CAP_STATE_REGISTERED) {
 756			cp = tmp;
 757			break;
 758		}
 759	}
 760	if (!cp) {
 761		for (dp = ds_info_list; dp; dp = dp->next) {
 762			struct ds_cap_state *tmp;
 763
 764			tmp = find_cap_by_string(dp, "var-config-backup");
 765			if (tmp && tmp->state == CAP_STATE_REGISTERED) {
 766				cp = tmp;
 767				break;
 768			}
 769		}
 770	}
 771	spin_unlock_irqrestore(&ds_lock, flags);
 772
 773	if (cp) {
 774		union {
 775			struct {
 776				struct ds_data		data;
 777				struct ds_var_set_msg	msg;
 778			} header;
 779			char			all[512];
 780		} pkt;
 781		char  *base, *p;
 782		int msg_len, loops;
 783
 784		if (strlen(var) + strlen(value) + 2 >
 785		    sizeof(pkt) - sizeof(pkt.header)) {
 786			printk(KERN_ERR PFX
 787				"contents length: %zu, which more than max: %lu,"
 788				"so could not set (%s) variable to (%s).\n",
 789				strlen(var) + strlen(value) + 2,
 790				sizeof(pkt) - sizeof(pkt.header), var, value);
 791			return;
 792		}
 793
 794		memset(&pkt, 0, sizeof(pkt));
 795		pkt.header.data.tag.type = DS_DATA;
 796		pkt.header.data.handle = cp->handle;
 797		pkt.header.msg.hdr.type = DS_VAR_SET_REQ;
 798		base = p = &pkt.header.msg.name_and_value[0];
 799		strcpy(p, var);
 800		p += strlen(var) + 1;
 801		strcpy(p, value);
 802		p += strlen(value) + 1;
 803
 804		msg_len = (sizeof(struct ds_data) +
 805			   sizeof(struct ds_var_set_msg) +
 806			   (p - base));
 807		msg_len = (msg_len + 3) & ~3;
 808		pkt.header.data.tag.len = msg_len - sizeof(struct ds_msg_tag);
 809
 810		mutex_lock(&ds_var_mutex);
 811
 812		spin_lock_irqsave(&ds_lock, flags);
 813		ds_var_doorbell = 0;
 814		ds_var_response = -1;
 815
 816		__ds_send(dp->lp, &pkt, msg_len);
 817		spin_unlock_irqrestore(&ds_lock, flags);
 818
 819		loops = 1000;
 820		while (ds_var_doorbell == 0) {
 821			if (loops-- < 0)
 822				break;
 823			barrier();
 824			udelay(100);
 825		}
 826
 827		mutex_unlock(&ds_var_mutex);
 828
 829		if (ds_var_doorbell == 0 ||
 830		    ds_var_response != DS_VAR_SUCCESS)
 831			printk(KERN_ERR "ds-%llu: var-config [%s:%s] "
 832			       "failed, response(%d).\n",
 833			       dp->id, var, value,
 834			       ds_var_response);
 835	} else {
 836		printk(KERN_ERR PFX "var-config not registered so "
 837		       "could not set (%s) variable to (%s).\n",
 838		       var, value);
 839	}
 840}
 841
 842static char full_boot_str[256] __attribute__((aligned(32)));
 843static int reboot_data_supported;
 844
 845void ldom_reboot(const char *boot_command)
 846{
 847	/* Don't bother with any of this if the boot_command
 848	 * is empty.
 849	 */
 850	if (boot_command && strlen(boot_command)) {
 851		unsigned long len;
 852
 853		snprintf(full_boot_str, sizeof(full_boot_str), "boot %s",
 854			 boot_command);
 855		len = strlen(full_boot_str);
 856
 857		if (reboot_data_supported) {
 858			unsigned long ra = kimage_addr_to_ra(full_boot_str);
 859			unsigned long hv_ret;
 860
 861			hv_ret = sun4v_reboot_data_set(ra, len);
 862			if (hv_ret != HV_EOK)
 863				pr_err("SUN4V: Unable to set reboot data "
 864				       "hv_ret=%lu\n", hv_ret);
 865		} else {
 866			ldom_set_var("reboot-command", full_boot_str);
 867		}
 868	}
 869	sun4v_mach_sir();
 870}
 871
 872void ldom_power_off(void)
 873{
 874	sun4v_mach_exit(0);
 875}
 876
 877static void ds_conn_reset(struct ds_info *dp)
 878{
 879	printk(KERN_ERR "ds-%llu: ds_conn_reset() from %pf\n",
 880	       dp->id, __builtin_return_address(0));
 881}
 882
 883static int register_services(struct ds_info *dp)
 884{
 885	struct ldc_channel *lp = dp->lp;
 886	int i;
 887
 888	for (i = 0; i < dp->num_ds_states; i++) {
 889		struct {
 890			struct ds_reg_req req;
 891			u8 id_buf[256];
 892		} pbuf;
 893		struct ds_cap_state *cp = &dp->ds_states[i];
 894		int err, msg_len;
 895		u64 new_count;
 896
 897		if (cp->state == CAP_STATE_REGISTERED)
 898			continue;
 899
 900		new_count = sched_clock() & 0xffffffff;
 901		cp->handle = ((u64) i << 32) | new_count;
 902
 903		msg_len = (sizeof(struct ds_reg_req) +
 904			   strlen(cp->service_id));
 905
 906		memset(&pbuf, 0, sizeof(pbuf));
 907		pbuf.req.tag.type = DS_REG_REQ;
 908		pbuf.req.tag.len = (msg_len - sizeof(struct ds_msg_tag));
 909		pbuf.req.handle = cp->handle;
 910		pbuf.req.major = 1;
 911		pbuf.req.minor = 0;
 912		strcpy(pbuf.id_buf, cp->service_id);
 913
 914		err = __ds_send(lp, &pbuf, msg_len);
 915		if (err > 0)
 916			cp->state = CAP_STATE_REG_SENT;
 917	}
 918	return 0;
 919}
 920
 921static int ds_handshake(struct ds_info *dp, struct ds_msg_tag *pkt)
 922{
 923
 924	if (dp->hs_state == DS_HS_START) {
 925		if (pkt->type != DS_INIT_ACK)
 926			goto conn_reset;
 927
 928		dp->hs_state = DS_HS_DONE;
 929
 930		return register_services(dp);
 931	}
 932
 933	if (dp->hs_state != DS_HS_DONE)
 934		goto conn_reset;
 935
 936	if (pkt->type == DS_REG_ACK) {
 937		struct ds_reg_ack *ap = (struct ds_reg_ack *) pkt;
 938		struct ds_cap_state *cp = find_cap(dp, ap->handle);
 939
 940		if (!cp) {
 941			printk(KERN_ERR "ds-%llu: REG ACK for unknown "
 942			       "handle %llx\n", dp->id, ap->handle);
 943			return 0;
 944		}
 945		printk(KERN_INFO "ds-%llu: Registered %s service.\n",
 946		       dp->id, cp->service_id);
 947		cp->state = CAP_STATE_REGISTERED;
 948	} else if (pkt->type == DS_REG_NACK) {
 949		struct ds_reg_nack *np = (struct ds_reg_nack *) pkt;
 950		struct ds_cap_state *cp = find_cap(dp, np->handle);
 951
 952		if (!cp) {
 953			printk(KERN_ERR "ds-%llu: REG NACK for "
 954			       "unknown handle %llx\n",
 955			       dp->id, np->handle);
 956			return 0;
 957		}
 958		cp->state = CAP_STATE_UNKNOWN;
 959	}
 960
 961	return 0;
 962
 963conn_reset:
 964	ds_conn_reset(dp);
 965	return -ECONNRESET;
 966}
 967
 968static void __send_ds_nack(struct ds_info *dp, u64 handle)
 969{
 970	struct ds_data_nack nack = {
 971		.tag = {
 972			.type = DS_NACK,
 973			.len = (sizeof(struct ds_data_nack) -
 974				sizeof(struct ds_msg_tag)),
 975		},
 976		.handle = handle,
 977		.result = DS_INV_HDL,
 978	};
 979
 980	__ds_send(dp->lp, &nack, sizeof(nack));
 981}
 982
 983static LIST_HEAD(ds_work_list);
 984static DECLARE_WAIT_QUEUE_HEAD(ds_wait);
 985
 986struct ds_queue_entry {
 987	struct list_head		list;
 988	struct ds_info			*dp;
 989	int				req_len;
 990	int				__pad;
 991	u64				req[0];
 992};
 993
 994static void process_ds_work(void)
 995{
 996	struct ds_queue_entry *qp, *tmp;
 997	unsigned long flags;
 998	LIST_HEAD(todo);
 999
1000	spin_lock_irqsave(&ds_lock, flags);
1001	list_splice_init(&ds_work_list, &todo);
1002	spin_unlock_irqrestore(&ds_lock, flags);
1003
1004	list_for_each_entry_safe(qp, tmp, &todo, list) {
1005		struct ds_data *dpkt = (struct ds_data *) qp->req;
1006		struct ds_info *dp = qp->dp;
1007		struct ds_cap_state *cp = find_cap(dp, dpkt->handle);
1008		int req_len = qp->req_len;
1009
1010		if (!cp) {
1011			printk(KERN_ERR "ds-%llu: Data for unknown "
1012			       "handle %llu\n",
1013			       dp->id, dpkt->handle);
1014
1015			spin_lock_irqsave(&ds_lock, flags);
1016			__send_ds_nack(dp, dpkt->handle);
1017			spin_unlock_irqrestore(&ds_lock, flags);
1018		} else {
1019			cp->data(dp, cp, dpkt, req_len);
1020		}
1021
1022		list_del(&qp->list);
1023		kfree(qp);
1024	}
1025}
1026
1027static int ds_thread(void *__unused)
1028{
1029	DEFINE_WAIT(wait);
1030
1031	while (1) {
1032		prepare_to_wait(&ds_wait, &wait, TASK_INTERRUPTIBLE);
1033		if (list_empty(&ds_work_list))
1034			schedule();
1035		finish_wait(&ds_wait, &wait);
1036
1037		if (kthread_should_stop())
1038			break;
1039
1040		process_ds_work();
1041	}
1042
1043	return 0;
1044}
1045
1046static int ds_data(struct ds_info *dp, struct ds_msg_tag *pkt, int len)
1047{
1048	struct ds_data *dpkt = (struct ds_data *) pkt;
1049	struct ds_queue_entry *qp;
1050
1051	qp = kmalloc(sizeof(struct ds_queue_entry) + len, GFP_ATOMIC);
1052	if (!qp) {
1053		__send_ds_nack(dp, dpkt->handle);
1054	} else {
1055		qp->dp = dp;
1056		memcpy(&qp->req, pkt, len);
1057		list_add_tail(&qp->list, &ds_work_list);
1058		wake_up(&ds_wait);
1059	}
1060	return 0;
1061}
1062
1063static void ds_up(struct ds_info *dp)
1064{
1065	struct ldc_channel *lp = dp->lp;
1066	struct ds_ver_req req;
1067	int err;
1068
1069	req.tag.type = DS_INIT_REQ;
1070	req.tag.len = sizeof(req) - sizeof(struct ds_msg_tag);
1071	req.ver.major = 1;
1072	req.ver.minor = 0;
1073
1074	err = __ds_send(lp, &req, sizeof(req));
1075	if (err > 0)
1076		dp->hs_state = DS_HS_START;
1077}
1078
1079static void ds_reset(struct ds_info *dp)
1080{
1081	int i;
1082
1083	dp->hs_state = 0;
1084
1085	for (i = 0; i < dp->num_ds_states; i++) {
1086		struct ds_cap_state *cp = &dp->ds_states[i];
1087
1088		cp->state = CAP_STATE_UNKNOWN;
1089	}
1090}
1091
1092static void ds_event(void *arg, int event)
1093{
1094	struct ds_info *dp = arg;
1095	struct ldc_channel *lp = dp->lp;
1096	unsigned long flags;
1097	int err;
1098
1099	spin_lock_irqsave(&ds_lock, flags);
1100
1101	if (event == LDC_EVENT_UP) {
1102		ds_up(dp);
1103		spin_unlock_irqrestore(&ds_lock, flags);
1104		return;
1105	}
1106
1107	if (event == LDC_EVENT_RESET) {
1108		ds_reset(dp);
1109		spin_unlock_irqrestore(&ds_lock, flags);
1110		return;
1111	}
1112
1113	if (event != LDC_EVENT_DATA_READY) {
1114		printk(KERN_WARNING "ds-%llu: Unexpected LDC event %d\n",
1115		       dp->id, event);
1116		spin_unlock_irqrestore(&ds_lock, flags);
1117		return;
1118	}
1119
1120	err = 0;
1121	while (1) {
1122		struct ds_msg_tag *tag;
1123
1124		err = ldc_read(lp, dp->rcv_buf, sizeof(*tag));
1125
1126		if (unlikely(err < 0)) {
1127			if (err == -ECONNRESET)
1128				ds_conn_reset(dp);
1129			break;
1130		}
1131		if (err == 0)
1132			break;
1133
1134		tag = dp->rcv_buf;
1135		err = ldc_read(lp, tag + 1, tag->len);
1136
1137		if (unlikely(err < 0)) {
1138			if (err == -ECONNRESET)
1139				ds_conn_reset(dp);
1140			break;
1141		}
1142		if (err < tag->len)
1143			break;
1144
1145		if (tag->type < DS_DATA)
1146			err = ds_handshake(dp, dp->rcv_buf);
1147		else
1148			err = ds_data(dp, dp->rcv_buf,
1149				      sizeof(*tag) + err);
1150		if (err == -ECONNRESET)
1151			break;
1152	}
1153
1154	spin_unlock_irqrestore(&ds_lock, flags);
1155}
1156
1157static int ds_probe(struct vio_dev *vdev, const struct vio_device_id *id)
1158{
1159	static int ds_version_printed;
1160	struct ldc_channel_config ds_cfg = {
1161		.event		= ds_event,
1162		.mtu		= 4096,
1163		.mode		= LDC_MODE_STREAM,
1164	};
1165	struct mdesc_handle *hp;
1166	struct ldc_channel *lp;
1167	struct ds_info *dp;
1168	const u64 *val;
1169	int err, i;
1170
1171	if (ds_version_printed++ == 0)
1172		printk(KERN_INFO "%s", version);
1173
1174	dp = kzalloc(sizeof(*dp), GFP_KERNEL);
1175	err = -ENOMEM;
1176	if (!dp)
1177		goto out_err;
1178
1179	hp = mdesc_grab();
1180	val = mdesc_get_property(hp, vdev->mp, "id", NULL);
1181	if (val)
1182		dp->id = *val;
1183	mdesc_release(hp);
1184
1185	dp->rcv_buf = kzalloc(4096, GFP_KERNEL);
1186	if (!dp->rcv_buf)
1187		goto out_free_dp;
1188
1189	dp->rcv_buf_len = 4096;
1190
1191	dp->ds_states = kmemdup(ds_states_template,
1192				sizeof(ds_states_template), GFP_KERNEL);
1193	if (!dp->ds_states)
1194		goto out_free_rcv_buf;
1195
1196	dp->num_ds_states = ARRAY_SIZE(ds_states_template);
1197
1198	for (i = 0; i < dp->num_ds_states; i++)
1199		dp->ds_states[i].handle = ((u64)i << 32);
1200
1201	ds_cfg.tx_irq = vdev->tx_irq;
1202	ds_cfg.rx_irq = vdev->rx_irq;
1203
1204	lp = ldc_alloc(vdev->channel_id, &ds_cfg, dp, "DS");
1205	if (IS_ERR(lp)) {
1206		err = PTR_ERR(lp);
1207		goto out_free_ds_states;
1208	}
1209	dp->lp = lp;
1210
1211	err = ldc_bind(lp);
1212	if (err)
1213		goto out_free_ldc;
1214
1215	spin_lock_irq(&ds_lock);
1216	dp->next = ds_info_list;
1217	ds_info_list = dp;
1218	spin_unlock_irq(&ds_lock);
1219
1220	return err;
1221
1222out_free_ldc:
1223	ldc_free(dp->lp);
1224
1225out_free_ds_states:
1226	kfree(dp->ds_states);
1227
1228out_free_rcv_buf:
1229	kfree(dp->rcv_buf);
1230
1231out_free_dp:
1232	kfree(dp);
1233
1234out_err:
1235	return err;
1236}
1237
1238static int ds_remove(struct vio_dev *vdev)
1239{
1240	return 0;
1241}
1242
1243static const struct vio_device_id ds_match[] = {
1244	{
1245		.type = "domain-services-port",
1246	},
1247	{},
1248};
1249
1250static struct vio_driver ds_driver = {
1251	.id_table	= ds_match,
1252	.probe		= ds_probe,
1253	.remove		= ds_remove,
1254	.name		= "ds",
1255};
1256
1257static int __init ds_init(void)
1258{
1259	unsigned long hv_ret, major, minor;
1260
1261	if (tlb_type == hypervisor) {
1262		hv_ret = sun4v_get_version(HV_GRP_REBOOT_DATA, &major, &minor);
1263		if (hv_ret == HV_EOK) {
1264			pr_info("SUN4V: Reboot data supported (maj=%lu,min=%lu).\n",
1265				major, minor);
1266			reboot_data_supported = 1;
1267		}
1268	}
1269	kthread_run(ds_thread, NULL, "kldomd");
1270
1271	return vio_register_driver(&ds_driver);
1272}
1273
1274fs_initcall(ds_init);
v4.6
   1/* ds.c: Domain Services driver for Logical Domains
   2 *
   3 * Copyright (C) 2007, 2008 David S. Miller <davem@davemloft.net>
   4 */
   5
   6#include <linux/kernel.h>
   7#include <linux/module.h>
   8#include <linux/types.h>
   9#include <linux/string.h>
  10#include <linux/slab.h>
  11#include <linux/sched.h>
 
  12#include <linux/delay.h>
  13#include <linux/mutex.h>
  14#include <linux/kthread.h>
  15#include <linux/reboot.h>
  16#include <linux/cpu.h>
  17
  18#include <asm/hypervisor.h>
  19#include <asm/ldc.h>
  20#include <asm/vio.h>
  21#include <asm/mdesc.h>
  22#include <asm/head.h>
  23#include <asm/irq.h>
  24
  25#include "kernel.h"
  26
  27#define DRV_MODULE_NAME		"ds"
  28#define PFX DRV_MODULE_NAME	": "
  29#define DRV_MODULE_VERSION	"1.0"
  30#define DRV_MODULE_RELDATE	"Jul 11, 2007"
  31
  32static char version[] =
  33	DRV_MODULE_NAME ".c:v" DRV_MODULE_VERSION " (" DRV_MODULE_RELDATE ")\n";
  34MODULE_AUTHOR("David S. Miller (davem@davemloft.net)");
  35MODULE_DESCRIPTION("Sun LDOM domain services driver");
  36MODULE_LICENSE("GPL");
  37MODULE_VERSION(DRV_MODULE_VERSION);
  38
  39struct ds_msg_tag {
  40	__u32			type;
  41#define DS_INIT_REQ		0x00
  42#define DS_INIT_ACK		0x01
  43#define DS_INIT_NACK		0x02
  44#define DS_REG_REQ		0x03
  45#define DS_REG_ACK		0x04
  46#define DS_REG_NACK		0x05
  47#define DS_UNREG_REQ		0x06
  48#define DS_UNREG_ACK		0x07
  49#define DS_UNREG_NACK		0x08
  50#define DS_DATA			0x09
  51#define DS_NACK			0x0a
  52
  53	__u32			len;
  54};
  55
  56/* Result codes */
  57#define DS_OK			0x00
  58#define DS_REG_VER_NACK		0x01
  59#define DS_REG_DUP		0x02
  60#define DS_INV_HDL		0x03
  61#define DS_TYPE_UNKNOWN		0x04
  62
  63struct ds_version {
  64	__u16			major;
  65	__u16			minor;
  66};
  67
  68struct ds_ver_req {
  69	struct ds_msg_tag	tag;
  70	struct ds_version	ver;
  71};
  72
  73struct ds_ver_ack {
  74	struct ds_msg_tag	tag;
  75	__u16			minor;
  76};
  77
  78struct ds_ver_nack {
  79	struct ds_msg_tag	tag;
  80	__u16			major;
  81};
  82
  83struct ds_reg_req {
  84	struct ds_msg_tag	tag;
  85	__u64			handle;
  86	__u16			major;
  87	__u16			minor;
  88	char			svc_id[0];
  89};
  90
  91struct ds_reg_ack {
  92	struct ds_msg_tag	tag;
  93	__u64			handle;
  94	__u16			minor;
  95};
  96
  97struct ds_reg_nack {
  98	struct ds_msg_tag	tag;
  99	__u64			handle;
 100	__u16			major;
 101};
 102
 103struct ds_unreg_req {
 104	struct ds_msg_tag	tag;
 105	__u64			handle;
 106};
 107
 108struct ds_unreg_ack {
 109	struct ds_msg_tag	tag;
 110	__u64			handle;
 111};
 112
 113struct ds_unreg_nack {
 114	struct ds_msg_tag	tag;
 115	__u64			handle;
 116};
 117
 118struct ds_data {
 119	struct ds_msg_tag	tag;
 120	__u64			handle;
 121};
 122
 123struct ds_data_nack {
 124	struct ds_msg_tag	tag;
 125	__u64			handle;
 126	__u64			result;
 127};
 128
 129struct ds_info;
 130struct ds_cap_state {
 131	__u64			handle;
 132
 133	void			(*data)(struct ds_info *dp,
 134					struct ds_cap_state *cp,
 135					void *buf, int len);
 136
 137	const char		*service_id;
 138
 139	u8			state;
 140#define CAP_STATE_UNKNOWN	0x00
 141#define CAP_STATE_REG_SENT	0x01
 142#define CAP_STATE_REGISTERED	0x02
 143};
 144
 145static void md_update_data(struct ds_info *dp, struct ds_cap_state *cp,
 146			   void *buf, int len);
 147static void domain_shutdown_data(struct ds_info *dp,
 148				 struct ds_cap_state *cp,
 149				 void *buf, int len);
 150static void domain_panic_data(struct ds_info *dp,
 151			      struct ds_cap_state *cp,
 152			      void *buf, int len);
 153#ifdef CONFIG_HOTPLUG_CPU
 154static void dr_cpu_data(struct ds_info *dp,
 155			struct ds_cap_state *cp,
 156			void *buf, int len);
 157#endif
 158static void ds_pri_data(struct ds_info *dp,
 159			struct ds_cap_state *cp,
 160			void *buf, int len);
 161static void ds_var_data(struct ds_info *dp,
 162			struct ds_cap_state *cp,
 163			void *buf, int len);
 164
 165static struct ds_cap_state ds_states_template[] = {
 166	{
 167		.service_id	= "md-update",
 168		.data		= md_update_data,
 169	},
 170	{
 171		.service_id	= "domain-shutdown",
 172		.data		= domain_shutdown_data,
 173	},
 174	{
 175		.service_id	= "domain-panic",
 176		.data		= domain_panic_data,
 177	},
 178#ifdef CONFIG_HOTPLUG_CPU
 179	{
 180		.service_id	= "dr-cpu",
 181		.data		= dr_cpu_data,
 182	},
 183#endif
 184	{
 185		.service_id	= "pri",
 186		.data		= ds_pri_data,
 187	},
 188	{
 189		.service_id	= "var-config",
 190		.data		= ds_var_data,
 191	},
 192	{
 193		.service_id	= "var-config-backup",
 194		.data		= ds_var_data,
 195	},
 196};
 197
 198static DEFINE_SPINLOCK(ds_lock);
 199
 200struct ds_info {
 201	struct ldc_channel	*lp;
 202	u8			hs_state;
 203#define DS_HS_START		0x01
 204#define DS_HS_DONE		0x02
 205
 206	u64			id;
 207
 208	void			*rcv_buf;
 209	int			rcv_buf_len;
 210
 211	struct ds_cap_state	*ds_states;
 212	int			num_ds_states;
 213
 214	struct ds_info		*next;
 215};
 216
 217static struct ds_info *ds_info_list;
 218
 219static struct ds_cap_state *find_cap(struct ds_info *dp, u64 handle)
 220{
 221	unsigned int index = handle >> 32;
 222
 223	if (index >= dp->num_ds_states)
 224		return NULL;
 225	return &dp->ds_states[index];
 226}
 227
 228static struct ds_cap_state *find_cap_by_string(struct ds_info *dp,
 229					       const char *name)
 230{
 231	int i;
 232
 233	for (i = 0; i < dp->num_ds_states; i++) {
 234		if (strcmp(dp->ds_states[i].service_id, name))
 235			continue;
 236
 237		return &dp->ds_states[i];
 238	}
 239	return NULL;
 240}
 241
 242static int __ds_send(struct ldc_channel *lp, void *data, int len)
 243{
 244	int err, limit = 1000;
 245
 246	err = -EINVAL;
 247	while (limit-- > 0) {
 248		err = ldc_write(lp, data, len);
 249		if (!err || (err != -EAGAIN))
 250			break;
 251		udelay(1);
 252	}
 253
 254	return err;
 255}
 256
 257static int ds_send(struct ldc_channel *lp, void *data, int len)
 258{
 259	unsigned long flags;
 260	int err;
 261
 262	spin_lock_irqsave(&ds_lock, flags);
 263	err = __ds_send(lp, data, len);
 264	spin_unlock_irqrestore(&ds_lock, flags);
 265
 266	return err;
 267}
 268
 269struct ds_md_update_req {
 270	__u64				req_num;
 271};
 272
 273struct ds_md_update_res {
 274	__u64				req_num;
 275	__u32				result;
 276};
 277
 278static void md_update_data(struct ds_info *dp,
 279			   struct ds_cap_state *cp,
 280			   void *buf, int len)
 281{
 282	struct ldc_channel *lp = dp->lp;
 283	struct ds_data *dpkt = buf;
 284	struct ds_md_update_req *rp;
 285	struct {
 286		struct ds_data		data;
 287		struct ds_md_update_res	res;
 288	} pkt;
 289
 290	rp = (struct ds_md_update_req *) (dpkt + 1);
 291
 292	printk(KERN_INFO "ds-%llu: Machine description update.\n", dp->id);
 293
 294	mdesc_update();
 295
 296	memset(&pkt, 0, sizeof(pkt));
 297	pkt.data.tag.type = DS_DATA;
 298	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
 299	pkt.data.handle = cp->handle;
 300	pkt.res.req_num = rp->req_num;
 301	pkt.res.result = DS_OK;
 302
 303	ds_send(lp, &pkt, sizeof(pkt));
 304}
 305
 306struct ds_shutdown_req {
 307	__u64				req_num;
 308	__u32				ms_delay;
 309};
 310
 311struct ds_shutdown_res {
 312	__u64				req_num;
 313	__u32				result;
 314	char				reason[1];
 315};
 316
 317static void domain_shutdown_data(struct ds_info *dp,
 318				 struct ds_cap_state *cp,
 319				 void *buf, int len)
 320{
 321	struct ldc_channel *lp = dp->lp;
 322	struct ds_data *dpkt = buf;
 323	struct ds_shutdown_req *rp;
 324	struct {
 325		struct ds_data		data;
 326		struct ds_shutdown_res	res;
 327	} pkt;
 328
 329	rp = (struct ds_shutdown_req *) (dpkt + 1);
 330
 331	printk(KERN_ALERT "ds-%llu: Shutdown request from "
 332	       "LDOM manager received.\n", dp->id);
 333
 334	memset(&pkt, 0, sizeof(pkt));
 335	pkt.data.tag.type = DS_DATA;
 336	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
 337	pkt.data.handle = cp->handle;
 338	pkt.res.req_num = rp->req_num;
 339	pkt.res.result = DS_OK;
 340	pkt.res.reason[0] = 0;
 341
 342	ds_send(lp, &pkt, sizeof(pkt));
 343
 344	orderly_poweroff(true);
 345}
 346
 347struct ds_panic_req {
 348	__u64				req_num;
 349};
 350
 351struct ds_panic_res {
 352	__u64				req_num;
 353	__u32				result;
 354	char				reason[1];
 355};
 356
 357static void domain_panic_data(struct ds_info *dp,
 358			      struct ds_cap_state *cp,
 359			      void *buf, int len)
 360{
 361	struct ldc_channel *lp = dp->lp;
 362	struct ds_data *dpkt = buf;
 363	struct ds_panic_req *rp;
 364	struct {
 365		struct ds_data		data;
 366		struct ds_panic_res	res;
 367	} pkt;
 368
 369	rp = (struct ds_panic_req *) (dpkt + 1);
 370
 371	printk(KERN_ALERT "ds-%llu: Panic request from "
 372	       "LDOM manager received.\n", dp->id);
 373
 374	memset(&pkt, 0, sizeof(pkt));
 375	pkt.data.tag.type = DS_DATA;
 376	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
 377	pkt.data.handle = cp->handle;
 378	pkt.res.req_num = rp->req_num;
 379	pkt.res.result = DS_OK;
 380	pkt.res.reason[0] = 0;
 381
 382	ds_send(lp, &pkt, sizeof(pkt));
 383
 384	panic("PANIC requested by LDOM manager.");
 385}
 386
 387#ifdef CONFIG_HOTPLUG_CPU
 388struct dr_cpu_tag {
 389	__u64				req_num;
 390	__u32				type;
 391#define DR_CPU_CONFIGURE		0x43
 392#define DR_CPU_UNCONFIGURE		0x55
 393#define DR_CPU_FORCE_UNCONFIGURE	0x46
 394#define DR_CPU_STATUS			0x53
 395
 396/* Responses */
 397#define DR_CPU_OK			0x6f
 398#define DR_CPU_ERROR			0x65
 399
 400	__u32				num_records;
 401};
 402
 403struct dr_cpu_resp_entry {
 404	__u32				cpu;
 405	__u32				result;
 406#define DR_CPU_RES_OK			0x00
 407#define DR_CPU_RES_FAILURE		0x01
 408#define DR_CPU_RES_BLOCKED		0x02
 409#define DR_CPU_RES_CPU_NOT_RESPONDING	0x03
 410#define DR_CPU_RES_NOT_IN_MD		0x04
 411
 412	__u32				stat;
 413#define DR_CPU_STAT_NOT_PRESENT		0x00
 414#define DR_CPU_STAT_UNCONFIGURED	0x01
 415#define DR_CPU_STAT_CONFIGURED		0x02
 416
 417	__u32				str_off;
 418};
 419
 420static void __dr_cpu_send_error(struct ds_info *dp,
 421				struct ds_cap_state *cp,
 422				struct ds_data *data)
 423{
 424	struct dr_cpu_tag *tag = (struct dr_cpu_tag *) (data + 1);
 425	struct {
 426		struct ds_data		data;
 427		struct dr_cpu_tag	tag;
 428	} pkt;
 429	int msg_len;
 430
 431	memset(&pkt, 0, sizeof(pkt));
 432	pkt.data.tag.type = DS_DATA;
 433	pkt.data.handle = cp->handle;
 434	pkt.tag.req_num = tag->req_num;
 435	pkt.tag.type = DR_CPU_ERROR;
 436	pkt.tag.num_records = 0;
 437
 438	msg_len = (sizeof(struct ds_data) +
 439		   sizeof(struct dr_cpu_tag));
 440
 441	pkt.data.tag.len = msg_len - sizeof(struct ds_msg_tag);
 442
 443	__ds_send(dp->lp, &pkt, msg_len);
 444}
 445
 446static void dr_cpu_send_error(struct ds_info *dp,
 447			      struct ds_cap_state *cp,
 448			      struct ds_data *data)
 449{
 450	unsigned long flags;
 451
 452	spin_lock_irqsave(&ds_lock, flags);
 453	__dr_cpu_send_error(dp, cp, data);
 454	spin_unlock_irqrestore(&ds_lock, flags);
 455}
 456
 457#define CPU_SENTINEL	0xffffffff
 458
 459static void purge_dups(u32 *list, u32 num_ents)
 460{
 461	unsigned int i;
 462
 463	for (i = 0; i < num_ents; i++) {
 464		u32 cpu = list[i];
 465		unsigned int j;
 466
 467		if (cpu == CPU_SENTINEL)
 468			continue;
 469
 470		for (j = i + 1; j < num_ents; j++) {
 471			if (list[j] == cpu)
 472				list[j] = CPU_SENTINEL;
 473		}
 474	}
 475}
 476
 477static int dr_cpu_size_response(int ncpus)
 478{
 479	return (sizeof(struct ds_data) +
 480		sizeof(struct dr_cpu_tag) +
 481		(sizeof(struct dr_cpu_resp_entry) * ncpus));
 482}
 483
 484static void dr_cpu_init_response(struct ds_data *resp, u64 req_num,
 485				 u64 handle, int resp_len, int ncpus,
 486				 cpumask_t *mask, u32 default_stat)
 487{
 488	struct dr_cpu_resp_entry *ent;
 489	struct dr_cpu_tag *tag;
 490	int i, cpu;
 491
 492	tag = (struct dr_cpu_tag *) (resp + 1);
 493	ent = (struct dr_cpu_resp_entry *) (tag + 1);
 494
 495	resp->tag.type = DS_DATA;
 496	resp->tag.len = resp_len - sizeof(struct ds_msg_tag);
 497	resp->handle = handle;
 498	tag->req_num = req_num;
 499	tag->type = DR_CPU_OK;
 500	tag->num_records = ncpus;
 501
 502	i = 0;
 503	for_each_cpu(cpu, mask) {
 504		ent[i].cpu = cpu;
 505		ent[i].result = DR_CPU_RES_OK;
 506		ent[i].stat = default_stat;
 507		i++;
 508	}
 509	BUG_ON(i != ncpus);
 510}
 511
 512static void dr_cpu_mark(struct ds_data *resp, int cpu, int ncpus,
 513			u32 res, u32 stat)
 514{
 515	struct dr_cpu_resp_entry *ent;
 516	struct dr_cpu_tag *tag;
 517	int i;
 518
 519	tag = (struct dr_cpu_tag *) (resp + 1);
 520	ent = (struct dr_cpu_resp_entry *) (tag + 1);
 521
 522	for (i = 0; i < ncpus; i++) {
 523		if (ent[i].cpu != cpu)
 524			continue;
 525		ent[i].result = res;
 526		ent[i].stat = stat;
 527		break;
 528	}
 529}
 530
 531static int dr_cpu_configure(struct ds_info *dp, struct ds_cap_state *cp,
 532			    u64 req_num, cpumask_t *mask)
 533{
 534	struct ds_data *resp;
 535	int resp_len, ncpus, cpu;
 536	unsigned long flags;
 537
 538	ncpus = cpumask_weight(mask);
 539	resp_len = dr_cpu_size_response(ncpus);
 540	resp = kzalloc(resp_len, GFP_KERNEL);
 541	if (!resp)
 542		return -ENOMEM;
 543
 544	dr_cpu_init_response(resp, req_num, cp->handle,
 545			     resp_len, ncpus, mask,
 546			     DR_CPU_STAT_CONFIGURED);
 547
 548	mdesc_populate_present_mask(mask);
 549	mdesc_fill_in_cpu_data(mask);
 550
 551	for_each_cpu(cpu, mask) {
 552		int err;
 553
 554		printk(KERN_INFO "ds-%llu: Starting cpu %d...\n",
 555		       dp->id, cpu);
 556		err = cpu_up(cpu);
 557		if (err) {
 558			__u32 res = DR_CPU_RES_FAILURE;
 559			__u32 stat = DR_CPU_STAT_UNCONFIGURED;
 560
 561			if (!cpu_present(cpu)) {
 562				/* CPU not present in MD */
 563				res = DR_CPU_RES_NOT_IN_MD;
 564				stat = DR_CPU_STAT_NOT_PRESENT;
 565			} else if (err == -ENODEV) {
 566				/* CPU did not call in successfully */
 567				res = DR_CPU_RES_CPU_NOT_RESPONDING;
 568			}
 569
 570			printk(KERN_INFO "ds-%llu: CPU startup failed err=%d\n",
 571			       dp->id, err);
 572			dr_cpu_mark(resp, cpu, ncpus, res, stat);
 573		}
 574	}
 575
 576	spin_lock_irqsave(&ds_lock, flags);
 577	__ds_send(dp->lp, resp, resp_len);
 578	spin_unlock_irqrestore(&ds_lock, flags);
 579
 580	kfree(resp);
 581
 582	/* Redistribute IRQs, taking into account the new cpus.  */
 583	fixup_irqs();
 584
 585	return 0;
 586}
 587
 588static int dr_cpu_unconfigure(struct ds_info *dp,
 589			      struct ds_cap_state *cp,
 590			      u64 req_num,
 591			      cpumask_t *mask)
 592{
 593	struct ds_data *resp;
 594	int resp_len, ncpus, cpu;
 595	unsigned long flags;
 596
 597	ncpus = cpumask_weight(mask);
 598	resp_len = dr_cpu_size_response(ncpus);
 599	resp = kzalloc(resp_len, GFP_KERNEL);
 600	if (!resp)
 601		return -ENOMEM;
 602
 603	dr_cpu_init_response(resp, req_num, cp->handle,
 604			     resp_len, ncpus, mask,
 605			     DR_CPU_STAT_UNCONFIGURED);
 606
 607	for_each_cpu(cpu, mask) {
 608		int err;
 609
 610		printk(KERN_INFO "ds-%llu: Shutting down cpu %d...\n",
 611		       dp->id, cpu);
 612		err = cpu_down(cpu);
 613		if (err)
 614			dr_cpu_mark(resp, cpu, ncpus,
 615				    DR_CPU_RES_FAILURE,
 616				    DR_CPU_STAT_CONFIGURED);
 617	}
 618
 619	spin_lock_irqsave(&ds_lock, flags);
 620	__ds_send(dp->lp, resp, resp_len);
 621	spin_unlock_irqrestore(&ds_lock, flags);
 622
 623	kfree(resp);
 624
 625	return 0;
 626}
 627
 628static void dr_cpu_data(struct ds_info *dp, struct ds_cap_state *cp, void *buf,
 629			int len)
 630{
 631	struct ds_data *data = buf;
 632	struct dr_cpu_tag *tag = (struct dr_cpu_tag *) (data + 1);
 633	u32 *cpu_list = (u32 *) (tag + 1);
 634	u64 req_num = tag->req_num;
 635	cpumask_t mask;
 636	unsigned int i;
 637	int err;
 638
 639	switch (tag->type) {
 640	case DR_CPU_CONFIGURE:
 641	case DR_CPU_UNCONFIGURE:
 642	case DR_CPU_FORCE_UNCONFIGURE:
 643		break;
 644
 645	default:
 646		dr_cpu_send_error(dp, cp, data);
 647		return;
 648	}
 649
 650	purge_dups(cpu_list, tag->num_records);
 651
 652	cpumask_clear(&mask);
 653	for (i = 0; i < tag->num_records; i++) {
 654		if (cpu_list[i] == CPU_SENTINEL)
 655			continue;
 656
 657		if (cpu_list[i] < nr_cpu_ids)
 658			cpumask_set_cpu(cpu_list[i], &mask);
 659	}
 660
 661	if (tag->type == DR_CPU_CONFIGURE)
 662		err = dr_cpu_configure(dp, cp, req_num, &mask);
 663	else
 664		err = dr_cpu_unconfigure(dp, cp, req_num, &mask);
 665
 666	if (err)
 667		dr_cpu_send_error(dp, cp, data);
 668}
 669#endif /* CONFIG_HOTPLUG_CPU */
 670
 671struct ds_pri_msg {
 672	__u64				req_num;
 673	__u64				type;
 674#define DS_PRI_REQUEST			0x00
 675#define DS_PRI_DATA			0x01
 676#define DS_PRI_UPDATE			0x02
 677};
 678
 679static void ds_pri_data(struct ds_info *dp,
 680			struct ds_cap_state *cp,
 681			void *buf, int len)
 682{
 683	struct ds_data *dpkt = buf;
 684	struct ds_pri_msg *rp;
 685
 686	rp = (struct ds_pri_msg *) (dpkt + 1);
 687
 688	printk(KERN_INFO "ds-%llu: PRI REQ [%llx:%llx], len=%d\n",
 689	       dp->id, rp->req_num, rp->type, len);
 690}
 691
 692struct ds_var_hdr {
 693	__u32				type;
 694#define DS_VAR_SET_REQ			0x00
 695#define DS_VAR_DELETE_REQ		0x01
 696#define DS_VAR_SET_RESP			0x02
 697#define DS_VAR_DELETE_RESP		0x03
 698};
 699
 700struct ds_var_set_msg {
 701	struct ds_var_hdr		hdr;
 702	char				name_and_value[0];
 703};
 704
 705struct ds_var_delete_msg {
 706	struct ds_var_hdr		hdr;
 707	char				name[0];
 708};
 709
 710struct ds_var_resp {
 711	struct ds_var_hdr		hdr;
 712	__u32				result;
 713#define DS_VAR_SUCCESS			0x00
 714#define DS_VAR_NO_SPACE			0x01
 715#define DS_VAR_INVALID_VAR		0x02
 716#define DS_VAR_INVALID_VAL		0x03
 717#define DS_VAR_NOT_PRESENT		0x04
 718};
 719
 720static DEFINE_MUTEX(ds_var_mutex);
 721static int ds_var_doorbell;
 722static int ds_var_response;
 723
 724static void ds_var_data(struct ds_info *dp,
 725			struct ds_cap_state *cp,
 726			void *buf, int len)
 727{
 728	struct ds_data *dpkt = buf;
 729	struct ds_var_resp *rp;
 730
 731	rp = (struct ds_var_resp *) (dpkt + 1);
 732
 733	if (rp->hdr.type != DS_VAR_SET_RESP &&
 734	    rp->hdr.type != DS_VAR_DELETE_RESP)
 735		return;
 736
 737	ds_var_response = rp->result;
 738	wmb();
 739	ds_var_doorbell = 1;
 740}
 741
 742void ldom_set_var(const char *var, const char *value)
 743{
 744	struct ds_cap_state *cp;
 745	struct ds_info *dp;
 746	unsigned long flags;
 747
 748	spin_lock_irqsave(&ds_lock, flags);
 749	cp = NULL;
 750	for (dp = ds_info_list; dp; dp = dp->next) {
 751		struct ds_cap_state *tmp;
 752
 753		tmp = find_cap_by_string(dp, "var-config");
 754		if (tmp && tmp->state == CAP_STATE_REGISTERED) {
 755			cp = tmp;
 756			break;
 757		}
 758	}
 759	if (!cp) {
 760		for (dp = ds_info_list; dp; dp = dp->next) {
 761			struct ds_cap_state *tmp;
 762
 763			tmp = find_cap_by_string(dp, "var-config-backup");
 764			if (tmp && tmp->state == CAP_STATE_REGISTERED) {
 765				cp = tmp;
 766				break;
 767			}
 768		}
 769	}
 770	spin_unlock_irqrestore(&ds_lock, flags);
 771
 772	if (cp) {
 773		union {
 774			struct {
 775				struct ds_data		data;
 776				struct ds_var_set_msg	msg;
 777			} header;
 778			char			all[512];
 779		} pkt;
 780		char  *base, *p;
 781		int msg_len, loops;
 782
 783		if (strlen(var) + strlen(value) + 2 >
 784		    sizeof(pkt) - sizeof(pkt.header)) {
 785			printk(KERN_ERR PFX
 786				"contents length: %zu, which more than max: %lu,"
 787				"so could not set (%s) variable to (%s).\n",
 788				strlen(var) + strlen(value) + 2,
 789				sizeof(pkt) - sizeof(pkt.header), var, value);
 790			return;
 791		}
 792
 793		memset(&pkt, 0, sizeof(pkt));
 794		pkt.header.data.tag.type = DS_DATA;
 795		pkt.header.data.handle = cp->handle;
 796		pkt.header.msg.hdr.type = DS_VAR_SET_REQ;
 797		base = p = &pkt.header.msg.name_and_value[0];
 798		strcpy(p, var);
 799		p += strlen(var) + 1;
 800		strcpy(p, value);
 801		p += strlen(value) + 1;
 802
 803		msg_len = (sizeof(struct ds_data) +
 804			   sizeof(struct ds_var_set_msg) +
 805			   (p - base));
 806		msg_len = (msg_len + 3) & ~3;
 807		pkt.header.data.tag.len = msg_len - sizeof(struct ds_msg_tag);
 808
 809		mutex_lock(&ds_var_mutex);
 810
 811		spin_lock_irqsave(&ds_lock, flags);
 812		ds_var_doorbell = 0;
 813		ds_var_response = -1;
 814
 815		__ds_send(dp->lp, &pkt, msg_len);
 816		spin_unlock_irqrestore(&ds_lock, flags);
 817
 818		loops = 1000;
 819		while (ds_var_doorbell == 0) {
 820			if (loops-- < 0)
 821				break;
 822			barrier();
 823			udelay(100);
 824		}
 825
 826		mutex_unlock(&ds_var_mutex);
 827
 828		if (ds_var_doorbell == 0 ||
 829		    ds_var_response != DS_VAR_SUCCESS)
 830			printk(KERN_ERR "ds-%llu: var-config [%s:%s] "
 831			       "failed, response(%d).\n",
 832			       dp->id, var, value,
 833			       ds_var_response);
 834	} else {
 835		printk(KERN_ERR PFX "var-config not registered so "
 836		       "could not set (%s) variable to (%s).\n",
 837		       var, value);
 838	}
 839}
 840
 841static char full_boot_str[256] __attribute__((aligned(32)));
 842static int reboot_data_supported;
 843
 844void ldom_reboot(const char *boot_command)
 845{
 846	/* Don't bother with any of this if the boot_command
 847	 * is empty.
 848	 */
 849	if (boot_command && strlen(boot_command)) {
 850		unsigned long len;
 851
 852		snprintf(full_boot_str, sizeof(full_boot_str), "boot %s",
 853			 boot_command);
 854		len = strlen(full_boot_str);
 855
 856		if (reboot_data_supported) {
 857			unsigned long ra = kimage_addr_to_ra(full_boot_str);
 858			unsigned long hv_ret;
 859
 860			hv_ret = sun4v_reboot_data_set(ra, len);
 861			if (hv_ret != HV_EOK)
 862				pr_err("SUN4V: Unable to set reboot data "
 863				       "hv_ret=%lu\n", hv_ret);
 864		} else {
 865			ldom_set_var("reboot-command", full_boot_str);
 866		}
 867	}
 868	sun4v_mach_sir();
 869}
 870
 871void ldom_power_off(void)
 872{
 873	sun4v_mach_exit(0);
 874}
 875
 876static void ds_conn_reset(struct ds_info *dp)
 877{
 878	printk(KERN_ERR "ds-%llu: ds_conn_reset() from %pf\n",
 879	       dp->id, __builtin_return_address(0));
 880}
 881
 882static int register_services(struct ds_info *dp)
 883{
 884	struct ldc_channel *lp = dp->lp;
 885	int i;
 886
 887	for (i = 0; i < dp->num_ds_states; i++) {
 888		struct {
 889			struct ds_reg_req req;
 890			u8 id_buf[256];
 891		} pbuf;
 892		struct ds_cap_state *cp = &dp->ds_states[i];
 893		int err, msg_len;
 894		u64 new_count;
 895
 896		if (cp->state == CAP_STATE_REGISTERED)
 897			continue;
 898
 899		new_count = sched_clock() & 0xffffffff;
 900		cp->handle = ((u64) i << 32) | new_count;
 901
 902		msg_len = (sizeof(struct ds_reg_req) +
 903			   strlen(cp->service_id));
 904
 905		memset(&pbuf, 0, sizeof(pbuf));
 906		pbuf.req.tag.type = DS_REG_REQ;
 907		pbuf.req.tag.len = (msg_len - sizeof(struct ds_msg_tag));
 908		pbuf.req.handle = cp->handle;
 909		pbuf.req.major = 1;
 910		pbuf.req.minor = 0;
 911		strcpy(pbuf.req.svc_id, cp->service_id);
 912
 913		err = __ds_send(lp, &pbuf, msg_len);
 914		if (err > 0)
 915			cp->state = CAP_STATE_REG_SENT;
 916	}
 917	return 0;
 918}
 919
 920static int ds_handshake(struct ds_info *dp, struct ds_msg_tag *pkt)
 921{
 922
 923	if (dp->hs_state == DS_HS_START) {
 924		if (pkt->type != DS_INIT_ACK)
 925			goto conn_reset;
 926
 927		dp->hs_state = DS_HS_DONE;
 928
 929		return register_services(dp);
 930	}
 931
 932	if (dp->hs_state != DS_HS_DONE)
 933		goto conn_reset;
 934
 935	if (pkt->type == DS_REG_ACK) {
 936		struct ds_reg_ack *ap = (struct ds_reg_ack *) pkt;
 937		struct ds_cap_state *cp = find_cap(dp, ap->handle);
 938
 939		if (!cp) {
 940			printk(KERN_ERR "ds-%llu: REG ACK for unknown "
 941			       "handle %llx\n", dp->id, ap->handle);
 942			return 0;
 943		}
 944		printk(KERN_INFO "ds-%llu: Registered %s service.\n",
 945		       dp->id, cp->service_id);
 946		cp->state = CAP_STATE_REGISTERED;
 947	} else if (pkt->type == DS_REG_NACK) {
 948		struct ds_reg_nack *np = (struct ds_reg_nack *) pkt;
 949		struct ds_cap_state *cp = find_cap(dp, np->handle);
 950
 951		if (!cp) {
 952			printk(KERN_ERR "ds-%llu: REG NACK for "
 953			       "unknown handle %llx\n",
 954			       dp->id, np->handle);
 955			return 0;
 956		}
 957		cp->state = CAP_STATE_UNKNOWN;
 958	}
 959
 960	return 0;
 961
 962conn_reset:
 963	ds_conn_reset(dp);
 964	return -ECONNRESET;
 965}
 966
 967static void __send_ds_nack(struct ds_info *dp, u64 handle)
 968{
 969	struct ds_data_nack nack = {
 970		.tag = {
 971			.type = DS_NACK,
 972			.len = (sizeof(struct ds_data_nack) -
 973				sizeof(struct ds_msg_tag)),
 974		},
 975		.handle = handle,
 976		.result = DS_INV_HDL,
 977	};
 978
 979	__ds_send(dp->lp, &nack, sizeof(nack));
 980}
 981
 982static LIST_HEAD(ds_work_list);
 983static DECLARE_WAIT_QUEUE_HEAD(ds_wait);
 984
 985struct ds_queue_entry {
 986	struct list_head		list;
 987	struct ds_info			*dp;
 988	int				req_len;
 989	int				__pad;
 990	u64				req[0];
 991};
 992
 993static void process_ds_work(void)
 994{
 995	struct ds_queue_entry *qp, *tmp;
 996	unsigned long flags;
 997	LIST_HEAD(todo);
 998
 999	spin_lock_irqsave(&ds_lock, flags);
1000	list_splice_init(&ds_work_list, &todo);
1001	spin_unlock_irqrestore(&ds_lock, flags);
1002
1003	list_for_each_entry_safe(qp, tmp, &todo, list) {
1004		struct ds_data *dpkt = (struct ds_data *) qp->req;
1005		struct ds_info *dp = qp->dp;
1006		struct ds_cap_state *cp = find_cap(dp, dpkt->handle);
1007		int req_len = qp->req_len;
1008
1009		if (!cp) {
1010			printk(KERN_ERR "ds-%llu: Data for unknown "
1011			       "handle %llu\n",
1012			       dp->id, dpkt->handle);
1013
1014			spin_lock_irqsave(&ds_lock, flags);
1015			__send_ds_nack(dp, dpkt->handle);
1016			spin_unlock_irqrestore(&ds_lock, flags);
1017		} else {
1018			cp->data(dp, cp, dpkt, req_len);
1019		}
1020
1021		list_del(&qp->list);
1022		kfree(qp);
1023	}
1024}
1025
1026static int ds_thread(void *__unused)
1027{
1028	DEFINE_WAIT(wait);
1029
1030	while (1) {
1031		prepare_to_wait(&ds_wait, &wait, TASK_INTERRUPTIBLE);
1032		if (list_empty(&ds_work_list))
1033			schedule();
1034		finish_wait(&ds_wait, &wait);
1035
1036		if (kthread_should_stop())
1037			break;
1038
1039		process_ds_work();
1040	}
1041
1042	return 0;
1043}
1044
1045static int ds_data(struct ds_info *dp, struct ds_msg_tag *pkt, int len)
1046{
1047	struct ds_data *dpkt = (struct ds_data *) pkt;
1048	struct ds_queue_entry *qp;
1049
1050	qp = kmalloc(sizeof(struct ds_queue_entry) + len, GFP_ATOMIC);
1051	if (!qp) {
1052		__send_ds_nack(dp, dpkt->handle);
1053	} else {
1054		qp->dp = dp;
1055		memcpy(&qp->req, pkt, len);
1056		list_add_tail(&qp->list, &ds_work_list);
1057		wake_up(&ds_wait);
1058	}
1059	return 0;
1060}
1061
1062static void ds_up(struct ds_info *dp)
1063{
1064	struct ldc_channel *lp = dp->lp;
1065	struct ds_ver_req req;
1066	int err;
1067
1068	req.tag.type = DS_INIT_REQ;
1069	req.tag.len = sizeof(req) - sizeof(struct ds_msg_tag);
1070	req.ver.major = 1;
1071	req.ver.minor = 0;
1072
1073	err = __ds_send(lp, &req, sizeof(req));
1074	if (err > 0)
1075		dp->hs_state = DS_HS_START;
1076}
1077
1078static void ds_reset(struct ds_info *dp)
1079{
1080	int i;
1081
1082	dp->hs_state = 0;
1083
1084	for (i = 0; i < dp->num_ds_states; i++) {
1085		struct ds_cap_state *cp = &dp->ds_states[i];
1086
1087		cp->state = CAP_STATE_UNKNOWN;
1088	}
1089}
1090
1091static void ds_event(void *arg, int event)
1092{
1093	struct ds_info *dp = arg;
1094	struct ldc_channel *lp = dp->lp;
1095	unsigned long flags;
1096	int err;
1097
1098	spin_lock_irqsave(&ds_lock, flags);
1099
1100	if (event == LDC_EVENT_UP) {
1101		ds_up(dp);
1102		spin_unlock_irqrestore(&ds_lock, flags);
1103		return;
1104	}
1105
1106	if (event == LDC_EVENT_RESET) {
1107		ds_reset(dp);
1108		spin_unlock_irqrestore(&ds_lock, flags);
1109		return;
1110	}
1111
1112	if (event != LDC_EVENT_DATA_READY) {
1113		printk(KERN_WARNING "ds-%llu: Unexpected LDC event %d\n",
1114		       dp->id, event);
1115		spin_unlock_irqrestore(&ds_lock, flags);
1116		return;
1117	}
1118
1119	err = 0;
1120	while (1) {
1121		struct ds_msg_tag *tag;
1122
1123		err = ldc_read(lp, dp->rcv_buf, sizeof(*tag));
1124
1125		if (unlikely(err < 0)) {
1126			if (err == -ECONNRESET)
1127				ds_conn_reset(dp);
1128			break;
1129		}
1130		if (err == 0)
1131			break;
1132
1133		tag = dp->rcv_buf;
1134		err = ldc_read(lp, tag + 1, tag->len);
1135
1136		if (unlikely(err < 0)) {
1137			if (err == -ECONNRESET)
1138				ds_conn_reset(dp);
1139			break;
1140		}
1141		if (err < tag->len)
1142			break;
1143
1144		if (tag->type < DS_DATA)
1145			err = ds_handshake(dp, dp->rcv_buf);
1146		else
1147			err = ds_data(dp, dp->rcv_buf,
1148				      sizeof(*tag) + err);
1149		if (err == -ECONNRESET)
1150			break;
1151	}
1152
1153	spin_unlock_irqrestore(&ds_lock, flags);
1154}
1155
1156static int ds_probe(struct vio_dev *vdev, const struct vio_device_id *id)
1157{
1158	static int ds_version_printed;
1159	struct ldc_channel_config ds_cfg = {
1160		.event		= ds_event,
1161		.mtu		= 4096,
1162		.mode		= LDC_MODE_STREAM,
1163	};
1164	struct mdesc_handle *hp;
1165	struct ldc_channel *lp;
1166	struct ds_info *dp;
1167	const u64 *val;
1168	int err, i;
1169
1170	if (ds_version_printed++ == 0)
1171		printk(KERN_INFO "%s", version);
1172
1173	dp = kzalloc(sizeof(*dp), GFP_KERNEL);
1174	err = -ENOMEM;
1175	if (!dp)
1176		goto out_err;
1177
1178	hp = mdesc_grab();
1179	val = mdesc_get_property(hp, vdev->mp, "id", NULL);
1180	if (val)
1181		dp->id = *val;
1182	mdesc_release(hp);
1183
1184	dp->rcv_buf = kzalloc(4096, GFP_KERNEL);
1185	if (!dp->rcv_buf)
1186		goto out_free_dp;
1187
1188	dp->rcv_buf_len = 4096;
1189
1190	dp->ds_states = kmemdup(ds_states_template,
1191				sizeof(ds_states_template), GFP_KERNEL);
1192	if (!dp->ds_states)
1193		goto out_free_rcv_buf;
1194
1195	dp->num_ds_states = ARRAY_SIZE(ds_states_template);
1196
1197	for (i = 0; i < dp->num_ds_states; i++)
1198		dp->ds_states[i].handle = ((u64)i << 32);
1199
1200	ds_cfg.tx_irq = vdev->tx_irq;
1201	ds_cfg.rx_irq = vdev->rx_irq;
1202
1203	lp = ldc_alloc(vdev->channel_id, &ds_cfg, dp, "DS");
1204	if (IS_ERR(lp)) {
1205		err = PTR_ERR(lp);
1206		goto out_free_ds_states;
1207	}
1208	dp->lp = lp;
1209
1210	err = ldc_bind(lp);
1211	if (err)
1212		goto out_free_ldc;
1213
1214	spin_lock_irq(&ds_lock);
1215	dp->next = ds_info_list;
1216	ds_info_list = dp;
1217	spin_unlock_irq(&ds_lock);
1218
1219	return err;
1220
1221out_free_ldc:
1222	ldc_free(dp->lp);
1223
1224out_free_ds_states:
1225	kfree(dp->ds_states);
1226
1227out_free_rcv_buf:
1228	kfree(dp->rcv_buf);
1229
1230out_free_dp:
1231	kfree(dp);
1232
1233out_err:
1234	return err;
1235}
1236
1237static int ds_remove(struct vio_dev *vdev)
1238{
1239	return 0;
1240}
1241
1242static const struct vio_device_id ds_match[] = {
1243	{
1244		.type = "domain-services-port",
1245	},
1246	{},
1247};
1248
1249static struct vio_driver ds_driver = {
1250	.id_table	= ds_match,
1251	.probe		= ds_probe,
1252	.remove		= ds_remove,
1253	.name		= "ds",
1254};
1255
1256static int __init ds_init(void)
1257{
1258	unsigned long hv_ret, major, minor;
1259
1260	if (tlb_type == hypervisor) {
1261		hv_ret = sun4v_get_version(HV_GRP_REBOOT_DATA, &major, &minor);
1262		if (hv_ret == HV_EOK) {
1263			pr_info("SUN4V: Reboot data supported (maj=%lu,min=%lu).\n",
1264				major, minor);
1265			reboot_data_supported = 1;
1266		}
1267	}
1268	kthread_run(ds_thread, NULL, "kldomd");
1269
1270	return vio_register_driver(&ds_driver);
1271}
1272
1273fs_initcall(ds_init);