1/* ds.c: Domain Services driver for Logical Domains
2 *
3 * Copyright (C) 2007, 2008 David S. Miller <davem@davemloft.net>
4 */
5
6#include <linux/kernel.h>
7#include <linux/module.h>
8#include <linux/types.h>
9#include <linux/string.h>
10#include <linux/slab.h>
11#include <linux/sched.h>
12#include <linux/delay.h>
13#include <linux/mutex.h>
14#include <linux/kthread.h>
15#include <linux/reboot.h>
16#include <linux/cpu.h>
17
18#include <asm/hypervisor.h>
19#include <asm/ldc.h>
20#include <asm/vio.h>
21#include <asm/mdesc.h>
22#include <asm/head.h>
23#include <asm/irq.h>
24
25#include "kernel.h"
26
/* Driver identification strings; PFX is the prefix used on driver-wide
 * (not per-channel) log messages.
 */
#define DRV_MODULE_NAME		"ds"
#define PFX DRV_MODULE_NAME	": "
#define DRV_MODULE_VERSION	"1.0"
#define DRV_MODULE_RELDATE	"Jul 11, 2007"

/* Banner string; ds_probe() prints it on its first invocation only. */
static char version[] =
	DRV_MODULE_NAME ".c:v" DRV_MODULE_VERSION " (" DRV_MODULE_RELDATE ")\n";
MODULE_AUTHOR("David S. Miller (davem@davemloft.net)");
MODULE_DESCRIPTION("Sun LDOM domain services driver");
MODULE_LICENSE("GPL");
MODULE_VERSION(DRV_MODULE_VERSION);
38
/* Header found at the start of every Domain Services message.
 *
 * ds_event() reads this header first and then reads 'len' more bytes,
 * so 'len' counts only the bytes that follow the tag.  Message types
 * below DS_DATA are routed to ds_handshake(); everything else is
 * queued by ds_data().
 */
struct ds_msg_tag {
	__u32			type;
#define DS_INIT_REQ		0x00
#define DS_INIT_ACK		0x01
#define DS_INIT_NACK		0x02
#define DS_REG_REQ		0x03
#define DS_REG_ACK		0x04
#define DS_REG_NACK		0x05
#define DS_UNREG_REQ		0x06
#define DS_UNREG_ACK		0x07
#define DS_UNREG_NACK		0x08
#define DS_DATA			0x09
#define DS_NACK			0x0a

	__u32			len;
};
55
/* Result codes.  Within this file DS_OK is placed in service replies
 * and DS_INV_HDL is the result carried by the NACK that
 * __send_ds_nack() builds; the remaining codes are not referenced here.
 */
#define DS_OK			0x00
#define DS_REG_VER_NACK		0x01
#define DS_REG_DUP		0x02
#define DS_INV_HDL		0x03
#define DS_TYPE_UNKNOWN		0x04
62
/* Major/minor version pair embedded in struct ds_ver_req. */
struct ds_version {
	__u16			major;
	__u16			minor;
};
67
/* Version request message; ds_up() sends one with tag type
 * DS_INIT_REQ and version 1.0 to start the handshake.
 */
struct ds_ver_req {
	struct ds_msg_tag	tag;
	struct ds_version	ver;
};
72
/* Layout of a version acknowledgement.  Not dereferenced in this file:
 * ds_handshake() only compares the tag type against DS_INIT_ACK.
 * NOTE(review): 'minor' is presumably the minor version the peer
 * accepted -- confirm against the protocol specification.
 */
struct ds_ver_ack {
	struct ds_msg_tag	tag;
	__u16			minor;
};
77
/* Layout of a version rejection.  Not referenced elsewhere in this
 * file.  NOTE(review): 'major' is presumably the major version the
 * peer would accept instead -- confirm against the protocol spec.
 */
struct ds_ver_nack {
	struct ds_msg_tag	tag;
	__u16			major;
};
82
/* Service registration request, built by register_services().
 *
 * 'handle' is the handle chosen for the service, 'major'/'minor' the
 * requested version (1.0 in this file) and 'svc_id' receives the
 * service name string copied from ds_cap_state.service_id.
 */
struct ds_reg_req {
	struct ds_msg_tag	tag;
	__u64			handle;
	__u16			major;
	__u16			minor;
	char			svc_id[0];
};
90
/* Registration acknowledgement.  ds_handshake() uses 'handle' to look
 * up the capability and mark it CAP_STATE_REGISTERED; 'minor' is not
 * read in this file.
 */
struct ds_reg_ack {
	struct ds_msg_tag	tag;
	__u64			handle;
	__u16			minor;
};
96
/* Registration rejection.  ds_handshake() uses 'handle' to look up the
 * capability and return it to CAP_STATE_UNKNOWN; 'major' is not read
 * in this file.
 */
struct ds_reg_nack {
	struct ds_msg_tag	tag;
	__u64			handle;
	__u16			major;
};
102
/* Layout of an unregister request (DS_UNREG_REQ).  Declared for
 * completeness; nothing in this file builds or parses one.
 */
struct ds_unreg_req {
	struct ds_msg_tag	tag;
	__u64			handle;
};
107
/* Layout of an unregister acknowledgement (DS_UNREG_ACK).  Not used
 * by any code in this file.
 */
struct ds_unreg_ack {
	struct ds_msg_tag	tag;
	__u64			handle;
};
112
/* Layout of an unregister rejection (DS_UNREG_NACK).  Not used by any
 * code in this file.
 */
struct ds_unreg_nack {
	struct ds_msg_tag	tag;
	__u64			handle;
};
117
/* Header of a DS_DATA message.  'handle' selects the service (see
 * find_cap()); the service-specific payload follows immediately and is
 * reached by the handlers as (struct ds_data *)buf + 1.
 */
struct ds_data {
	struct ds_msg_tag	tag;
	__u64			handle;
};
122
/* Negative acknowledgement for a data message, as sent by
 * __send_ds_nack(): 'handle' echoes the offending handle and 'result'
 * carries a DS_* result code (DS_INV_HDL in this file).
 */
struct ds_data_nack {
	struct ds_msg_tag	tag;
	__u64			handle;
	__u64			result;
};
128
struct ds_info;

/* Per-channel state of one domain service ("capability").
 *
 * Each ds_info owns a private copy of ds_states_template[], one entry
 * per service.
 */
struct ds_cap_state {
	/* Upper 32 bits hold the entry's index in ds_states (see
	 * find_cap()); register_services() fills the lower 32 bits from
	 * sched_clock().
	 */
	__u64			handle;

	/* Handler invoked from process_ds_work() for each DS_DATA
	 * message addressed to this service.  'buf' points at the
	 * struct ds_data header.
	 */
	void			(*data)(struct ds_info *dp,
					struct ds_cap_state *cp,
					void *buf, int len);

	/* Service name sent in the registration request. */
	const char		*service_id;

	/* Registration progress, one of CAP_STATE_*. */
	u8			state;
#define CAP_STATE_UNKNOWN	0x00
#define CAP_STATE_REG_SENT	0x01
#define CAP_STATE_REGISTERED	0x02
};
144
/* Forward declarations of the per-service data handlers, needed so
 * that ds_states_template[] below can reference them before their
 * definitions.
 */
static void md_update_data(struct ds_info *dp, struct ds_cap_state *cp,
			   void *buf, int len);
static void domain_shutdown_data(struct ds_info *dp,
				 struct ds_cap_state *cp,
				 void *buf, int len);
static void domain_panic_data(struct ds_info *dp,
			      struct ds_cap_state *cp,
			      void *buf, int len);
#ifdef CONFIG_HOTPLUG_CPU
static void dr_cpu_data(struct ds_info *dp,
			struct ds_cap_state *cp,
			void *buf, int len);
#endif
static void ds_pri_data(struct ds_info *dp,
			struct ds_cap_state *cp,
			void *buf, int len);
static void ds_var_data(struct ds_info *dp,
			struct ds_cap_state *cp,
			void *buf, int len);
164
/* Table of services this driver offers.  ds_probe() duplicates it for
 * every channel; the position of an entry becomes the index encoded in
 * the upper half of its handle.  The "dr-cpu" service is only present
 * when CPU hotplug is configured.
 */
static struct ds_cap_state ds_states_template[] = {
	{
		.service_id	= "md-update",
		.data		= md_update_data,
	},
	{
		.service_id	= "domain-shutdown",
		.data		= domain_shutdown_data,
	},
	{
		.service_id	= "domain-panic",
		.data		= domain_panic_data,
	},
#ifdef CONFIG_HOTPLUG_CPU
	{
		.service_id	= "dr-cpu",
		.data		= dr_cpu_data,
	},
#endif
	{
		.service_id	= "pri",
		.data		= ds_pri_data,
	},
	{
		/* Both variable services share one response handler. */
		.service_id	= "var-config",
		.data		= ds_var_data,
	},
	{
		.service_id	= "var-config-backup",
		.data		= ds_var_data,
	},
};
197
/* Taken (IRQ-safe) around ds_info_list walks, ds_work_list updates,
 * event handling in ds_event() and every __ds_send() call in this file.
 */
static DEFINE_SPINLOCK(ds_lock);
199
/* State of one domain-services port (one LDC channel). */
struct ds_info {
	struct ldc_channel	*lp;		/* Channel from ldc_alloc(). */
	u8			hs_state;	/* 0 after reset, else DS_HS_*. */
#define DS_HS_START		0x01
#define DS_HS_DONE		0x02

	u64			id;		/* MD "id" property, used in logs. */

	void			*rcv_buf;	/* Receive buffer for ds_event(). */
	int			rcv_buf_len;	/* Size of rcv_buf in bytes. */

	struct ds_cap_state	*ds_states;	/* Copy of ds_states_template. */
	int			num_ds_states;	/* Entries in ds_states. */

	struct ds_info		*next;		/* Link in ds_info_list. */
};
216
/* Singly linked list of all probed ports; ds_probe() pushes new
 * entries at the head while holding ds_lock.
 */
static struct ds_info *ds_info_list;
218
219static struct ds_cap_state *find_cap(struct ds_info *dp, u64 handle)
220{
221	unsigned int index = handle >> 32;
222
223	if (index >= dp->num_ds_states)
224		return NULL;
225	return &dp->ds_states[index];
226}
227
228static struct ds_cap_state *find_cap_by_string(struct ds_info *dp,
229					       const char *name)
230{
231	int i;
232
233	for (i = 0; i < dp->num_ds_states; i++) {
234		if (strcmp(dp->ds_states[i].service_id, name))
235			continue;
236
237		return &dp->ds_states[i];
238	}
239	return NULL;
240}
241
242static int __ds_send(struct ldc_channel *lp, void *data, int len)
243{
244	int err, limit = 1000;
245
246	err = -EINVAL;
247	while (limit-- > 0) {
248		err = ldc_write(lp, data, len);
249		if (!err || (err != -EAGAIN))
250			break;
251		udelay(1);
252	}
253
254	return err;
255}
256
257static int ds_send(struct ldc_channel *lp, void *data, int len)
258{
259	unsigned long flags;
260	int err;
261
262	spin_lock_irqsave(&ds_lock, flags);
263	err = __ds_send(lp, data, len);
264	spin_unlock_irqrestore(&ds_lock, flags);
265
266	return err;
267}
268
/* Payload of an "md-update" request; req_num is echoed in the reply. */
struct ds_md_update_req {
	__u64				req_num;
};
272
/* Payload of the "md-update" reply built by md_update_data(). */
struct ds_md_update_res {
	__u64				req_num;	/* Copied from the request. */
	__u32				result;		/* DS_OK in this file. */
};
277
278static void md_update_data(struct ds_info *dp,
279			   struct ds_cap_state *cp,
280			   void *buf, int len)
281{
282	struct ldc_channel *lp = dp->lp;
283	struct ds_data *dpkt = buf;
284	struct ds_md_update_req *rp;
285	struct {
286		struct ds_data		data;
287		struct ds_md_update_res	res;
288	} pkt;
289
290	rp = (struct ds_md_update_req *) (dpkt + 1);
291
292	printk(KERN_INFO "ds-%llu: Machine description update.\n", dp->id);
293
294	mdesc_update();
295
296	memset(&pkt, 0, sizeof(pkt));
297	pkt.data.tag.type = DS_DATA;
298	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
299	pkt.data.handle = cp->handle;
300	pkt.res.req_num = rp->req_num;
301	pkt.res.result = DS_OK;
302
303	ds_send(lp, &pkt, sizeof(pkt));
304}
305
/* Payload of a "domain-shutdown" request.  Only req_num is read by
 * domain_shutdown_data(); ms_delay is ignored in this file.
 */
struct ds_shutdown_req {
	__u64				req_num;
	__u32				ms_delay;
};
310
/* Payload of the "domain-shutdown" reply; this file always sends
 * DS_OK with an empty (single NUL byte) reason string.
 */
struct ds_shutdown_res {
	__u64				req_num;
	__u32				result;
	char				reason[1];
};
316
317static void domain_shutdown_data(struct ds_info *dp,
318				 struct ds_cap_state *cp,
319				 void *buf, int len)
320{
321	struct ldc_channel *lp = dp->lp;
322	struct ds_data *dpkt = buf;
323	struct ds_shutdown_req *rp;
324	struct {
325		struct ds_data		data;
326		struct ds_shutdown_res	res;
327	} pkt;
328
329	rp = (struct ds_shutdown_req *) (dpkt + 1);
330
331	printk(KERN_ALERT "ds-%llu: Shutdown request from "
332	       "LDOM manager received.\n", dp->id);
333
334	memset(&pkt, 0, sizeof(pkt));
335	pkt.data.tag.type = DS_DATA;
336	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
337	pkt.data.handle = cp->handle;
338	pkt.res.req_num = rp->req_num;
339	pkt.res.result = DS_OK;
340	pkt.res.reason[0] = 0;
341
342	ds_send(lp, &pkt, sizeof(pkt));
343
344	orderly_poweroff(true);
345}
346
/* Payload of a "domain-panic" request; req_num is echoed in the reply. */
struct ds_panic_req {
	__u64				req_num;
};
350
/* Payload of the "domain-panic" reply; this file always sends DS_OK
 * with an empty (single NUL byte) reason string.
 */
struct ds_panic_res {
	__u64				req_num;
	__u32				result;
	char				reason[1];
};
356
357static void domain_panic_data(struct ds_info *dp,
358			      struct ds_cap_state *cp,
359			      void *buf, int len)
360{
361	struct ldc_channel *lp = dp->lp;
362	struct ds_data *dpkt = buf;
363	struct ds_panic_req *rp;
364	struct {
365		struct ds_data		data;
366		struct ds_panic_res	res;
367	} pkt;
368
369	rp = (struct ds_panic_req *) (dpkt + 1);
370
371	printk(KERN_ALERT "ds-%llu: Panic request from "
372	       "LDOM manager received.\n", dp->id);
373
374	memset(&pkt, 0, sizeof(pkt));
375	pkt.data.tag.type = DS_DATA;
376	pkt.data.tag.len = sizeof(pkt) - sizeof(struct ds_msg_tag);
377	pkt.data.handle = cp->handle;
378	pkt.res.req_num = rp->req_num;
379	pkt.res.result = DS_OK;
380	pkt.res.reason[0] = 0;
381
382	ds_send(lp, &pkt, sizeof(pkt));
383
384	panic("PANIC requested by LDOM manager.");
385}
386
387#ifdef CONFIG_HOTPLUG_CPU
/* Header of a "dr-cpu" message, following struct ds_data.
 *
 * In requests it is followed by num_records u32 CPU ids (see
 * dr_cpu_data()); in responses by num_records struct
 * dr_cpu_resp_entry items (see dr_cpu_init_response()).
 */
struct dr_cpu_tag {
	__u64				req_num;
	__u32				type;
#define DR_CPU_CONFIGURE		0x43
#define DR_CPU_UNCONFIGURE		0x55
#define DR_CPU_FORCE_UNCONFIGURE	0x46
#define DR_CPU_STATUS			0x53

/* Responses */
#define DR_CPU_OK			0x6f
#define DR_CPU_ERROR			0x65

	__u32				num_records;
};
402
/* One per-CPU record in a "dr-cpu" response.
 *
 * 'result' reports the outcome of the operation for 'cpu' and 'stat'
 * the state reported for it.  'str_off' is never written explicitly
 * in this file; it stays zero from the kzalloc() of the response.
 */
struct dr_cpu_resp_entry {
	__u32				cpu;
	__u32				result;
#define DR_CPU_RES_OK			0x00
#define DR_CPU_RES_FAILURE		0x01
#define DR_CPU_RES_BLOCKED		0x02
#define DR_CPU_RES_CPU_NOT_RESPONDING	0x03
#define DR_CPU_RES_NOT_IN_MD		0x04

	__u32				stat;
#define DR_CPU_STAT_NOT_PRESENT		0x00
#define DR_CPU_STAT_UNCONFIGURED	0x01
#define DR_CPU_STAT_CONFIGURED		0x02

	__u32				str_off;
};
419
420static void __dr_cpu_send_error(struct ds_info *dp,
421				struct ds_cap_state *cp,
422				struct ds_data *data)
423{
424	struct dr_cpu_tag *tag = (struct dr_cpu_tag *) (data + 1);
425	struct {
426		struct ds_data		data;
427		struct dr_cpu_tag	tag;
428	} pkt;
429	int msg_len;
430
431	memset(&pkt, 0, sizeof(pkt));
432	pkt.data.tag.type = DS_DATA;
433	pkt.data.handle = cp->handle;
434	pkt.tag.req_num = tag->req_num;
435	pkt.tag.type = DR_CPU_ERROR;
436	pkt.tag.num_records = 0;
437
438	msg_len = (sizeof(struct ds_data) +
439		   sizeof(struct dr_cpu_tag));
440
441	pkt.data.tag.len = msg_len - sizeof(struct ds_msg_tag);
442
443	__ds_send(dp->lp, &pkt, msg_len);
444}
445
446static void dr_cpu_send_error(struct ds_info *dp,
447			      struct ds_cap_state *cp,
448			      struct ds_data *data)
449{
450	unsigned long flags;
451
452	spin_lock_irqsave(&ds_lock, flags);
453	__dr_cpu_send_error(dp, cp, data);
454	spin_unlock_irqrestore(&ds_lock, flags);
455}
456
#define CPU_SENTINEL	0xffffffff

/* Neutralise repeated CPU ids in @list (of @num_ents entries).
 *
 * The first occurrence of every value is kept; each later occurrence
 * is overwritten in place with CPU_SENTINEL.  Entries that already
 * hold CPU_SENTINEL are left alone.
 */
static void purge_dups(u32 *list, u32 num_ents)
{
	u32 first, later;

	for (first = 0; first < num_ents; first++) {
		const u32 keep = list[first];

		if (keep != CPU_SENTINEL) {
			for (later = first + 1; later < num_ents; later++) {
				if (list[later] == keep)
					list[later] = CPU_SENTINEL;
			}
		}
	}
}
476
477static int dr_cpu_size_response(int ncpus)
478{
479	return (sizeof(struct ds_data) +
480		sizeof(struct dr_cpu_tag) +
481		(sizeof(struct dr_cpu_resp_entry) * ncpus));
482}
483
484static void dr_cpu_init_response(struct ds_data *resp, u64 req_num,
485				 u64 handle, int resp_len, int ncpus,
486				 cpumask_t *mask, u32 default_stat)
487{
488	struct dr_cpu_resp_entry *ent;
489	struct dr_cpu_tag *tag;
490	int i, cpu;
491
492	tag = (struct dr_cpu_tag *) (resp + 1);
493	ent = (struct dr_cpu_resp_entry *) (tag + 1);
494
495	resp->tag.type = DS_DATA;
496	resp->tag.len = resp_len - sizeof(struct ds_msg_tag);
497	resp->handle = handle;
498	tag->req_num = req_num;
499	tag->type = DR_CPU_OK;
500	tag->num_records = ncpus;
501
502	i = 0;
503	for_each_cpu(cpu, mask) {
504		ent[i].cpu = cpu;
505		ent[i].result = DR_CPU_RES_OK;
506		ent[i].stat = default_stat;
507		i++;
508	}
509	BUG_ON(i != ncpus);
510}
511
512static void dr_cpu_mark(struct ds_data *resp, int cpu, int ncpus,
513			u32 res, u32 stat)
514{
515	struct dr_cpu_resp_entry *ent;
516	struct dr_cpu_tag *tag;
517	int i;
518
519	tag = (struct dr_cpu_tag *) (resp + 1);
520	ent = (struct dr_cpu_resp_entry *) (tag + 1);
521
522	for (i = 0; i < ncpus; i++) {
523		if (ent[i].cpu != cpu)
524			continue;
525		ent[i].result = res;
526		ent[i].stat = stat;
527		break;
528	}
529}
530
531static int dr_cpu_configure(struct ds_info *dp, struct ds_cap_state *cp,
532			    u64 req_num, cpumask_t *mask)
533{
534	struct ds_data *resp;
535	int resp_len, ncpus, cpu;
536	unsigned long flags;
537
538	ncpus = cpumask_weight(mask);
539	resp_len = dr_cpu_size_response(ncpus);
540	resp = kzalloc(resp_len, GFP_KERNEL);
541	if (!resp)
542		return -ENOMEM;
543
544	dr_cpu_init_response(resp, req_num, cp->handle,
545			     resp_len, ncpus, mask,
546			     DR_CPU_STAT_CONFIGURED);
547
548	mdesc_populate_present_mask(mask);
549	mdesc_fill_in_cpu_data(mask);
550
551	for_each_cpu(cpu, mask) {
552		int err;
553
554		printk(KERN_INFO "ds-%llu: Starting cpu %d...\n",
555		       dp->id, cpu);
556		err = cpu_up(cpu);
557		if (err) {
558			__u32 res = DR_CPU_RES_FAILURE;
559			__u32 stat = DR_CPU_STAT_UNCONFIGURED;
560
561			if (!cpu_present(cpu)) {
562				/* CPU not present in MD */
563				res = DR_CPU_RES_NOT_IN_MD;
564				stat = DR_CPU_STAT_NOT_PRESENT;
565			} else if (err == -ENODEV) {
566				/* CPU did not call in successfully */
567				res = DR_CPU_RES_CPU_NOT_RESPONDING;
568			}
569
570			printk(KERN_INFO "ds-%llu: CPU startup failed err=%d\n",
571			       dp->id, err);
572			dr_cpu_mark(resp, cpu, ncpus, res, stat);
573		}
574	}
575
576	spin_lock_irqsave(&ds_lock, flags);
577	__ds_send(dp->lp, resp, resp_len);
578	spin_unlock_irqrestore(&ds_lock, flags);
579
580	kfree(resp);
581
582	/* Redistribute IRQs, taking into account the new cpus.  */
583	fixup_irqs();
584
585	return 0;
586}
587
588static int dr_cpu_unconfigure(struct ds_info *dp,
589			      struct ds_cap_state *cp,
590			      u64 req_num,
591			      cpumask_t *mask)
592{
593	struct ds_data *resp;
594	int resp_len, ncpus, cpu;
595	unsigned long flags;
596
597	ncpus = cpumask_weight(mask);
598	resp_len = dr_cpu_size_response(ncpus);
599	resp = kzalloc(resp_len, GFP_KERNEL);
600	if (!resp)
601		return -ENOMEM;
602
603	dr_cpu_init_response(resp, req_num, cp->handle,
604			     resp_len, ncpus, mask,
605			     DR_CPU_STAT_UNCONFIGURED);
606
607	for_each_cpu(cpu, mask) {
608		int err;
609
610		printk(KERN_INFO "ds-%llu: Shutting down cpu %d...\n",
611		       dp->id, cpu);
612		err = cpu_down(cpu);
613		if (err)
614			dr_cpu_mark(resp, cpu, ncpus,
615				    DR_CPU_RES_FAILURE,
616				    DR_CPU_STAT_CONFIGURED);
617	}
618
619	spin_lock_irqsave(&ds_lock, flags);
620	__ds_send(dp->lp, resp, resp_len);
621	spin_unlock_irqrestore(&ds_lock, flags);
622
623	kfree(resp);
624
625	return 0;
626}
627
628static void dr_cpu_data(struct ds_info *dp, struct ds_cap_state *cp, void *buf,
629			int len)
630{
631	struct ds_data *data = buf;
632	struct dr_cpu_tag *tag = (struct dr_cpu_tag *) (data + 1);
633	u32 *cpu_list = (u32 *) (tag + 1);
634	u64 req_num = tag->req_num;
635	cpumask_t mask;
636	unsigned int i;
637	int err;
638
639	switch (tag->type) {
640	case DR_CPU_CONFIGURE:
641	case DR_CPU_UNCONFIGURE:
642	case DR_CPU_FORCE_UNCONFIGURE:
643		break;
644
645	default:
646		dr_cpu_send_error(dp, cp, data);
647		return;
648	}
649
650	purge_dups(cpu_list, tag->num_records);
651
652	cpumask_clear(&mask);
653	for (i = 0; i < tag->num_records; i++) {
654		if (cpu_list[i] == CPU_SENTINEL)
655			continue;
656
657		if (cpu_list[i] < nr_cpu_ids)
658			cpumask_set_cpu(cpu_list[i], &mask);
659	}
660
661	if (tag->type == DR_CPU_CONFIGURE)
662		err = dr_cpu_configure(dp, cp, req_num, &mask);
663	else
664		err = dr_cpu_unconfigure(dp, cp, req_num, &mask);
665
666	if (err)
667		dr_cpu_send_error(dp, cp, data);
668}
669#endif /* CONFIG_HOTPLUG_CPU */
670
/* Payload header of a "pri" service message.  ds_pri_data() only logs
 * req_num and type; the DS_PRI_* values are not otherwise used in
 * this file.
 */
struct ds_pri_msg {
	__u64				req_num;
	__u64				type;
#define DS_PRI_REQUEST			0x00
#define DS_PRI_DATA			0x01
#define DS_PRI_UPDATE			0x02
};
678
679static void ds_pri_data(struct ds_info *dp,
680			struct ds_cap_state *cp,
681			void *buf, int len)
682{
683	struct ds_data *dpkt = buf;
684	struct ds_pri_msg *rp;
685
686	rp = (struct ds_pri_msg *) (dpkt + 1);
687
688	printk(KERN_INFO "ds-%llu: PRI REQ [%llx:%llx], len=%d\n",
689	       dp->id, rp->req_num, rp->type, len);
690}
691
/* Common header of "var-config" messages.  This driver sends
 * DS_VAR_SET_REQ (ldom_set_var()) and accepts the two *_RESP types
 * (ds_var_data()).
 */
struct ds_var_hdr {
	__u32				type;
#define DS_VAR_SET_REQ			0x00
#define DS_VAR_DELETE_REQ		0x01
#define DS_VAR_SET_RESP			0x02
#define DS_VAR_DELETE_RESP		0x03
};
699
/* Variable set request.  ldom_set_var() stores the NUL-terminated
 * name immediately followed by the NUL-terminated value in
 * name_and_value.
 */
struct ds_var_set_msg {
	struct ds_var_hdr		hdr;
	char				name_and_value[0];
};
704
/* Layout of a variable delete request.  Nothing in this file builds
 * one.
 */
struct ds_var_delete_msg {
	struct ds_var_hdr		hdr;
	char				name[0];
};
709
/* Response to a variable set/delete request.  ds_var_data() copies
 * 'result' into ds_var_response; ldom_set_var() treats anything other
 * than DS_VAR_SUCCESS as failure.
 */
struct ds_var_resp {
	struct ds_var_hdr		hdr;
	__u32				result;
#define DS_VAR_SUCCESS			0x00
#define DS_VAR_NO_SPACE			0x01
#define DS_VAR_INVALID_VAR		0x02
#define DS_VAR_INVALID_VAL		0x03
#define DS_VAR_NOT_PRESENT		0x04
};
719
/* Hand-off between ldom_set_var() and ds_var_data().
 *
 * ds_var_mutex is held by ldom_set_var() across sending a request and
 * polling for its answer.  ds_var_data() stores the result in
 * ds_var_response and then sets ds_var_doorbell to 1; ldom_set_var()
 * clears both before sending and polls the doorbell.
 */
static DEFINE_MUTEX(ds_var_mutex);
static int ds_var_doorbell;
static int ds_var_response;
723
724static void ds_var_data(struct ds_info *dp,
725			struct ds_cap_state *cp,
726			void *buf, int len)
727{
728	struct ds_data *dpkt = buf;
729	struct ds_var_resp *rp;
730
731	rp = (struct ds_var_resp *) (dpkt + 1);
732
733	if (rp->hdr.type != DS_VAR_SET_RESP &&
734	    rp->hdr.type != DS_VAR_DELETE_RESP)
735		return;
736
737	ds_var_response = rp->result;
738	wmb();
739	ds_var_doorbell = 1;
740}
741
742void ldom_set_var(const char *var, const char *value)
743{
744	struct ds_cap_state *cp;
745	struct ds_info *dp;
746	unsigned long flags;
747
748	spin_lock_irqsave(&ds_lock, flags);
749	cp = NULL;
750	for (dp = ds_info_list; dp; dp = dp->next) {
751		struct ds_cap_state *tmp;
752
753		tmp = find_cap_by_string(dp, "var-config");
754		if (tmp && tmp->state == CAP_STATE_REGISTERED) {
755			cp = tmp;
756			break;
757		}
758	}
759	if (!cp) {
760		for (dp = ds_info_list; dp; dp = dp->next) {
761			struct ds_cap_state *tmp;
762
763			tmp = find_cap_by_string(dp, "var-config-backup");
764			if (tmp && tmp->state == CAP_STATE_REGISTERED) {
765				cp = tmp;
766				break;
767			}
768		}
769	}
770	spin_unlock_irqrestore(&ds_lock, flags);
771
772	if (cp) {
773		union {
774			struct {
775				struct ds_data		data;
776				struct ds_var_set_msg	msg;
777			} header;
778			char			all[512];
779		} pkt;
780		char  *base, *p;
781		int msg_len, loops;
782
783		if (strlen(var) + strlen(value) + 2 >
784		    sizeof(pkt) - sizeof(pkt.header)) {
785			printk(KERN_ERR PFX
786				"contents length: %zu, which more than max: %lu,"
787				"so could not set (%s) variable to (%s).\n",
788				strlen(var) + strlen(value) + 2,
789				sizeof(pkt) - sizeof(pkt.header), var, value);
790			return;
791		}
792
793		memset(&pkt, 0, sizeof(pkt));
794		pkt.header.data.tag.type = DS_DATA;
795		pkt.header.data.handle = cp->handle;
796		pkt.header.msg.hdr.type = DS_VAR_SET_REQ;
797		base = p = &pkt.header.msg.name_and_value[0];
798		strcpy(p, var);
799		p += strlen(var) + 1;
800		strcpy(p, value);
801		p += strlen(value) + 1;
802
803		msg_len = (sizeof(struct ds_data) +
804			   sizeof(struct ds_var_set_msg) +
805			   (p - base));
806		msg_len = (msg_len + 3) & ~3;
807		pkt.header.data.tag.len = msg_len - sizeof(struct ds_msg_tag);
808
809		mutex_lock(&ds_var_mutex);
810
811		spin_lock_irqsave(&ds_lock, flags);
812		ds_var_doorbell = 0;
813		ds_var_response = -1;
814
815		__ds_send(dp->lp, &pkt, msg_len);
816		spin_unlock_irqrestore(&ds_lock, flags);
817
818		loops = 1000;
819		while (ds_var_doorbell == 0) {
820			if (loops-- < 0)
821				break;
822			barrier();
823			udelay(100);
824		}
825
826		mutex_unlock(&ds_var_mutex);
827
828		if (ds_var_doorbell == 0 ||
829		    ds_var_response != DS_VAR_SUCCESS)
830			printk(KERN_ERR "ds-%llu: var-config [%s:%s] "
831			       "failed, response(%d).\n",
832			       dp->id, var, value,
833			       ds_var_response);
834	} else {
835		printk(KERN_ERR PFX "var-config not registered so "
836		       "could not set (%s) variable to (%s).\n",
837		       var, value);
838	}
839}
840
/* Buffer in which ldom_reboot() assembles the "boot <command>" string. */
static char full_boot_str[256] __attribute__((aligned(32)));
/* Set by ds_init() when the hypervisor reports the HV_GRP_REBOOT_DATA
 * API group; selects the hypervisor path in ldom_reboot().
 */
static int reboot_data_supported;
843
844void ldom_reboot(const char *boot_command)
845{
846	/* Don't bother with any of this if the boot_command
847	 * is empty.
848	 */
849	if (boot_command && strlen(boot_command)) {
850		unsigned long len;
851
852		snprintf(full_boot_str, sizeof(full_boot_str), "boot %s",
853			 boot_command);
854		len = strlen(full_boot_str);
855
856		if (reboot_data_supported) {
857			unsigned long ra = kimage_addr_to_ra(full_boot_str);
858			unsigned long hv_ret;
859
860			hv_ret = sun4v_reboot_data_set(ra, len);
861			if (hv_ret != HV_EOK)
862				pr_err("SUN4V: Unable to set reboot data "
863				       "hv_ret=%lu\n", hv_ret);
864		} else {
865			ldom_set_var("reboot-command", full_boot_str);
866		}
867	}
868	sun4v_mach_sir();
869}
870
/* Power the domain off by calling sun4v_mach_exit() with exit code 0. */
void ldom_power_off(void)
{
	sun4v_mach_exit(0);
}
875
876static void ds_conn_reset(struct ds_info *dp)
877{
878	printk(KERN_ERR "ds-%llu: ds_conn_reset() from %pf\n",
879	       dp->id, __builtin_return_address(0));
880}
881
882static int register_services(struct ds_info *dp)
883{
884	struct ldc_channel *lp = dp->lp;
885	int i;
886
887	for (i = 0; i < dp->num_ds_states; i++) {
888		struct {
889			struct ds_reg_req req;
890			u8 id_buf[256];
891		} pbuf;
892		struct ds_cap_state *cp = &dp->ds_states[i];
893		int err, msg_len;
894		u64 new_count;
895
896		if (cp->state == CAP_STATE_REGISTERED)
897			continue;
898
899		new_count = sched_clock() & 0xffffffff;
900		cp->handle = ((u64) i << 32) | new_count;
901
902		msg_len = (sizeof(struct ds_reg_req) +
903			   strlen(cp->service_id));
904
905		memset(&pbuf, 0, sizeof(pbuf));
906		pbuf.req.tag.type = DS_REG_REQ;
907		pbuf.req.tag.len = (msg_len - sizeof(struct ds_msg_tag));
908		pbuf.req.handle = cp->handle;
909		pbuf.req.major = 1;
910		pbuf.req.minor = 0;
911		strcpy(pbuf.req.svc_id, cp->service_id);
912
913		err = __ds_send(lp, &pbuf, msg_len);
914		if (err > 0)
915			cp->state = CAP_STATE_REG_SENT;
916	}
917	return 0;
918}
919
920static int ds_handshake(struct ds_info *dp, struct ds_msg_tag *pkt)
921{
922
923	if (dp->hs_state == DS_HS_START) {
924		if (pkt->type != DS_INIT_ACK)
925			goto conn_reset;
926
927		dp->hs_state = DS_HS_DONE;
928
929		return register_services(dp);
930	}
931
932	if (dp->hs_state != DS_HS_DONE)
933		goto conn_reset;
934
935	if (pkt->type == DS_REG_ACK) {
936		struct ds_reg_ack *ap = (struct ds_reg_ack *) pkt;
937		struct ds_cap_state *cp = find_cap(dp, ap->handle);
938
939		if (!cp) {
940			printk(KERN_ERR "ds-%llu: REG ACK for unknown "
941			       "handle %llx\n", dp->id, ap->handle);
942			return 0;
943		}
944		printk(KERN_INFO "ds-%llu: Registered %s service.\n",
945		       dp->id, cp->service_id);
946		cp->state = CAP_STATE_REGISTERED;
947	} else if (pkt->type == DS_REG_NACK) {
948		struct ds_reg_nack *np = (struct ds_reg_nack *) pkt;
949		struct ds_cap_state *cp = find_cap(dp, np->handle);
950
951		if (!cp) {
952			printk(KERN_ERR "ds-%llu: REG NACK for "
953			       "unknown handle %llx\n",
954			       dp->id, np->handle);
955			return 0;
956		}
957		cp->state = CAP_STATE_UNKNOWN;
958	}
959
960	return 0;
961
962conn_reset:
963	ds_conn_reset(dp);
964	return -ECONNRESET;
965}
966
967static void __send_ds_nack(struct ds_info *dp, u64 handle)
968{
969	struct ds_data_nack nack = {
970		.tag = {
971			.type = DS_NACK,
972			.len = (sizeof(struct ds_data_nack) -
973				sizeof(struct ds_msg_tag)),
974		},
975		.handle = handle,
976		.result = DS_INV_HDL,
977	};
978
979	__ds_send(dp->lp, &nack, sizeof(nack));
980}
981
/* Queue of received data messages awaiting the worker thread:
 * ds_data() appends entries and wakes ds_wait, process_ds_work()
 * drains the list.
 */
static LIST_HEAD(ds_work_list);
static DECLARE_WAIT_QUEUE_HEAD(ds_wait);
984
/* One queued data message.  Allocated by ds_data() with room for the
 * message copy in req[], freed by process_ds_work().
 */
struct ds_queue_entry {
	struct list_head		list;		/* Link in ds_work_list. */
	struct ds_info			*dp;		/* Port it arrived on. */
	int				req_len;	/* Passed to the handler as 'len'. */
	int				__pad;
	u64				req[0];		/* Copy of the message, tag first. */
};
992
993static void process_ds_work(void)
994{
995	struct ds_queue_entry *qp, *tmp;
996	unsigned long flags;
997	LIST_HEAD(todo);
998
999	spin_lock_irqsave(&ds_lock, flags);
1000	list_splice_init(&ds_work_list, &todo);
1001	spin_unlock_irqrestore(&ds_lock, flags);
1002
1003	list_for_each_entry_safe(qp, tmp, &todo, list) {
1004		struct ds_data *dpkt = (struct ds_data *) qp->req;
1005		struct ds_info *dp = qp->dp;
1006		struct ds_cap_state *cp = find_cap(dp, dpkt->handle);
1007		int req_len = qp->req_len;
1008
1009		if (!cp) {
1010			printk(KERN_ERR "ds-%llu: Data for unknown "
1011			       "handle %llu\n",
1012			       dp->id, dpkt->handle);
1013
1014			spin_lock_irqsave(&ds_lock, flags);
1015			__send_ds_nack(dp, dpkt->handle);
1016			spin_unlock_irqrestore(&ds_lock, flags);
1017		} else {
1018			cp->data(dp, cp, dpkt, req_len);
1019		}
1020
1021		list_del(&qp->list);
1022		kfree(qp);
1023	}
1024}
1025
/* Body of the "kldomd" worker thread started by ds_init().
 *
 * Sleeps on ds_wait until work is queued, then runs
 * process_ds_work().  Exits with 0 once kthread_should_stop() is true.
 */
static int ds_thread(void *__unused)
{
	DEFINE_WAIT(wait);

	while (1) {
		/* The wait entry is queued before the list is tested, and
		 * we only sleep if the list is still empty at that point.
		 */
		prepare_to_wait(&ds_wait, &wait, TASK_INTERRUPTIBLE);
		if (list_empty(&ds_work_list))
			schedule();
		finish_wait(&ds_wait, &wait);

		/* Checked before processing, so pending work is not
		 * handled once a stop has been requested.
		 */
		if (kthread_should_stop())
			break;

		process_ds_work();
	}

	return 0;
}
1044
1045static int ds_data(struct ds_info *dp, struct ds_msg_tag *pkt, int len)
1046{
1047	struct ds_data *dpkt = (struct ds_data *) pkt;
1048	struct ds_queue_entry *qp;
1049
1050	qp = kmalloc(sizeof(struct ds_queue_entry) + len, GFP_ATOMIC);
1051	if (!qp) {
1052		__send_ds_nack(dp, dpkt->handle);
1053	} else {
1054		qp->dp = dp;
1055		memcpy(&qp->req, pkt, len);
1056		list_add_tail(&qp->list, &ds_work_list);
1057		wake_up(&ds_wait);
1058	}
1059	return 0;
1060}
1061
1062static void ds_up(struct ds_info *dp)
1063{
1064	struct ldc_channel *lp = dp->lp;
1065	struct ds_ver_req req;
1066	int err;
1067
1068	req.tag.type = DS_INIT_REQ;
1069	req.tag.len = sizeof(req) - sizeof(struct ds_msg_tag);
1070	req.ver.major = 1;
1071	req.ver.minor = 0;
1072
1073	err = __ds_send(lp, &req, sizeof(req));
1074	if (err > 0)
1075		dp->hs_state = DS_HS_START;
1076}
1077
1078static void ds_reset(struct ds_info *dp)
1079{
1080	int i;
1081
1082	dp->hs_state = 0;
1083
1084	for (i = 0; i < dp->num_ds_states; i++) {
1085		struct ds_cap_state *cp = &dp->ds_states[i];
1086
1087		cp->state = CAP_STATE_UNKNOWN;
1088	}
1089}
1090
1091static void ds_event(void *arg, int event)
1092{
1093	struct ds_info *dp = arg;
1094	struct ldc_channel *lp = dp->lp;
1095	unsigned long flags;
1096	int err;
1097
1098	spin_lock_irqsave(&ds_lock, flags);
1099
1100	if (event == LDC_EVENT_UP) {
1101		ds_up(dp);
1102		spin_unlock_irqrestore(&ds_lock, flags);
1103		return;
1104	}
1105
1106	if (event == LDC_EVENT_RESET) {
1107		ds_reset(dp);
1108		spin_unlock_irqrestore(&ds_lock, flags);
1109		return;
1110	}
1111
1112	if (event != LDC_EVENT_DATA_READY) {
1113		printk(KERN_WARNING "ds-%llu: Unexpected LDC event %d\n",
1114		       dp->id, event);
1115		spin_unlock_irqrestore(&ds_lock, flags);
1116		return;
1117	}
1118
1119	err = 0;
1120	while (1) {
1121		struct ds_msg_tag *tag;
1122
1123		err = ldc_read(lp, dp->rcv_buf, sizeof(*tag));
1124
1125		if (unlikely(err < 0)) {
1126			if (err == -ECONNRESET)
1127				ds_conn_reset(dp);
1128			break;
1129		}
1130		if (err == 0)
1131			break;
1132
1133		tag = dp->rcv_buf;
1134		err = ldc_read(lp, tag + 1, tag->len);
1135
1136		if (unlikely(err < 0)) {
1137			if (err == -ECONNRESET)
1138				ds_conn_reset(dp);
1139			break;
1140		}
1141		if (err < tag->len)
1142			break;
1143
1144		if (tag->type < DS_DATA)
1145			err = ds_handshake(dp, dp->rcv_buf);
1146		else
1147			err = ds_data(dp, dp->rcv_buf,
1148				      sizeof(*tag) + err);
1149		if (err == -ECONNRESET)
1150			break;
1151	}
1152
1153	spin_unlock_irqrestore(&ds_lock, flags);
1154}
1155
/* Probe one "domain-services-port" VIO device.
 *
 * Allocates the per-port ds_info, its receive buffer and its private
 * copy of the service table, then allocates and binds the LDC channel
 * and links the port into ds_info_list.  Returns 0 on success or a
 * negative errno; on failure everything acquired so far is released
 * in reverse order through the out_* labels.
 */
static int ds_probe(struct vio_dev *vdev, const struct vio_device_id *id)
{
	static int ds_version_printed;
	struct ldc_channel_config ds_cfg = {
		.event		= ds_event,
		.mtu		= 4096,
		.mode		= LDC_MODE_STREAM,
	};
	struct mdesc_handle *hp;
	struct ldc_channel *lp;
	struct ds_info *dp;
	const u64 *val;
	int err, i;

	/* Print the driver banner for the first probed device only. */
	if (ds_version_printed++ == 0)
		printk(KERN_INFO "%s", version);

	dp = kzalloc(sizeof(*dp), GFP_KERNEL);
	/* err stays -ENOMEM for all allocation failures below. */
	err = -ENOMEM;
	if (!dp)
		goto out_err;

	/* Use the machine description "id" property, if present, as
	 * the port id shown in log messages; otherwise it stays 0.
	 */
	hp = mdesc_grab();
	val = mdesc_get_property(hp, vdev->mp, "id", NULL);
	if (val)
		dp->id = *val;
	mdesc_release(hp);

	dp->rcv_buf = kzalloc(4096, GFP_KERNEL);
	if (!dp->rcv_buf)
		goto out_free_dp;

	dp->rcv_buf_len = 4096;

	dp->ds_states = kmemdup(ds_states_template,
				sizeof(ds_states_template), GFP_KERNEL);
	if (!dp->ds_states)
		goto out_free_rcv_buf;

	dp->num_ds_states = ARRAY_SIZE(ds_states_template);

	/* Seed each handle with its slot index; register_services()
	 * later fills in the lower half.
	 */
	for (i = 0; i < dp->num_ds_states; i++)
		dp->ds_states[i].handle = ((u64)i << 32);

	ds_cfg.tx_irq = vdev->tx_irq;
	ds_cfg.rx_irq = vdev->rx_irq;

	lp = ldc_alloc(vdev->channel_id, &ds_cfg, dp, "DS");
	if (IS_ERR(lp)) {
		err = PTR_ERR(lp);
		goto out_free_ds_states;
	}
	dp->lp = lp;

	err = ldc_bind(lp);
	if (err)
		goto out_free_ldc;

	/* Publish the port; err is 0 here. */
	spin_lock_irq(&ds_lock);
	dp->next = ds_info_list;
	ds_info_list = dp;
	spin_unlock_irq(&ds_lock);

	return err;

out_free_ldc:
	ldc_free(dp->lp);

out_free_ds_states:
	kfree(dp->ds_states);

out_free_rcv_buf:
	kfree(dp->rcv_buf);

out_free_dp:
	kfree(dp);

out_err:
	return err;
}
1236
/* Device removal callback.  Does nothing and reports success; the
 * resources set up by ds_probe() are not released here.
 */
static int ds_remove(struct vio_dev *vdev)
{
	return 0;
}
1241
/* VIO device types handled by this driver; the empty entry terminates
 * the table.
 */
static const struct vio_device_id ds_match[] = {
	{
		.type = "domain-services-port",
	},
	{},
};
1248
/* Driver descriptor registered with the VIO bus by ds_init(). */
static struct vio_driver ds_driver = {
	.id_table	= ds_match,
	.probe		= ds_probe,
	.remove		= ds_remove,
	.name		= "ds",
};
1255
1256static int __init ds_init(void)
1257{
1258	unsigned long hv_ret, major, minor;
1259
1260	if (tlb_type == hypervisor) {
1261		hv_ret = sun4v_get_version(HV_GRP_REBOOT_DATA, &major, &minor);
1262		if (hv_ret == HV_EOK) {
1263			pr_info("SUN4V: Reboot data supported (maj=%lu,min=%lu).\n",
1264				major, minor);
1265			reboot_data_supported = 1;
1266		}
1267	}
1268	kthread_run(ds_thread, NULL, "kldomd");
1269
1270	return vio_register_driver(&ds_driver);
1271}
1272
1273fs_initcall(ds_init);
1274