1/*
2 * handling kvm guest interrupts
3 *
4 * Copyright IBM Corp. 2008, 2015
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License (version 2 only)
8 * as published by the Free Software Foundation.
9 *
10 *    Author(s): Carsten Otte <cotte@de.ibm.com>
11 */
12
13#include <linux/interrupt.h>
14#include <linux/kvm_host.h>
15#include <linux/hrtimer.h>
16#include <linux/mmu_context.h>
17#include <linux/signal.h>
18#include <linux/slab.h>
19#include <linux/bitmap.h>
20#include <linux/vmalloc.h>
21#include <asm/asm-offsets.h>
22#include <asm/dis.h>
23#include <asm/uaccess.h>
24#include <asm/sclp.h>
25#include <asm/isc.h>
26#include "kvm-s390.h"
27#include "gaccess.h"
28#include "trace-s390.h"
29
30#define IOINT_SCHID_MASK 0x0000ffff
31#define IOINT_SSID_MASK 0x00030000
32#define IOINT_CSSID_MASK 0x03fc0000
33#define IOINT_AI_MASK 0x04000000
34#define PFAULT_INIT 0x0600
35#define PFAULT_DONE 0x0680
36#define VIRTIO_PARAM 0x0d00
37
38int psw_extint_disabled(struct kvm_vcpu *vcpu)
39{
40	return !(vcpu->arch.sie_block->gpsw.mask & PSW_MASK_EXT);
41}
42
43static int psw_ioint_disabled(struct kvm_vcpu *vcpu)
44{
45	return !(vcpu->arch.sie_block->gpsw.mask & PSW_MASK_IO);
46}
47
48static int psw_mchk_disabled(struct kvm_vcpu *vcpu)
49{
50	return !(vcpu->arch.sie_block->gpsw.mask & PSW_MASK_MCHECK);
51}
52
53static int psw_interrupts_disabled(struct kvm_vcpu *vcpu)
54{
55	if ((vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PER) ||
56	    (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_IO) ||
57	    (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_EXT))
58		return 0;
59	return 1;
60}
61
62static int ckc_interrupts_enabled(struct kvm_vcpu *vcpu)
63{
64	if (psw_extint_disabled(vcpu) ||
65	    !(vcpu->arch.sie_block->gcr[0] & 0x800ul))
66		return 0;
67	if (guestdbg_enabled(vcpu) && guestdbg_sstep_enabled(vcpu))
68		/* No timer interrupts when single stepping */
69		return 0;
70	return 1;
71}
72
73static int ckc_irq_pending(struct kvm_vcpu *vcpu)
74{
75	if (!(vcpu->arch.sie_block->ckc <
76	      get_tod_clock_fast() + vcpu->arch.sie_block->epoch))
77		return 0;
78	return ckc_interrupts_enabled(vcpu);
79}
80
81static int cpu_timer_interrupts_enabled(struct kvm_vcpu *vcpu)
82{
83	return !psw_extint_disabled(vcpu) &&
84	       (vcpu->arch.sie_block->gcr[0] & 0x400ul);
85}
86
87static int cpu_timer_irq_pending(struct kvm_vcpu *vcpu)
88{
89	return (vcpu->arch.sie_block->cputm >> 63) &&
90	       cpu_timer_interrupts_enabled(vcpu);
91}
92
93static inline int is_ioirq(unsigned long irq_type)
94{
95	return ((irq_type >= IRQ_PEND_IO_ISC_0) &&
96		(irq_type <= IRQ_PEND_IO_ISC_7));
97}
98
99static uint64_t isc_to_isc_bits(int isc)
100{
101	return (0x80 >> isc) << 24;
102}
103
104static inline u8 int_word_to_isc(u32 int_word)
105{
106	return (int_word & 0x38000000) >> 27;
107}
108
109static inline unsigned long pending_floating_irqs(struct kvm_vcpu *vcpu)
110{
111	return vcpu->kvm->arch.float_int.pending_irqs;
112}
113
114static inline unsigned long pending_local_irqs(struct kvm_vcpu *vcpu)
115{
116	return vcpu->arch.local_int.pending_irqs;
117}
118
119static unsigned long disable_iscs(struct kvm_vcpu *vcpu,
120				   unsigned long active_mask)
121{
122	int i;
123
124	for (i = 0; i <= MAX_ISC; i++)
125		if (!(vcpu->arch.sie_block->gcr[6] & isc_to_isc_bits(i)))
126			active_mask &= ~(1UL << (IRQ_PEND_IO_ISC_0 + i));
127
128	return active_mask;
129}
130
131static unsigned long deliverable_irqs(struct kvm_vcpu *vcpu)
132{
133	unsigned long active_mask;
134
135	active_mask = pending_local_irqs(vcpu);
136	active_mask |= pending_floating_irqs(vcpu);
137
138	if (psw_extint_disabled(vcpu))
139		active_mask &= ~IRQ_PEND_EXT_MASK;
140	if (psw_ioint_disabled(vcpu))
141		active_mask &= ~IRQ_PEND_IO_MASK;
142	else
143		active_mask = disable_iscs(vcpu, active_mask);
144	if (!(vcpu->arch.sie_block->gcr[0] & 0x2000ul))
145		__clear_bit(IRQ_PEND_EXT_EXTERNAL, &active_mask);
146	if (!(vcpu->arch.sie_block->gcr[0] & 0x4000ul))
147		__clear_bit(IRQ_PEND_EXT_EMERGENCY, &active_mask);
148	if (!(vcpu->arch.sie_block->gcr[0] & 0x800ul))
149		__clear_bit(IRQ_PEND_EXT_CLOCK_COMP, &active_mask);
150	if (!(vcpu->arch.sie_block->gcr[0] & 0x400ul))
151		__clear_bit(IRQ_PEND_EXT_CPU_TIMER, &active_mask);
152	if (!(vcpu->arch.sie_block->gcr[0] & 0x200ul))
153		__clear_bit(IRQ_PEND_EXT_SERVICE, &active_mask);
154	if (psw_mchk_disabled(vcpu))
155		active_mask &= ~IRQ_PEND_MCHK_MASK;
156	if (!(vcpu->arch.sie_block->gcr[14] &
157	      vcpu->kvm->arch.float_int.mchk.cr14))
158		__clear_bit(IRQ_PEND_MCHK_REP, &active_mask);
159
160	/*
161	 * STOP irqs will never be actively delivered. They are triggered via
162	 * intercept requests and cleared when the stop intercept is performed.
163	 */
164	__clear_bit(IRQ_PEND_SIGP_STOP, &active_mask);
165
166	return active_mask;
167}
168
169static void __set_cpu_idle(struct kvm_vcpu *vcpu)
170{
171	atomic_set_mask(CPUSTAT_WAIT, &vcpu->arch.sie_block->cpuflags);
172	set_bit(vcpu->vcpu_id, vcpu->arch.local_int.float_int->idle_mask);
173}
174
175static void __unset_cpu_idle(struct kvm_vcpu *vcpu)
176{
177	atomic_clear_mask(CPUSTAT_WAIT, &vcpu->arch.sie_block->cpuflags);
178	clear_bit(vcpu->vcpu_id, vcpu->arch.local_int.float_int->idle_mask);
179}
180
181static void __reset_intercept_indicators(struct kvm_vcpu *vcpu)
182{
183	atomic_clear_mask(CPUSTAT_IO_INT | CPUSTAT_EXT_INT | CPUSTAT_STOP_INT,
184			  &vcpu->arch.sie_block->cpuflags);
185	vcpu->arch.sie_block->lctl = 0x0000;
186	vcpu->arch.sie_block->ictl &= ~(ICTL_LPSW | ICTL_STCTL | ICTL_PINT);
187
188	if (guestdbg_enabled(vcpu)) {
189		vcpu->arch.sie_block->lctl |= (LCTL_CR0 | LCTL_CR9 |
190					       LCTL_CR10 | LCTL_CR11);
191		vcpu->arch.sie_block->ictl |= (ICTL_STCTL | ICTL_PINT);
192	}
193}
194
195static void __set_cpuflag(struct kvm_vcpu *vcpu, u32 flag)
196{
197	atomic_set_mask(flag, &vcpu->arch.sie_block->cpuflags);
198}
199
200static void set_intercept_indicators_io(struct kvm_vcpu *vcpu)
201{
202	if (!(pending_floating_irqs(vcpu) & IRQ_PEND_IO_MASK))
203		return;
204	else if (psw_ioint_disabled(vcpu))
205		__set_cpuflag(vcpu, CPUSTAT_IO_INT);
206	else
207		vcpu->arch.sie_block->lctl |= LCTL_CR6;
208}
209
210static void set_intercept_indicators_ext(struct kvm_vcpu *vcpu)
211{
212	if (!(pending_local_irqs(vcpu) & IRQ_PEND_EXT_MASK))
213		return;
214	if (psw_extint_disabled(vcpu))
215		__set_cpuflag(vcpu, CPUSTAT_EXT_INT);
216	else
217		vcpu->arch.sie_block->lctl |= LCTL_CR0;
218}
219
220static void set_intercept_indicators_mchk(struct kvm_vcpu *vcpu)
221{
222	if (!(pending_local_irqs(vcpu) & IRQ_PEND_MCHK_MASK))
223		return;
224	if (psw_mchk_disabled(vcpu))
225		vcpu->arch.sie_block->ictl |= ICTL_LPSW;
226	else
227		vcpu->arch.sie_block->lctl |= LCTL_CR14;
228}
229
230static void set_intercept_indicators_stop(struct kvm_vcpu *vcpu)
231{
232	if (kvm_s390_is_stop_irq_pending(vcpu))
233		__set_cpuflag(vcpu, CPUSTAT_STOP_INT);
234}
235
236/* Set interception request for non-deliverable interrupts */
237static void set_intercept_indicators(struct kvm_vcpu *vcpu)
238{
239	set_intercept_indicators_io(vcpu);
240	set_intercept_indicators_ext(vcpu);
241	set_intercept_indicators_mchk(vcpu);
242	set_intercept_indicators_stop(vcpu);
243}
244
245static u16 get_ilc(struct kvm_vcpu *vcpu)
246{
247	switch (vcpu->arch.sie_block->icptcode) {
248	case ICPT_INST:
249	case ICPT_INSTPROGI:
250	case ICPT_OPEREXC:
251	case ICPT_PARTEXEC:
252	case ICPT_IOINST:
253		/* last instruction only stored for these icptcodes */
254		return insn_length(vcpu->arch.sie_block->ipa >> 8);
255	case ICPT_PROGI:
256		return vcpu->arch.sie_block->pgmilc;
257	default:
258		return 0;
259	}
260}
261
262static int __must_check __deliver_cpu_timer(struct kvm_vcpu *vcpu)
263{
264	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
265	int rc;
266
267	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, KVM_S390_INT_CPU_TIMER,
268					 0, 0);
269
270	rc  = put_guest_lc(vcpu, EXT_IRQ_CPU_TIMER,
271			   (u16 *)__LC_EXT_INT_CODE);
272	rc |= put_guest_lc(vcpu, 0, (u16 *)__LC_EXT_CPU_ADDR);
273	rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
274			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
275	rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
276			    &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
277	clear_bit(IRQ_PEND_EXT_CPU_TIMER, &li->pending_irqs);
278	return rc ? -EFAULT : 0;
279}
280
281static int __must_check __deliver_ckc(struct kvm_vcpu *vcpu)
282{
283	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
284	int rc;
285
286	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, KVM_S390_INT_CLOCK_COMP,
287					 0, 0);
288
289	rc  = put_guest_lc(vcpu, EXT_IRQ_CLK_COMP,
290			   (u16 __user *)__LC_EXT_INT_CODE);
291	rc |= put_guest_lc(vcpu, 0, (u16 *)__LC_EXT_CPU_ADDR);
292	rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
293			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
294	rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
295			    &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
296	clear_bit(IRQ_PEND_EXT_CLOCK_COMP, &li->pending_irqs);
297	return rc ? -EFAULT : 0;
298}
299
300static int __must_check __deliver_pfault_init(struct kvm_vcpu *vcpu)
301{
302	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
303	struct kvm_s390_ext_info ext;
304	int rc;
305
306	spin_lock(&li->lock);
307	ext = li->irq.ext;
308	clear_bit(IRQ_PEND_PFAULT_INIT, &li->pending_irqs);
309	li->irq.ext.ext_params2 = 0;
310	spin_unlock(&li->lock);
311
312	VCPU_EVENT(vcpu, 4, "interrupt: pfault init parm:%x,parm64:%llx",
313		   0, ext.ext_params2);
314	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id,
315					 KVM_S390_INT_PFAULT_INIT,
316					 0, ext.ext_params2);
317
318	rc  = put_guest_lc(vcpu, EXT_IRQ_CP_SERVICE, (u16 *) __LC_EXT_INT_CODE);
319	rc |= put_guest_lc(vcpu, PFAULT_INIT, (u16 *) __LC_EXT_CPU_ADDR);
320	rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
321			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
322	rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
323			    &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
324	rc |= put_guest_lc(vcpu, ext.ext_params2, (u64 *) __LC_EXT_PARAMS2);
325	return rc ? -EFAULT : 0;
326}
327
328static int __must_check __deliver_machine_check(struct kvm_vcpu *vcpu)
329{
330	struct kvm_s390_float_interrupt *fi = &vcpu->kvm->arch.float_int;
331	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
332	struct kvm_s390_mchk_info mchk = {};
333	unsigned long adtl_status_addr;
334	int deliver = 0;
335	int rc = 0;
336
337	spin_lock(&fi->lock);
338	spin_lock(&li->lock);
339	if (test_bit(IRQ_PEND_MCHK_EX, &li->pending_irqs) ||
340	    test_bit(IRQ_PEND_MCHK_REP, &li->pending_irqs)) {
341		/*
342		 * If there was an exigent machine check pending, then any
343		 * repressible machine checks that might have been pending
344		 * are indicated along with it, so always clear bits for
345		 * repressible and exigent interrupts
346		 */
347		mchk = li->irq.mchk;
348		clear_bit(IRQ_PEND_MCHK_EX, &li->pending_irqs);
349		clear_bit(IRQ_PEND_MCHK_REP, &li->pending_irqs);
350		memset(&li->irq.mchk, 0, sizeof(mchk));
351		deliver = 1;
352	}
353	/*
354	 * We indicate floating repressible conditions along with
355	 * other pending conditions. Channel Report Pending and Channel
356	 * Subsystem damage are the only two and and are indicated by
357	 * bits in mcic and masked in cr14.
358	 */
359	if (test_and_clear_bit(IRQ_PEND_MCHK_REP, &fi->pending_irqs)) {
360		mchk.mcic |= fi->mchk.mcic;
361		mchk.cr14 |= fi->mchk.cr14;
362		memset(&fi->mchk, 0, sizeof(mchk));
363		deliver = 1;
364	}
365	spin_unlock(&li->lock);
366	spin_unlock(&fi->lock);
367
368	if (deliver) {
369		VCPU_EVENT(vcpu, 4, "interrupt: machine check mcic=%llx",
370			   mchk.mcic);
371		trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id,
372						 KVM_S390_MCHK,
373						 mchk.cr14, mchk.mcic);
374
375		rc  = kvm_s390_vcpu_store_status(vcpu,
376						 KVM_S390_STORE_STATUS_PREFIXED);
377		rc |= read_guest_lc(vcpu, __LC_VX_SAVE_AREA_ADDR,
378				    &adtl_status_addr,
379				    sizeof(unsigned long));
380		rc |= kvm_s390_vcpu_store_adtl_status(vcpu,
381						      adtl_status_addr);
382		rc |= put_guest_lc(vcpu, mchk.mcic,
383				   (u64 __user *) __LC_MCCK_CODE);
384		rc |= put_guest_lc(vcpu, mchk.failing_storage_address,
385				   (u64 __user *) __LC_MCCK_FAIL_STOR_ADDR);
386		rc |= write_guest_lc(vcpu, __LC_PSW_SAVE_AREA,
387				     &mchk.fixed_logout,
388				     sizeof(mchk.fixed_logout));
389		rc |= write_guest_lc(vcpu, __LC_MCK_OLD_PSW,
390				     &vcpu->arch.sie_block->gpsw,
391				     sizeof(psw_t));
392		rc |= read_guest_lc(vcpu, __LC_MCK_NEW_PSW,
393				    &vcpu->arch.sie_block->gpsw,
394				    sizeof(psw_t));
395	}
396	return rc ? -EFAULT : 0;
397}
398
399static int __must_check __deliver_restart(struct kvm_vcpu *vcpu)
400{
401	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
402	int rc;
403
404	VCPU_EVENT(vcpu, 4, "%s", "interrupt: cpu restart");
405	vcpu->stat.deliver_restart_signal++;
406	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, KVM_S390_RESTART, 0, 0);
407
408	rc  = write_guest_lc(vcpu,
409			     offsetof(struct _lowcore, restart_old_psw),
410			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
411	rc |= read_guest_lc(vcpu, offsetof(struct _lowcore, restart_psw),
412			    &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
413	clear_bit(IRQ_PEND_RESTART, &li->pending_irqs);
414	return rc ? -EFAULT : 0;
415}
416
417static int __must_check __deliver_set_prefix(struct kvm_vcpu *vcpu)
418{
419	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
420	struct kvm_s390_prefix_info prefix;
421
422	spin_lock(&li->lock);
423	prefix = li->irq.prefix;
424	li->irq.prefix.address = 0;
425	clear_bit(IRQ_PEND_SET_PREFIX, &li->pending_irqs);
426	spin_unlock(&li->lock);
427
428	VCPU_EVENT(vcpu, 4, "interrupt: set prefix to %x", prefix.address);
429	vcpu->stat.deliver_prefix_signal++;
430	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id,
431					 KVM_S390_SIGP_SET_PREFIX,
432					 prefix.address, 0);
433
434	kvm_s390_set_prefix(vcpu, prefix.address);
435	return 0;
436}
437
438static int __must_check __deliver_emergency_signal(struct kvm_vcpu *vcpu)
439{
440	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
441	int rc;
442	int cpu_addr;
443
444	spin_lock(&li->lock);
445	cpu_addr = find_first_bit(li->sigp_emerg_pending, KVM_MAX_VCPUS);
446	clear_bit(cpu_addr, li->sigp_emerg_pending);
447	if (bitmap_empty(li->sigp_emerg_pending, KVM_MAX_VCPUS))
448		clear_bit(IRQ_PEND_EXT_EMERGENCY, &li->pending_irqs);
449	spin_unlock(&li->lock);
450
451	VCPU_EVENT(vcpu, 4, "%s", "interrupt: sigp emerg");
452	vcpu->stat.deliver_emergency_signal++;
453	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, KVM_S390_INT_EMERGENCY,
454					 cpu_addr, 0);
455
456	rc  = put_guest_lc(vcpu, EXT_IRQ_EMERGENCY_SIG,
457			   (u16 *)__LC_EXT_INT_CODE);
458	rc |= put_guest_lc(vcpu, cpu_addr, (u16 *)__LC_EXT_CPU_ADDR);
459	rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
460			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
461	rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
462			    &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
463	return rc ? -EFAULT : 0;
464}
465
466static int __must_check __deliver_external_call(struct kvm_vcpu *vcpu)
467{
468	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
469	struct kvm_s390_extcall_info extcall;
470	int rc;
471
472	spin_lock(&li->lock);
473	extcall = li->irq.extcall;
474	li->irq.extcall.code = 0;
475	clear_bit(IRQ_PEND_EXT_EXTERNAL, &li->pending_irqs);
476	spin_unlock(&li->lock);
477
478	VCPU_EVENT(vcpu, 4, "%s", "interrupt: sigp ext call");
479	vcpu->stat.deliver_external_call++;
480	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id,
481					 KVM_S390_INT_EXTERNAL_CALL,
482					 extcall.code, 0);
483
484	rc  = put_guest_lc(vcpu, EXT_IRQ_EXTERNAL_CALL,
485			   (u16 *)__LC_EXT_INT_CODE);
486	rc |= put_guest_lc(vcpu, extcall.code, (u16 *)__LC_EXT_CPU_ADDR);
487	rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
488			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
489	rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW, &vcpu->arch.sie_block->gpsw,
490			    sizeof(psw_t));
491	return rc ? -EFAULT : 0;
492}
493
494static int __must_check __deliver_prog(struct kvm_vcpu *vcpu)
495{
496	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
497	struct kvm_s390_pgm_info pgm_info;
498	int rc = 0, nullifying = false;
499	u16 ilc = get_ilc(vcpu);
500
501	spin_lock(&li->lock);
502	pgm_info = li->irq.pgm;
503	clear_bit(IRQ_PEND_PROG, &li->pending_irqs);
504	memset(&li->irq.pgm, 0, sizeof(pgm_info));
505	spin_unlock(&li->lock);
506
507	VCPU_EVENT(vcpu, 4, "interrupt: pgm check code:%x, ilc:%x",
508		   pgm_info.code, ilc);
509	vcpu->stat.deliver_program_int++;
510	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, KVM_S390_PROGRAM_INT,
511					 pgm_info.code, 0);
512
513	switch (pgm_info.code & ~PGM_PER) {
514	case PGM_AFX_TRANSLATION:
515	case PGM_ASX_TRANSLATION:
516	case PGM_EX_TRANSLATION:
517	case PGM_LFX_TRANSLATION:
518	case PGM_LSTE_SEQUENCE:
519	case PGM_LSX_TRANSLATION:
520	case PGM_LX_TRANSLATION:
521	case PGM_PRIMARY_AUTHORITY:
522	case PGM_SECONDARY_AUTHORITY:
523		nullifying = true;
524		/* fall through */
525	case PGM_SPACE_SWITCH:
526		rc = put_guest_lc(vcpu, pgm_info.trans_exc_code,
527				  (u64 *)__LC_TRANS_EXC_CODE);
528		break;
529	case PGM_ALEN_TRANSLATION:
530	case PGM_ALE_SEQUENCE:
531	case PGM_ASTE_INSTANCE:
532	case PGM_ASTE_SEQUENCE:
533	case PGM_ASTE_VALIDITY:
534	case PGM_EXTENDED_AUTHORITY:
535		rc = put_guest_lc(vcpu, pgm_info.exc_access_id,
536				  (u8 *)__LC_EXC_ACCESS_ID);
537		nullifying = true;
538		break;
539	case PGM_ASCE_TYPE:
540	case PGM_PAGE_TRANSLATION:
541	case PGM_REGION_FIRST_TRANS:
542	case PGM_REGION_SECOND_TRANS:
543	case PGM_REGION_THIRD_TRANS:
544	case PGM_SEGMENT_TRANSLATION:
545		rc = put_guest_lc(vcpu, pgm_info.trans_exc_code,
546				  (u64 *)__LC_TRANS_EXC_CODE);
547		rc |= put_guest_lc(vcpu, pgm_info.exc_access_id,
548				   (u8 *)__LC_EXC_ACCESS_ID);
549		rc |= put_guest_lc(vcpu, pgm_info.op_access_id,
550				   (u8 *)__LC_OP_ACCESS_ID);
551		nullifying = true;
552		break;
553	case PGM_MONITOR:
554		rc = put_guest_lc(vcpu, pgm_info.mon_class_nr,
555				  (u16 *)__LC_MON_CLASS_NR);
556		rc |= put_guest_lc(vcpu, pgm_info.mon_code,
557				   (u64 *)__LC_MON_CODE);
558		break;
559	case PGM_VECTOR_PROCESSING:
560	case PGM_DATA:
561		rc = put_guest_lc(vcpu, pgm_info.data_exc_code,
562				  (u32 *)__LC_DATA_EXC_CODE);
563		break;
564	case PGM_PROTECTION:
565		rc = put_guest_lc(vcpu, pgm_info.trans_exc_code,
566				  (u64 *)__LC_TRANS_EXC_CODE);
567		rc |= put_guest_lc(vcpu, pgm_info.exc_access_id,
568				   (u8 *)__LC_EXC_ACCESS_ID);
569		break;
570	case PGM_STACK_FULL:
571	case PGM_STACK_EMPTY:
572	case PGM_STACK_SPECIFICATION:
573	case PGM_STACK_TYPE:
574	case PGM_STACK_OPERATION:
575	case PGM_TRACE_TABEL:
576	case PGM_CRYPTO_OPERATION:
577		nullifying = true;
578		break;
579	}
580
581	if (pgm_info.code & PGM_PER) {
582		rc |= put_guest_lc(vcpu, pgm_info.per_code,
583				   (u8 *) __LC_PER_CODE);
584		rc |= put_guest_lc(vcpu, pgm_info.per_atmid,
585				   (u8 *)__LC_PER_ATMID);
586		rc |= put_guest_lc(vcpu, pgm_info.per_address,
587				   (u64 *) __LC_PER_ADDRESS);
588		rc |= put_guest_lc(vcpu, pgm_info.per_access_id,
589				   (u8 *) __LC_PER_ACCESS_ID);
590	}
591
592	if (nullifying && vcpu->arch.sie_block->icptcode == ICPT_INST)
593		kvm_s390_rewind_psw(vcpu, ilc);
594
595	rc |= put_guest_lc(vcpu, ilc, (u16 *) __LC_PGM_ILC);
596	rc |= put_guest_lc(vcpu, vcpu->arch.sie_block->gbea,
597				 (u64 *) __LC_LAST_BREAK);
598	rc |= put_guest_lc(vcpu, pgm_info.code,
599			   (u16 *)__LC_PGM_INT_CODE);
600	rc |= write_guest_lc(vcpu, __LC_PGM_OLD_PSW,
601			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
602	rc |= read_guest_lc(vcpu, __LC_PGM_NEW_PSW,
603			    &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
604	return rc ? -EFAULT : 0;
605}
606
607static int __must_check __deliver_service(struct kvm_vcpu *vcpu)
608{
609	struct kvm_s390_float_interrupt *fi = &vcpu->kvm->arch.float_int;
610	struct kvm_s390_ext_info ext;
611	int rc = 0;
612
613	spin_lock(&fi->lock);
614	if (!(test_bit(IRQ_PEND_EXT_SERVICE, &fi->pending_irqs))) {
615		spin_unlock(&fi->lock);
616		return 0;
617	}
618	ext = fi->srv_signal;
619	memset(&fi->srv_signal, 0, sizeof(ext));
620	clear_bit(IRQ_PEND_EXT_SERVICE, &fi->pending_irqs);
621	spin_unlock(&fi->lock);
622
623	VCPU_EVENT(vcpu, 4, "interrupt: sclp parm:%x",
624		   ext.ext_params);
625	vcpu->stat.deliver_service_signal++;
626	trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, KVM_S390_INT_SERVICE,
627					 ext.ext_params, 0);
628
629	rc  = put_guest_lc(vcpu, EXT_IRQ_SERVICE_SIG, (u16 *)__LC_EXT_INT_CODE);
630	rc |= put_guest_lc(vcpu, 0, (u16 *)__LC_EXT_CPU_ADDR);
631	rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
632			     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
633	rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
634			    &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
635	rc |= put_guest_lc(vcpu, ext.ext_params,
636			   (u32 *)__LC_EXT_PARAMS);
637
638	return rc ? -EFAULT : 0;
639}
640
641static int __must_check __deliver_pfault_done(struct kvm_vcpu *vcpu)
642{
643	struct kvm_s390_float_interrupt *fi = &vcpu->kvm->arch.float_int;
644	struct kvm_s390_interrupt_info *inti;
645	int rc = 0;
646
647	spin_lock(&fi->lock);
648	inti = list_first_entry_or_null(&fi->lists[FIRQ_LIST_PFAULT],
649					struct kvm_s390_interrupt_info,
650					list);
651	if (inti) {
652		trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id,
653				KVM_S390_INT_PFAULT_DONE, 0,
654				inti->ext.ext_params2);
655		list_del(&inti->list);
656		fi->counters[FIRQ_CNTR_PFAULT] -= 1;
657	}
658	if (list_empty(&fi->lists[FIRQ_LIST_PFAULT]))
659		clear_bit(IRQ_PEND_PFAULT_DONE, &fi->pending_irqs);
660	spin_unlock(&fi->lock);
661
662	if (inti) {
663		rc  = put_guest_lc(vcpu, EXT_IRQ_CP_SERVICE,
664				(u16 *)__LC_EXT_INT_CODE);
665		rc |= put_guest_lc(vcpu, PFAULT_DONE,
666				(u16 *)__LC_EXT_CPU_ADDR);
667		rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
668				&vcpu->arch.sie_block->gpsw,
669				sizeof(psw_t));
670		rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
671				&vcpu->arch.sie_block->gpsw,
672				sizeof(psw_t));
673		rc |= put_guest_lc(vcpu, inti->ext.ext_params2,
674				(u64 *)__LC_EXT_PARAMS2);
675		kfree(inti);
676	}
677	return rc ? -EFAULT : 0;
678}
679
680static int __must_check __deliver_virtio(struct kvm_vcpu *vcpu)
681{
682	struct kvm_s390_float_interrupt *fi = &vcpu->kvm->arch.float_int;
683	struct kvm_s390_interrupt_info *inti;
684	int rc = 0;
685
686	spin_lock(&fi->lock);
687	inti = list_first_entry_or_null(&fi->lists[FIRQ_LIST_VIRTIO],
688					struct kvm_s390_interrupt_info,
689					list);
690	if (inti) {
691		VCPU_EVENT(vcpu, 4,
692			   "interrupt: virtio parm:%x,parm64:%llx",
693			   inti->ext.ext_params, inti->ext.ext_params2);
694		vcpu->stat.deliver_virtio_interrupt++;
695		trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id,
696				inti->type,
697				inti->ext.ext_params,
698				inti->ext.ext_params2);
699		list_del(&inti->list);
700		fi->counters[FIRQ_CNTR_VIRTIO] -= 1;
701	}
702	if (list_empty(&fi->lists[FIRQ_LIST_VIRTIO]))
703		clear_bit(IRQ_PEND_VIRTIO, &fi->pending_irqs);
704	spin_unlock(&fi->lock);
705
706	if (inti) {
707		rc  = put_guest_lc(vcpu, EXT_IRQ_CP_SERVICE,
708				(u16 *)__LC_EXT_INT_CODE);
709		rc |= put_guest_lc(vcpu, VIRTIO_PARAM,
710				(u16 *)__LC_EXT_CPU_ADDR);
711		rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
712				&vcpu->arch.sie_block->gpsw,
713				sizeof(psw_t));
714		rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
715				&vcpu->arch.sie_block->gpsw,
716				sizeof(psw_t));
717		rc |= put_guest_lc(vcpu, inti->ext.ext_params,
718				(u32 *)__LC_EXT_PARAMS);
719		rc |= put_guest_lc(vcpu, inti->ext.ext_params2,
720				(u64 *)__LC_EXT_PARAMS2);
721		kfree(inti);
722	}
723	return rc ? -EFAULT : 0;
724}
725
726static int __must_check __deliver_io(struct kvm_vcpu *vcpu,
727				     unsigned long irq_type)
728{
729	struct list_head *isc_list;
730	struct kvm_s390_float_interrupt *fi;
731	struct kvm_s390_interrupt_info *inti = NULL;
732	int rc = 0;
733
734	fi = &vcpu->kvm->arch.float_int;
735
736	spin_lock(&fi->lock);
737	isc_list = &fi->lists[irq_type - IRQ_PEND_IO_ISC_0];
738	inti = list_first_entry_or_null(isc_list,
739					struct kvm_s390_interrupt_info,
740					list);
741	if (inti) {
742		VCPU_EVENT(vcpu, 4, "interrupt: I/O %llx", inti->type);
743		vcpu->stat.deliver_io_int++;
744		trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id,
745				inti->type,
746				((__u32)inti->io.subchannel_id << 16) |
747				inti->io.subchannel_nr,
748				((__u64)inti->io.io_int_parm << 32) |
749				inti->io.io_int_word);
750		list_del(&inti->list);
751		fi->counters[FIRQ_CNTR_IO] -= 1;
752	}
753	if (list_empty(isc_list))
754		clear_bit(irq_type, &fi->pending_irqs);
755	spin_unlock(&fi->lock);
756
757	if (inti) {
758		rc  = put_guest_lc(vcpu, inti->io.subchannel_id,
759				(u16 *)__LC_SUBCHANNEL_ID);
760		rc |= put_guest_lc(vcpu, inti->io.subchannel_nr,
761				(u16 *)__LC_SUBCHANNEL_NR);
762		rc |= put_guest_lc(vcpu, inti->io.io_int_parm,
763				(u32 *)__LC_IO_INT_PARM);
764		rc |= put_guest_lc(vcpu, inti->io.io_int_word,
765				(u32 *)__LC_IO_INT_WORD);
766		rc |= write_guest_lc(vcpu, __LC_IO_OLD_PSW,
767				&vcpu->arch.sie_block->gpsw,
768				sizeof(psw_t));
769		rc |= read_guest_lc(vcpu, __LC_IO_NEW_PSW,
770				&vcpu->arch.sie_block->gpsw,
771				sizeof(psw_t));
772		kfree(inti);
773	}
774
775	return rc ? -EFAULT : 0;
776}
777
778typedef int (*deliver_irq_t)(struct kvm_vcpu *vcpu);
779
780static const deliver_irq_t deliver_irq_funcs[] = {
781	[IRQ_PEND_MCHK_EX]        = __deliver_machine_check,
782	[IRQ_PEND_MCHK_REP]       = __deliver_machine_check,
783	[IRQ_PEND_PROG]           = __deliver_prog,
784	[IRQ_PEND_EXT_EMERGENCY]  = __deliver_emergency_signal,
785	[IRQ_PEND_EXT_EXTERNAL]   = __deliver_external_call,
786	[IRQ_PEND_EXT_CLOCK_COMP] = __deliver_ckc,
787	[IRQ_PEND_EXT_CPU_TIMER]  = __deliver_cpu_timer,
788	[IRQ_PEND_RESTART]        = __deliver_restart,
789	[IRQ_PEND_SET_PREFIX]     = __deliver_set_prefix,
790	[IRQ_PEND_PFAULT_INIT]    = __deliver_pfault_init,
791	[IRQ_PEND_EXT_SERVICE]    = __deliver_service,
792	[IRQ_PEND_PFAULT_DONE]    = __deliver_pfault_done,
793	[IRQ_PEND_VIRTIO]         = __deliver_virtio,
794};
795
796/* Check whether an external call is pending (deliverable or not) */
797int kvm_s390_ext_call_pending(struct kvm_vcpu *vcpu)
798{
799	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
800	uint8_t sigp_ctrl = vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].sigp_ctrl;
801
802	if (!sclp_has_sigpif())
803		return test_bit(IRQ_PEND_EXT_EXTERNAL, &li->pending_irqs);
804
805	return (sigp_ctrl & SIGP_CTRL_C) &&
806	       (atomic_read(&vcpu->arch.sie_block->cpuflags) & CPUSTAT_ECALL_PEND);
807}
808
809int kvm_s390_vcpu_has_irq(struct kvm_vcpu *vcpu, int exclude_stop)
810{
811	int rc;
812
813	rc = !!deliverable_irqs(vcpu);
814
815	if (!rc && kvm_cpu_has_pending_timer(vcpu))
816		rc = 1;
817
818	/* external call pending and deliverable */
819	if (!rc && kvm_s390_ext_call_pending(vcpu) &&
820	    !psw_extint_disabled(vcpu) &&
821	    (vcpu->arch.sie_block->gcr[0] & 0x2000ul))
822		rc = 1;
823
824	if (!rc && !exclude_stop && kvm_s390_is_stop_irq_pending(vcpu))
825		rc = 1;
826
827	return rc;
828}
829
830int kvm_cpu_has_pending_timer(struct kvm_vcpu *vcpu)
831{
832	return ckc_irq_pending(vcpu) || cpu_timer_irq_pending(vcpu);
833}
834
835int kvm_s390_handle_wait(struct kvm_vcpu *vcpu)
836{
837	u64 now, sltime;
838
839	vcpu->stat.exit_wait_state++;
840
841	/* fast path */
842	if (kvm_cpu_has_pending_timer(vcpu) || kvm_arch_vcpu_runnable(vcpu))
843		return 0;
844
845	if (psw_interrupts_disabled(vcpu)) {
846		VCPU_EVENT(vcpu, 3, "%s", "disabled wait");
847		return -EOPNOTSUPP; /* disabled wait */
848	}
849
850	if (!ckc_interrupts_enabled(vcpu)) {
851		VCPU_EVENT(vcpu, 3, "%s", "enabled wait w/o timer");
852		__set_cpu_idle(vcpu);
853		goto no_timer;
854	}
855
856	now = get_tod_clock_fast() + vcpu->arch.sie_block->epoch;
857	sltime = tod_to_ns(vcpu->arch.sie_block->ckc - now);
858
859	/* underflow */
860	if (vcpu->arch.sie_block->ckc < now)
861		return 0;
862
863	__set_cpu_idle(vcpu);
864	hrtimer_start(&vcpu->arch.ckc_timer, ktime_set (0, sltime) , HRTIMER_MODE_REL);
865	VCPU_EVENT(vcpu, 5, "enabled wait via clock comparator: %llx ns", sltime);
866no_timer:
867	srcu_read_unlock(&vcpu->kvm->srcu, vcpu->srcu_idx);
868	kvm_vcpu_block(vcpu);
869	__unset_cpu_idle(vcpu);
870	vcpu->srcu_idx = srcu_read_lock(&vcpu->kvm->srcu);
871
872	hrtimer_cancel(&vcpu->arch.ckc_timer);
873	return 0;
874}
875
876void kvm_s390_vcpu_wakeup(struct kvm_vcpu *vcpu)
877{
878	if (waitqueue_active(&vcpu->wq)) {
879		/*
880		 * The vcpu gave up the cpu voluntarily, mark it as a good
881		 * yield-candidate.
882		 */
883		vcpu->preempted = true;
884		wake_up_interruptible(&vcpu->wq);
885		vcpu->stat.halt_wakeup++;
886	}
887}
888
889enum hrtimer_restart kvm_s390_idle_wakeup(struct hrtimer *timer)
890{
891	struct kvm_vcpu *vcpu;
892	u64 now, sltime;
893
894	vcpu = container_of(timer, struct kvm_vcpu, arch.ckc_timer);
895	now = get_tod_clock_fast() + vcpu->arch.sie_block->epoch;
896	sltime = tod_to_ns(vcpu->arch.sie_block->ckc - now);
897
898	/*
899	 * If the monotonic clock runs faster than the tod clock we might be
900	 * woken up too early and have to go back to sleep to avoid deadlocks.
901	 */
902	if (vcpu->arch.sie_block->ckc > now &&
903	    hrtimer_forward_now(timer, ns_to_ktime(sltime)))
904		return HRTIMER_RESTART;
905	kvm_s390_vcpu_wakeup(vcpu);
906	return HRTIMER_NORESTART;
907}
908
909void kvm_s390_clear_local_irqs(struct kvm_vcpu *vcpu)
910{
911	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
912
913	spin_lock(&li->lock);
914	li->pending_irqs = 0;
915	bitmap_zero(li->sigp_emerg_pending, KVM_MAX_VCPUS);
916	memset(&li->irq, 0, sizeof(li->irq));
917	spin_unlock(&li->lock);
918
919	/* clear pending external calls set by sigp interpretation facility */
920	atomic_clear_mask(CPUSTAT_ECALL_PEND, li->cpuflags);
921	vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].sigp_ctrl = 0;
922}
923
924int __must_check kvm_s390_deliver_pending_interrupts(struct kvm_vcpu *vcpu)
925{
926	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
927	deliver_irq_t func;
928	int rc = 0;
929	unsigned long irq_type;
930	unsigned long irqs;
931
932	__reset_intercept_indicators(vcpu);
933
934	/* pending ckc conditions might have been invalidated */
935	clear_bit(IRQ_PEND_EXT_CLOCK_COMP, &li->pending_irqs);
936	if (ckc_irq_pending(vcpu))
937		set_bit(IRQ_PEND_EXT_CLOCK_COMP, &li->pending_irqs);
938
939	/* pending cpu timer conditions might have been invalidated */
940	clear_bit(IRQ_PEND_EXT_CPU_TIMER, &li->pending_irqs);
941	if (cpu_timer_irq_pending(vcpu))
942		set_bit(IRQ_PEND_EXT_CPU_TIMER, &li->pending_irqs);
943
944	do {
945		irqs = deliverable_irqs(vcpu);
946		/* bits are in the order of interrupt priority */
947		irq_type = find_first_bit(&irqs, IRQ_PEND_COUNT);
948		if (irq_type == IRQ_PEND_COUNT)
949			break;
950		if (is_ioirq(irq_type)) {
951			rc = __deliver_io(vcpu, irq_type);
952		} else {
953			func = deliver_irq_funcs[irq_type];
954			if (!func) {
955				WARN_ON_ONCE(func == NULL);
956				clear_bit(irq_type, &li->pending_irqs);
957				continue;
958			}
959			rc = func(vcpu);
960		}
961		if (rc)
962			break;
963	} while (!rc);
964
965	set_intercept_indicators(vcpu);
966
967	return rc;
968}
969
970static int __inject_prog(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
971{
972	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
973
974	li->irq.pgm = irq->u.pgm;
975	set_bit(IRQ_PEND_PROG, &li->pending_irqs);
976	return 0;
977}
978
979int kvm_s390_inject_program_int(struct kvm_vcpu *vcpu, u16 code)
980{
981	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
982	struct kvm_s390_irq irq;
983
984	VCPU_EVENT(vcpu, 3, "inject: program check %d (from kernel)", code);
985	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_PROGRAM_INT, code,
986				   0, 1);
987	spin_lock(&li->lock);
988	irq.u.pgm.code = code;
989	__inject_prog(vcpu, &irq);
990	BUG_ON(waitqueue_active(li->wq));
991	spin_unlock(&li->lock);
992	return 0;
993}
994
995int kvm_s390_inject_prog_irq(struct kvm_vcpu *vcpu,
996			     struct kvm_s390_pgm_info *pgm_info)
997{
998	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
999	struct kvm_s390_irq irq;
1000	int rc;
1001
1002	VCPU_EVENT(vcpu, 3, "inject: prog irq %d (from kernel)",
1003		   pgm_info->code);
1004	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_PROGRAM_INT,
1005				   pgm_info->code, 0, 1);
1006	spin_lock(&li->lock);
1007	irq.u.pgm = *pgm_info;
1008	rc = __inject_prog(vcpu, &irq);
1009	BUG_ON(waitqueue_active(li->wq));
1010	spin_unlock(&li->lock);
1011	return rc;
1012}
1013
1014static int __inject_pfault_init(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
1015{
1016	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1017
1018	VCPU_EVENT(vcpu, 3, "inject: external irq params:%x, params2:%llx",
1019		   irq->u.ext.ext_params, irq->u.ext.ext_params2);
1020	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_INT_PFAULT_INIT,
1021				   irq->u.ext.ext_params,
1022				   irq->u.ext.ext_params2, 2);
1023
1024	li->irq.ext = irq->u.ext;
1025	set_bit(IRQ_PEND_PFAULT_INIT, &li->pending_irqs);
1026	atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
1027	return 0;
1028}
1029
1030static int __inject_extcall_sigpif(struct kvm_vcpu *vcpu, uint16_t src_id)
1031{
1032	unsigned char new_val, old_val;
1033	uint8_t *sigp_ctrl = &vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].sigp_ctrl;
1034
1035	new_val = SIGP_CTRL_C | (src_id & SIGP_CTRL_SCN_MASK);
1036	old_val = *sigp_ctrl & ~SIGP_CTRL_C;
1037	if (cmpxchg(sigp_ctrl, old_val, new_val) != old_val) {
1038		/* another external call is pending */
1039		return -EBUSY;
1040	}
1041	atomic_set_mask(CPUSTAT_ECALL_PEND, &vcpu->arch.sie_block->cpuflags);
1042	return 0;
1043}
1044
1045static int __inject_extcall(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
1046{
1047	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1048	struct kvm_s390_extcall_info *extcall = &li->irq.extcall;
1049	uint16_t src_id = irq->u.extcall.code;
1050
1051	VCPU_EVENT(vcpu, 3, "inject: external call source-cpu:%u",
1052		   src_id);
1053	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_INT_EXTERNAL_CALL,
1054				   src_id, 0, 2);
1055
1056	/* sending vcpu invalid */
1057	if (kvm_get_vcpu_by_id(vcpu->kvm, src_id) == NULL)
1058		return -EINVAL;
1059
1060	if (sclp_has_sigpif())
1061		return __inject_extcall_sigpif(vcpu, src_id);
1062
1063	if (test_and_set_bit(IRQ_PEND_EXT_EXTERNAL, &li->pending_irqs))
1064		return -EBUSY;
1065	*extcall = irq->u.extcall;
1066	atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
1067	return 0;
1068}
1069
1070static int __inject_set_prefix(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
1071{
1072	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1073	struct kvm_s390_prefix_info *prefix = &li->irq.prefix;
1074
1075	VCPU_EVENT(vcpu, 3, "inject: set prefix to %x (from user)",
1076		   irq->u.prefix.address);
1077	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_SIGP_SET_PREFIX,
1078				   irq->u.prefix.address, 0, 2);
1079
1080	if (!is_vcpu_stopped(vcpu))
1081		return -EBUSY;
1082
1083	*prefix = irq->u.prefix;
1084	set_bit(IRQ_PEND_SET_PREFIX, &li->pending_irqs);
1085	return 0;
1086}
1087
1088#define KVM_S390_STOP_SUPP_FLAGS (KVM_S390_STOP_FLAG_STORE_STATUS)
1089static int __inject_sigp_stop(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
1090{
1091	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1092	struct kvm_s390_stop_info *stop = &li->irq.stop;
1093	int rc = 0;
1094
1095	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_SIGP_STOP, 0, 0, 2);
1096
1097	if (irq->u.stop.flags & ~KVM_S390_STOP_SUPP_FLAGS)
1098		return -EINVAL;
1099
1100	if (is_vcpu_stopped(vcpu)) {
1101		if (irq->u.stop.flags & KVM_S390_STOP_FLAG_STORE_STATUS)
1102			rc = kvm_s390_store_status_unloaded(vcpu,
1103						KVM_S390_STORE_STATUS_NOADDR);
1104		return rc;
1105	}
1106
1107	if (test_and_set_bit(IRQ_PEND_SIGP_STOP, &li->pending_irqs))
1108		return -EBUSY;
1109	stop->flags = irq->u.stop.flags;
1110	__set_cpuflag(vcpu, CPUSTAT_STOP_INT);
1111	return 0;
1112}
1113
1114static int __inject_sigp_restart(struct kvm_vcpu *vcpu,
1115				 struct kvm_s390_irq *irq)
1116{
1117	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1118
1119	VCPU_EVENT(vcpu, 3, "inject: restart type %llx", irq->type);
1120	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_RESTART, 0, 0, 2);
1121
1122	set_bit(IRQ_PEND_RESTART, &li->pending_irqs);
1123	return 0;
1124}
1125
1126static int __inject_sigp_emergency(struct kvm_vcpu *vcpu,
1127				   struct kvm_s390_irq *irq)
1128{
1129	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1130
1131	VCPU_EVENT(vcpu, 3, "inject: emergency %u\n",
1132		   irq->u.emerg.code);
1133	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_INT_EMERGENCY,
1134				   irq->u.emerg.code, 0, 2);
1135
1136	/* sending vcpu invalid */
1137	if (kvm_get_vcpu_by_id(vcpu->kvm, irq->u.emerg.code) == NULL)
1138		return -EINVAL;
1139
1140	set_bit(irq->u.emerg.code, li->sigp_emerg_pending);
1141	set_bit(IRQ_PEND_EXT_EMERGENCY, &li->pending_irqs);
1142	atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
1143	return 0;
1144}
1145
1146static int __inject_mchk(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
1147{
1148	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1149	struct kvm_s390_mchk_info *mchk = &li->irq.mchk;
1150
1151	VCPU_EVENT(vcpu, 5, "inject: machine check parm64:%llx",
1152		   irq->u.mchk.mcic);
1153	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_MCHK, 0,
1154				   irq->u.mchk.mcic, 2);
1155
1156	/*
1157	 * Because repressible machine checks can be indicated along with
1158	 * exigent machine checks (PoP, Chapter 11, Interruption action)
1159	 * we need to combine cr14, mcic and external damage code.
1160	 * Failing storage address and the logout area should not be or'ed
1161	 * together, we just indicate the last occurrence of the corresponding
1162	 * machine check
1163	 */
1164	mchk->cr14 |= irq->u.mchk.cr14;
1165	mchk->mcic |= irq->u.mchk.mcic;
1166	mchk->ext_damage_code |= irq->u.mchk.ext_damage_code;
1167	mchk->failing_storage_address = irq->u.mchk.failing_storage_address;
1168	memcpy(&mchk->fixed_logout, &irq->u.mchk.fixed_logout,
1169	       sizeof(mchk->fixed_logout));
1170	if (mchk->mcic & MCHK_EX_MASK)
1171		set_bit(IRQ_PEND_MCHK_EX, &li->pending_irqs);
1172	else if (mchk->mcic & MCHK_REP_MASK)
1173		set_bit(IRQ_PEND_MCHK_REP,  &li->pending_irqs);
1174	return 0;
1175}
1176
1177static int __inject_ckc(struct kvm_vcpu *vcpu)
1178{
1179	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1180
1181	VCPU_EVENT(vcpu, 3, "inject: type %x", KVM_S390_INT_CLOCK_COMP);
1182	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_INT_CLOCK_COMP,
1183				   0, 0, 2);
1184
1185	set_bit(IRQ_PEND_EXT_CLOCK_COMP, &li->pending_irqs);
1186	atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
1187	return 0;
1188}
1189
1190static int __inject_cpu_timer(struct kvm_vcpu *vcpu)
1191{
1192	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1193
1194	VCPU_EVENT(vcpu, 3, "inject: type %x", KVM_S390_INT_CPU_TIMER);
1195	trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_INT_CPU_TIMER,
1196				   0, 0, 2);
1197
1198	set_bit(IRQ_PEND_EXT_CPU_TIMER, &li->pending_irqs);
1199	atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
1200	return 0;
1201}
1202
1203static struct kvm_s390_interrupt_info *get_io_int(struct kvm *kvm,
1204						  int isc, u32 schid)
1205{
1206	struct kvm_s390_float_interrupt *fi = &kvm->arch.float_int;
1207	struct list_head *isc_list = &fi->lists[FIRQ_LIST_IO_ISC_0 + isc];
1208	struct kvm_s390_interrupt_info *iter;
1209	u16 id = (schid & 0xffff0000U) >> 16;
1210	u16 nr = schid & 0x0000ffffU;
1211
1212	spin_lock(&fi->lock);
1213	list_for_each_entry(iter, isc_list, list) {
1214		if (schid && (id != iter->io.subchannel_id ||
1215			      nr != iter->io.subchannel_nr))
1216			continue;
1217		/* found an appropriate entry */
1218		list_del_init(&iter->list);
1219		fi->counters[FIRQ_CNTR_IO] -= 1;
1220		if (list_empty(isc_list))
1221			clear_bit(IRQ_PEND_IO_ISC_0 + isc, &fi->pending_irqs);
1222		spin_unlock(&fi->lock);
1223		return iter;
1224	}
1225	spin_unlock(&fi->lock);
1226	return NULL;
1227}
1228
1229/*
1230 * Dequeue and return an I/O interrupt matching any of the interruption
1231 * subclasses as designated by the isc mask in cr6 and the schid (if != 0).
1232 */
1233struct kvm_s390_interrupt_info *kvm_s390_get_io_int(struct kvm *kvm,
1234						    u64 isc_mask, u32 schid)
1235{
1236	struct kvm_s390_interrupt_info *inti = NULL;
1237	int isc;
1238
1239	for (isc = 0; isc <= MAX_ISC && !inti; isc++) {
1240		if (isc_mask & isc_to_isc_bits(isc))
1241			inti = get_io_int(kvm, isc, schid);
1242	}
1243	return inti;
1244}
1245
1246#define SCCB_MASK 0xFFFFFFF8
1247#define SCCB_EVENT_PENDING 0x3
1248
1249static int __inject_service(struct kvm *kvm,
1250			     struct kvm_s390_interrupt_info *inti)
1251{
1252	struct kvm_s390_float_interrupt *fi = &kvm->arch.float_int;
1253
1254	spin_lock(&fi->lock);
1255	fi->srv_signal.ext_params |= inti->ext.ext_params & SCCB_EVENT_PENDING;
1256	/*
1257	 * Early versions of the QEMU s390 bios will inject several
1258	 * service interrupts after another without handling a
1259	 * condition code indicating busy.
1260	 * We will silently ignore those superfluous sccb values.
1261	 * A future version of QEMU will take care of serialization
1262	 * of servc requests
1263	 */
1264	if (fi->srv_signal.ext_params & SCCB_MASK)
1265		goto out;
1266	fi->srv_signal.ext_params |= inti->ext.ext_params & SCCB_MASK;
1267	set_bit(IRQ_PEND_EXT_SERVICE, &fi->pending_irqs);
1268out:
1269	spin_unlock(&fi->lock);
1270	kfree(inti);
1271	return 0;
1272}
1273
1274static int __inject_virtio(struct kvm *kvm,
1275			    struct kvm_s390_interrupt_info *inti)
1276{
1277	struct kvm_s390_float_interrupt *fi = &kvm->arch.float_int;
1278
1279	spin_lock(&fi->lock);
1280	if (fi->counters[FIRQ_CNTR_VIRTIO] >= KVM_S390_MAX_VIRTIO_IRQS) {
1281		spin_unlock(&fi->lock);
1282		return -EBUSY;
1283	}
1284	fi->counters[FIRQ_CNTR_VIRTIO] += 1;
1285	list_add_tail(&inti->list, &fi->lists[FIRQ_LIST_VIRTIO]);
1286	set_bit(IRQ_PEND_VIRTIO, &fi->pending_irqs);
1287	spin_unlock(&fi->lock);
1288	return 0;
1289}
1290
1291static int __inject_pfault_done(struct kvm *kvm,
1292				 struct kvm_s390_interrupt_info *inti)
1293{
1294	struct kvm_s390_float_interrupt *fi = &kvm->arch.float_int;
1295
1296	spin_lock(&fi->lock);
1297	if (fi->counters[FIRQ_CNTR_PFAULT] >=
1298		(ASYNC_PF_PER_VCPU * KVM_MAX_VCPUS)) {
1299		spin_unlock(&fi->lock);
1300		return -EBUSY;
1301	}
1302	fi->counters[FIRQ_CNTR_PFAULT] += 1;
1303	list_add_tail(&inti->list, &fi->lists[FIRQ_LIST_PFAULT]);
1304	set_bit(IRQ_PEND_PFAULT_DONE, &fi->pending_irqs);
1305	spin_unlock(&fi->lock);
1306	return 0;
1307}
1308
1309#define CR_PENDING_SUBCLASS 28
1310static int __inject_float_mchk(struct kvm *kvm,
1311				struct kvm_s390_interrupt_info *inti)
1312{
1313	struct kvm_s390_float_interrupt *fi = &kvm->arch.float_int;
1314
1315	spin_lock(&fi->lock);
1316	fi->mchk.cr14 |= inti->mchk.cr14 & (1UL << CR_PENDING_SUBCLASS);
1317	fi->mchk.mcic |= inti->mchk.mcic;
1318	set_bit(IRQ_PEND_MCHK_REP, &fi->pending_irqs);
1319	spin_unlock(&fi->lock);
1320	kfree(inti);
1321	return 0;
1322}
1323
1324static int __inject_io(struct kvm *kvm, struct kvm_s390_interrupt_info *inti)
1325{
1326	struct kvm_s390_float_interrupt *fi;
1327	struct list_head *list;
1328	int isc;
1329
1330	fi = &kvm->arch.float_int;
1331	spin_lock(&fi->lock);
1332	if (fi->counters[FIRQ_CNTR_IO] >= KVM_S390_MAX_FLOAT_IRQS) {
1333		spin_unlock(&fi->lock);
1334		return -EBUSY;
1335	}
1336	fi->counters[FIRQ_CNTR_IO] += 1;
1337
1338	isc = int_word_to_isc(inti->io.io_int_word);
1339	list = &fi->lists[FIRQ_LIST_IO_ISC_0 + isc];
1340	list_add_tail(&inti->list, list);
1341	set_bit(IRQ_PEND_IO_ISC_0 + isc, &fi->pending_irqs);
1342	spin_unlock(&fi->lock);
1343	return 0;
1344}
1345
1346static int __inject_vm(struct kvm *kvm, struct kvm_s390_interrupt_info *inti)
1347{
1348	struct kvm_s390_local_interrupt *li;
1349	struct kvm_s390_float_interrupt *fi;
1350	struct kvm_vcpu *dst_vcpu = NULL;
1351	int sigcpu;
1352	u64 type = READ_ONCE(inti->type);
1353	int rc;
1354
1355	fi = &kvm->arch.float_int;
1356
1357	switch (type) {
1358	case KVM_S390_MCHK:
1359		rc = __inject_float_mchk(kvm, inti);
1360		break;
1361	case KVM_S390_INT_VIRTIO:
1362		rc = __inject_virtio(kvm, inti);
1363		break;
1364	case KVM_S390_INT_SERVICE:
1365		rc = __inject_service(kvm, inti);
1366		break;
1367	case KVM_S390_INT_PFAULT_DONE:
1368		rc = __inject_pfault_done(kvm, inti);
1369		break;
1370	case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1371		rc = __inject_io(kvm, inti);
1372		break;
1373	default:
1374		rc = -EINVAL;
1375	}
1376	if (rc)
1377		return rc;
1378
1379	sigcpu = find_first_bit(fi->idle_mask, KVM_MAX_VCPUS);
1380	if (sigcpu == KVM_MAX_VCPUS) {
1381		do {
1382			sigcpu = fi->next_rr_cpu++;
1383			if (sigcpu == KVM_MAX_VCPUS)
1384				sigcpu = fi->next_rr_cpu = 0;
1385		} while (kvm_get_vcpu(kvm, sigcpu) == NULL);
1386	}
1387	dst_vcpu = kvm_get_vcpu(kvm, sigcpu);
1388	li = &dst_vcpu->arch.local_int;
1389	spin_lock(&li->lock);
1390	switch (type) {
1391	case KVM_S390_MCHK:
1392		atomic_set_mask(CPUSTAT_STOP_INT, li->cpuflags);
1393		break;
1394	case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1395		atomic_set_mask(CPUSTAT_IO_INT, li->cpuflags);
1396		break;
1397	default:
1398		atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
1399		break;
1400	}
1401	spin_unlock(&li->lock);
1402	kvm_s390_vcpu_wakeup(kvm_get_vcpu(kvm, sigcpu));
1403	return 0;
1404
1405}
1406
1407int kvm_s390_inject_vm(struct kvm *kvm,
1408		       struct kvm_s390_interrupt *s390int)
1409{
1410	struct kvm_s390_interrupt_info *inti;
1411	int rc;
1412
1413	inti = kzalloc(sizeof(*inti), GFP_KERNEL);
1414	if (!inti)
1415		return -ENOMEM;
1416
1417	inti->type = s390int->type;
1418	switch (inti->type) {
1419	case KVM_S390_INT_VIRTIO:
1420		VM_EVENT(kvm, 5, "inject: virtio parm:%x,parm64:%llx",
1421			 s390int->parm, s390int->parm64);
1422		inti->ext.ext_params = s390int->parm;
1423		inti->ext.ext_params2 = s390int->parm64;
1424		break;
1425	case KVM_S390_INT_SERVICE:
1426		VM_EVENT(kvm, 5, "inject: sclp parm:%x", s390int->parm);
1427		inti->ext.ext_params = s390int->parm;
1428		break;
1429	case KVM_S390_INT_PFAULT_DONE:
1430		inti->ext.ext_params2 = s390int->parm64;
1431		break;
1432	case KVM_S390_MCHK:
1433		VM_EVENT(kvm, 5, "inject: machine check parm64:%llx",
1434			 s390int->parm64);
1435		inti->mchk.cr14 = s390int->parm; /* upper bits are not used */
1436		inti->mchk.mcic = s390int->parm64;
1437		break;
1438	case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1439		if (inti->type & IOINT_AI_MASK)
1440			VM_EVENT(kvm, 5, "%s", "inject: I/O (AI)");
1441		else
1442			VM_EVENT(kvm, 5, "inject: I/O css %x ss %x schid %04x",
1443				 s390int->type & IOINT_CSSID_MASK,
1444				 s390int->type & IOINT_SSID_MASK,
1445				 s390int->type & IOINT_SCHID_MASK);
1446		inti->io.subchannel_id = s390int->parm >> 16;
1447		inti->io.subchannel_nr = s390int->parm & 0x0000ffffu;
1448		inti->io.io_int_parm = s390int->parm64 >> 32;
1449		inti->io.io_int_word = s390int->parm64 & 0x00000000ffffffffull;
1450		break;
1451	default:
1452		kfree(inti);
1453		return -EINVAL;
1454	}
1455	trace_kvm_s390_inject_vm(s390int->type, s390int->parm, s390int->parm64,
1456				 2);
1457
1458	rc = __inject_vm(kvm, inti);
1459	if (rc)
1460		kfree(inti);
1461	return rc;
1462}
1463
1464int kvm_s390_reinject_io_int(struct kvm *kvm,
1465			      struct kvm_s390_interrupt_info *inti)
1466{
1467	return __inject_vm(kvm, inti);
1468}
1469
1470int s390int_to_s390irq(struct kvm_s390_interrupt *s390int,
1471		       struct kvm_s390_irq *irq)
1472{
1473	irq->type = s390int->type;
1474	switch (irq->type) {
1475	case KVM_S390_PROGRAM_INT:
1476		if (s390int->parm & 0xffff0000)
1477			return -EINVAL;
1478		irq->u.pgm.code = s390int->parm;
1479		break;
1480	case KVM_S390_SIGP_SET_PREFIX:
1481		irq->u.prefix.address = s390int->parm;
1482		break;
1483	case KVM_S390_SIGP_STOP:
1484		irq->u.stop.flags = s390int->parm;
1485		break;
1486	case KVM_S390_INT_EXTERNAL_CALL:
1487		if (s390int->parm & 0xffff0000)
1488			return -EINVAL;
1489		irq->u.extcall.code = s390int->parm;
1490		break;
1491	case KVM_S390_INT_EMERGENCY:
1492		if (s390int->parm & 0xffff0000)
1493			return -EINVAL;
1494		irq->u.emerg.code = s390int->parm;
1495		break;
1496	case KVM_S390_MCHK:
1497		irq->u.mchk.mcic = s390int->parm64;
1498		break;
1499	}
1500	return 0;
1501}
1502
1503int kvm_s390_is_stop_irq_pending(struct kvm_vcpu *vcpu)
1504{
1505	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1506
1507	return test_bit(IRQ_PEND_SIGP_STOP, &li->pending_irqs);
1508}
1509
1510void kvm_s390_clear_stop_irq(struct kvm_vcpu *vcpu)
1511{
1512	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1513
1514	spin_lock(&li->lock);
1515	li->irq.stop.flags = 0;
1516	clear_bit(IRQ_PEND_SIGP_STOP, &li->pending_irqs);
1517	spin_unlock(&li->lock);
1518}
1519
1520static int do_inject_vcpu(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
1521{
1522	int rc;
1523
1524	switch (irq->type) {
1525	case KVM_S390_PROGRAM_INT:
1526		VCPU_EVENT(vcpu, 3, "inject: program check %d (from user)",
1527			   irq->u.pgm.code);
1528		rc = __inject_prog(vcpu, irq);
1529		break;
1530	case KVM_S390_SIGP_SET_PREFIX:
1531		rc = __inject_set_prefix(vcpu, irq);
1532		break;
1533	case KVM_S390_SIGP_STOP:
1534		rc = __inject_sigp_stop(vcpu, irq);
1535		break;
1536	case KVM_S390_RESTART:
1537		rc = __inject_sigp_restart(vcpu, irq);
1538		break;
1539	case KVM_S390_INT_CLOCK_COMP:
1540		rc = __inject_ckc(vcpu);
1541		break;
1542	case KVM_S390_INT_CPU_TIMER:
1543		rc = __inject_cpu_timer(vcpu);
1544		break;
1545	case KVM_S390_INT_EXTERNAL_CALL:
1546		rc = __inject_extcall(vcpu, irq);
1547		break;
1548	case KVM_S390_INT_EMERGENCY:
1549		rc = __inject_sigp_emergency(vcpu, irq);
1550		break;
1551	case KVM_S390_MCHK:
1552		rc = __inject_mchk(vcpu, irq);
1553		break;
1554	case KVM_S390_INT_PFAULT_INIT:
1555		rc = __inject_pfault_init(vcpu, irq);
1556		break;
1557	case KVM_S390_INT_VIRTIO:
1558	case KVM_S390_INT_SERVICE:
1559	case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1560	default:
1561		rc = -EINVAL;
1562	}
1563
1564	return rc;
1565}
1566
1567int kvm_s390_inject_vcpu(struct kvm_vcpu *vcpu, struct kvm_s390_irq *irq)
1568{
1569	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
1570	int rc;
1571
1572	spin_lock(&li->lock);
1573	rc = do_inject_vcpu(vcpu, irq);
1574	spin_unlock(&li->lock);
1575	if (!rc)
1576		kvm_s390_vcpu_wakeup(vcpu);
1577	return rc;
1578}
1579
1580static inline void clear_irq_list(struct list_head *_list)
1581{
1582	struct kvm_s390_interrupt_info *inti, *n;
1583
1584	list_for_each_entry_safe(inti, n, _list, list) {
1585		list_del(&inti->list);
1586		kfree(inti);
1587	}
1588}
1589
1590static void inti_to_irq(struct kvm_s390_interrupt_info *inti,
1591		       struct kvm_s390_irq *irq)
1592{
1593	irq->type = inti->type;
1594	switch (inti->type) {
1595	case KVM_S390_INT_PFAULT_INIT:
1596	case KVM_S390_INT_PFAULT_DONE:
1597	case KVM_S390_INT_VIRTIO:
1598		irq->u.ext = inti->ext;
1599		break;
1600	case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1601		irq->u.io = inti->io;
1602		break;
1603	}
1604}
1605
1606void kvm_s390_clear_float_irqs(struct kvm *kvm)
1607{
1608	struct kvm_s390_float_interrupt *fi = &kvm->arch.float_int;
1609	int i;
1610
1611	spin_lock(&fi->lock);
1612	fi->pending_irqs = 0;
1613	memset(&fi->srv_signal, 0, sizeof(fi->srv_signal));
1614	memset(&fi->mchk, 0, sizeof(fi->mchk));
1615	for (i = 0; i < FIRQ_LIST_COUNT; i++)
1616		clear_irq_list(&fi->lists[i]);
1617	for (i = 0; i < FIRQ_MAX_COUNT; i++)
1618		fi->counters[i] = 0;
1619	spin_unlock(&fi->lock);
1620};
1621
1622static int get_all_floating_irqs(struct kvm *kvm, u8 __user *usrbuf, u64 len)
1623{
1624	struct kvm_s390_interrupt_info *inti;
1625	struct kvm_s390_float_interrupt *fi;
1626	struct kvm_s390_irq *buf;
1627	struct kvm_s390_irq *irq;
1628	int max_irqs;
1629	int ret = 0;
1630	int n = 0;
1631	int i;
1632
1633	if (len > KVM_S390_FLIC_MAX_BUFFER || len == 0)
1634		return -EINVAL;
1635
1636	/*
1637	 * We are already using -ENOMEM to signal
1638	 * userspace it may retry with a bigger buffer,
1639	 * so we need to use something else for this case
1640	 */
1641	buf = vzalloc(len);
1642	if (!buf)
1643		return -ENOBUFS;
1644
1645	max_irqs = len / sizeof(struct kvm_s390_irq);
1646
1647	fi = &kvm->arch.float_int;
1648	spin_lock(&fi->lock);
1649	for (i = 0; i < FIRQ_LIST_COUNT; i++) {
1650		list_for_each_entry(inti, &fi->lists[i], list) {
1651			if (n == max_irqs) {
1652				/* signal userspace to try again */
1653				ret = -ENOMEM;
1654				goto out;
1655			}
1656			inti_to_irq(inti, &buf[n]);
1657			n++;
1658		}
1659	}
1660	if (test_bit(IRQ_PEND_EXT_SERVICE, &fi->pending_irqs)) {
1661		if (n == max_irqs) {
1662			/* signal userspace to try again */
1663			ret = -ENOMEM;
1664			goto out;
1665		}
1666		irq = (struct kvm_s390_irq *) &buf[n];
1667		irq->type = KVM_S390_INT_SERVICE;
1668		irq->u.ext = fi->srv_signal;
1669		n++;
1670	}
1671	if (test_bit(IRQ_PEND_MCHK_REP, &fi->pending_irqs)) {
1672		if (n == max_irqs) {
1673				/* signal userspace to try again */
1674				ret = -ENOMEM;
1675				goto out;
1676		}
1677		irq = (struct kvm_s390_irq *) &buf[n];
1678		irq->type = KVM_S390_MCHK;
1679		irq->u.mchk = fi->mchk;
1680		n++;
1681}
1682
1683out:
1684	spin_unlock(&fi->lock);
1685	if (!ret && n > 0) {
1686		if (copy_to_user(usrbuf, buf, sizeof(struct kvm_s390_irq) * n))
1687			ret = -EFAULT;
1688	}
1689	vfree(buf);
1690
1691	return ret < 0 ? ret : n;
1692}
1693
1694static int flic_get_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
1695{
1696	int r;
1697
1698	switch (attr->group) {
1699	case KVM_DEV_FLIC_GET_ALL_IRQS:
1700		r = get_all_floating_irqs(dev->kvm, (u8 __user *) attr->addr,
1701					  attr->attr);
1702		break;
1703	default:
1704		r = -EINVAL;
1705	}
1706
1707	return r;
1708}
1709
1710static inline int copy_irq_from_user(struct kvm_s390_interrupt_info *inti,
1711				     u64 addr)
1712{
1713	struct kvm_s390_irq __user *uptr = (struct kvm_s390_irq __user *) addr;
1714	void *target = NULL;
1715	void __user *source;
1716	u64 size;
1717
1718	if (get_user(inti->type, (u64 __user *)addr))
1719		return -EFAULT;
1720
1721	switch (inti->type) {
1722	case KVM_S390_INT_PFAULT_INIT:
1723	case KVM_S390_INT_PFAULT_DONE:
1724	case KVM_S390_INT_VIRTIO:
1725	case KVM_S390_INT_SERVICE:
1726		target = (void *) &inti->ext;
1727		source = &uptr->u.ext;
1728		size = sizeof(inti->ext);
1729		break;
1730	case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1731		target = (void *) &inti->io;
1732		source = &uptr->u.io;
1733		size = sizeof(inti->io);
1734		break;
1735	case KVM_S390_MCHK:
1736		target = (void *) &inti->mchk;
1737		source = &uptr->u.mchk;
1738		size = sizeof(inti->mchk);
1739		break;
1740	default:
1741		return -EINVAL;
1742	}
1743
1744	if (copy_from_user(target, source, size))
1745		return -EFAULT;
1746
1747	return 0;
1748}
1749
1750static int enqueue_floating_irq(struct kvm_device *dev,
1751				struct kvm_device_attr *attr)
1752{
1753	struct kvm_s390_interrupt_info *inti = NULL;
1754	int r = 0;
1755	int len = attr->attr;
1756
1757	if (len % sizeof(struct kvm_s390_irq) != 0)
1758		return -EINVAL;
1759	else if (len > KVM_S390_FLIC_MAX_BUFFER)
1760		return -EINVAL;
1761
1762	while (len >= sizeof(struct kvm_s390_irq)) {
1763		inti = kzalloc(sizeof(*inti), GFP_KERNEL);
1764		if (!inti)
1765			return -ENOMEM;
1766
1767		r = copy_irq_from_user(inti, attr->addr);
1768		if (r) {
1769			kfree(inti);
1770			return r;
1771		}
1772		r = __inject_vm(dev->kvm, inti);
1773		if (r) {
1774			kfree(inti);
1775			return r;
1776		}
1777		len -= sizeof(struct kvm_s390_irq);
1778		attr->addr += sizeof(struct kvm_s390_irq);
1779	}
1780
1781	return r;
1782}
1783
1784static struct s390_io_adapter *get_io_adapter(struct kvm *kvm, unsigned int id)
1785{
1786	if (id >= MAX_S390_IO_ADAPTERS)
1787		return NULL;
1788	return kvm->arch.adapters[id];
1789}
1790
1791static int register_io_adapter(struct kvm_device *dev,
1792			       struct kvm_device_attr *attr)
1793{
1794	struct s390_io_adapter *adapter;
1795	struct kvm_s390_io_adapter adapter_info;
1796
1797	if (copy_from_user(&adapter_info,
1798			   (void __user *)attr->addr, sizeof(adapter_info)))
1799		return -EFAULT;
1800
1801	if ((adapter_info.id >= MAX_S390_IO_ADAPTERS) ||
1802	    (dev->kvm->arch.adapters[adapter_info.id] != NULL))
1803		return -EINVAL;
1804
1805	adapter = kzalloc(sizeof(*adapter), GFP_KERNEL);
1806	if (!adapter)
1807		return -ENOMEM;
1808
1809	INIT_LIST_HEAD(&adapter->maps);
1810	init_rwsem(&adapter->maps_lock);
1811	atomic_set(&adapter->nr_maps, 0);
1812	adapter->id = adapter_info.id;
1813	adapter->isc = adapter_info.isc;
1814	adapter->maskable = adapter_info.maskable;
1815	adapter->masked = false;
1816	adapter->swap = adapter_info.swap;
1817	dev->kvm->arch.adapters[adapter->id] = adapter;
1818
1819	return 0;
1820}
1821
1822int kvm_s390_mask_adapter(struct kvm *kvm, unsigned int id, bool masked)
1823{
1824	int ret;
1825	struct s390_io_adapter *adapter = get_io_adapter(kvm, id);
1826
1827	if (!adapter || !adapter->maskable)
1828		return -EINVAL;
1829	ret = adapter->masked;
1830	adapter->masked = masked;
1831	return ret;
1832}
1833
1834static int kvm_s390_adapter_map(struct kvm *kvm, unsigned int id, __u64 addr)
1835{
1836	struct s390_io_adapter *adapter = get_io_adapter(kvm, id);
1837	struct s390_map_info *map;
1838	int ret;
1839
1840	if (!adapter || !addr)
1841		return -EINVAL;
1842
1843	map = kzalloc(sizeof(*map), GFP_KERNEL);
1844	if (!map) {
1845		ret = -ENOMEM;
1846		goto out;
1847	}
1848	INIT_LIST_HEAD(&map->list);
1849	map->guest_addr = addr;
1850	map->addr = gmap_translate(kvm->arch.gmap, addr);
1851	if (map->addr == -EFAULT) {
1852		ret = -EFAULT;
1853		goto out;
1854	}
1855	ret = get_user_pages_fast(map->addr, 1, 1, &map->page);
1856	if (ret < 0)
1857		goto out;
1858	BUG_ON(ret != 1);
1859	down_write(&adapter->maps_lock);
1860	if (atomic_inc_return(&adapter->nr_maps) < MAX_S390_ADAPTER_MAPS) {
1861		list_add_tail(&map->list, &adapter->maps);
1862		ret = 0;
1863	} else {
1864		put_page(map->page);
1865		ret = -EINVAL;
1866	}
1867	up_write(&adapter->maps_lock);
1868out:
1869	if (ret)
1870		kfree(map);
1871	return ret;
1872}
1873
1874static int kvm_s390_adapter_unmap(struct kvm *kvm, unsigned int id, __u64 addr)
1875{
1876	struct s390_io_adapter *adapter = get_io_adapter(kvm, id);
1877	struct s390_map_info *map, *tmp;
1878	int found = 0;
1879
1880	if (!adapter || !addr)
1881		return -EINVAL;
1882
1883	down_write(&adapter->maps_lock);
1884	list_for_each_entry_safe(map, tmp, &adapter->maps, list) {
1885		if (map->guest_addr == addr) {
1886			found = 1;
1887			atomic_dec(&adapter->nr_maps);
1888			list_del(&map->list);
1889			put_page(map->page);
1890			kfree(map);
1891			break;
1892		}
1893	}
1894	up_write(&adapter->maps_lock);
1895
1896	return found ? 0 : -EINVAL;
1897}
1898
1899void kvm_s390_destroy_adapters(struct kvm *kvm)
1900{
1901	int i;
1902	struct s390_map_info *map, *tmp;
1903
1904	for (i = 0; i < MAX_S390_IO_ADAPTERS; i++) {
1905		if (!kvm->arch.adapters[i])
1906			continue;
1907		list_for_each_entry_safe(map, tmp,
1908					 &kvm->arch.adapters[i]->maps, list) {
1909			list_del(&map->list);
1910			put_page(map->page);
1911			kfree(map);
1912		}
1913		kfree(kvm->arch.adapters[i]);
1914	}
1915}
1916
1917static int modify_io_adapter(struct kvm_device *dev,
1918			     struct kvm_device_attr *attr)
1919{
1920	struct kvm_s390_io_adapter_req req;
1921	struct s390_io_adapter *adapter;
1922	int ret;
1923
1924	if (copy_from_user(&req, (void __user *)attr->addr, sizeof(req)))
1925		return -EFAULT;
1926
1927	adapter = get_io_adapter(dev->kvm, req.id);
1928	if (!adapter)
1929		return -EINVAL;
1930	switch (req.type) {
1931	case KVM_S390_IO_ADAPTER_MASK:
1932		ret = kvm_s390_mask_adapter(dev->kvm, req.id, req.mask);
1933		if (ret > 0)
1934			ret = 0;
1935		break;
1936	case KVM_S390_IO_ADAPTER_MAP:
1937		ret = kvm_s390_adapter_map(dev->kvm, req.id, req.addr);
1938		break;
1939	case KVM_S390_IO_ADAPTER_UNMAP:
1940		ret = kvm_s390_adapter_unmap(dev->kvm, req.id, req.addr);
1941		break;
1942	default:
1943		ret = -EINVAL;
1944	}
1945
1946	return ret;
1947}
1948
1949static int flic_set_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
1950{
1951	int r = 0;
1952	unsigned int i;
1953	struct kvm_vcpu *vcpu;
1954
1955	switch (attr->group) {
1956	case KVM_DEV_FLIC_ENQUEUE:
1957		r = enqueue_floating_irq(dev, attr);
1958		break;
1959	case KVM_DEV_FLIC_CLEAR_IRQS:
1960		kvm_s390_clear_float_irqs(dev->kvm);
1961		break;
1962	case KVM_DEV_FLIC_APF_ENABLE:
1963		dev->kvm->arch.gmap->pfault_enabled = 1;
1964		break;
1965	case KVM_DEV_FLIC_APF_DISABLE_WAIT:
1966		dev->kvm->arch.gmap->pfault_enabled = 0;
1967		/*
1968		 * Make sure no async faults are in transition when
1969		 * clearing the queues. So we don't need to worry
1970		 * about late coming workers.
1971		 */
1972		synchronize_srcu(&dev->kvm->srcu);
1973		kvm_for_each_vcpu(i, vcpu, dev->kvm)
1974			kvm_clear_async_pf_completion_queue(vcpu);
1975		break;
1976	case KVM_DEV_FLIC_ADAPTER_REGISTER:
1977		r = register_io_adapter(dev, attr);
1978		break;
1979	case KVM_DEV_FLIC_ADAPTER_MODIFY:
1980		r = modify_io_adapter(dev, attr);
1981		break;
1982	default:
1983		r = -EINVAL;
1984	}
1985
1986	return r;
1987}
1988
1989static int flic_create(struct kvm_device *dev, u32 type)
1990{
1991	if (!dev)
1992		return -EINVAL;
1993	if (dev->kvm->arch.flic)
1994		return -EINVAL;
1995	dev->kvm->arch.flic = dev;
1996	return 0;
1997}
1998
1999static void flic_destroy(struct kvm_device *dev)
2000{
2001	dev->kvm->arch.flic = NULL;
2002	kfree(dev);
2003}
2004
2005/* s390 floating irq controller (flic) */
2006struct kvm_device_ops kvm_flic_ops = {
2007	.name = "kvm-flic",
2008	.get_attr = flic_get_attr,
2009	.set_attr = flic_set_attr,
2010	.create = flic_create,
2011	.destroy = flic_destroy,
2012};
2013
2014static unsigned long get_ind_bit(__u64 addr, unsigned long bit_nr, bool swap)
2015{
2016	unsigned long bit;
2017
2018	bit = bit_nr + (addr % PAGE_SIZE) * 8;
2019
2020	return swap ? (bit ^ (BITS_PER_LONG - 1)) : bit;
2021}
2022
2023static struct s390_map_info *get_map_info(struct s390_io_adapter *adapter,
2024					  u64 addr)
2025{
2026	struct s390_map_info *map;
2027
2028	if (!adapter)
2029		return NULL;
2030
2031	list_for_each_entry(map, &adapter->maps, list) {
2032		if (map->guest_addr == addr)
2033			return map;
2034	}
2035	return NULL;
2036}
2037
2038static int adapter_indicators_set(struct kvm *kvm,
2039				  struct s390_io_adapter *adapter,
2040				  struct kvm_s390_adapter_int *adapter_int)
2041{
2042	unsigned long bit;
2043	int summary_set, idx;
2044	struct s390_map_info *info;
2045	void *map;
2046
2047	info = get_map_info(adapter, adapter_int->ind_addr);
2048	if (!info)
2049		return -1;
2050	map = page_address(info->page);
2051	bit = get_ind_bit(info->addr, adapter_int->ind_offset, adapter->swap);
2052	set_bit(bit, map);
2053	idx = srcu_read_lock(&kvm->srcu);
2054	mark_page_dirty(kvm, info->guest_addr >> PAGE_SHIFT);
2055	set_page_dirty_lock(info->page);
2056	info = get_map_info(adapter, adapter_int->summary_addr);
2057	if (!info) {
2058		srcu_read_unlock(&kvm->srcu, idx);
2059		return -1;
2060	}
2061	map = page_address(info->page);
2062	bit = get_ind_bit(info->addr, adapter_int->summary_offset,
2063			  adapter->swap);
2064	summary_set = test_and_set_bit(bit, map);
2065	mark_page_dirty(kvm, info->guest_addr >> PAGE_SHIFT);
2066	set_page_dirty_lock(info->page);
2067	srcu_read_unlock(&kvm->srcu, idx);
2068	return summary_set ? 0 : 1;
2069}
2070
2071/*
2072 * < 0 - not injected due to error
2073 * = 0 - coalesced, summary indicator already active
2074 * > 0 - injected interrupt
2075 */
2076static int set_adapter_int(struct kvm_kernel_irq_routing_entry *e,
2077			   struct kvm *kvm, int irq_source_id, int level,
2078			   bool line_status)
2079{
2080	int ret;
2081	struct s390_io_adapter *adapter;
2082
2083	/* We're only interested in the 0->1 transition. */
2084	if (!level)
2085		return 0;
2086	adapter = get_io_adapter(kvm, e->adapter.adapter_id);
2087	if (!adapter)
2088		return -1;
2089	down_read(&adapter->maps_lock);
2090	ret = adapter_indicators_set(kvm, adapter, &e->adapter);
2091	up_read(&adapter->maps_lock);
2092	if ((ret > 0) && !adapter->masked) {
2093		struct kvm_s390_interrupt s390int = {
2094			.type = KVM_S390_INT_IO(1, 0, 0, 0),
2095			.parm = 0,
2096			.parm64 = (adapter->isc << 27) | 0x80000000,
2097		};
2098		ret = kvm_s390_inject_vm(kvm, &s390int);
2099		if (ret == 0)
2100			ret = 1;
2101	}
2102	return ret;
2103}
2104
2105int kvm_set_routing_entry(struct kvm_kernel_irq_routing_entry *e,
2106			  const struct kvm_irq_routing_entry *ue)
2107{
2108	int ret;
2109
2110	switch (ue->type) {
2111	case KVM_IRQ_ROUTING_S390_ADAPTER:
2112		e->set = set_adapter_int;
2113		e->adapter.summary_addr = ue->u.adapter.summary_addr;
2114		e->adapter.ind_addr = ue->u.adapter.ind_addr;
2115		e->adapter.summary_offset = ue->u.adapter.summary_offset;
2116		e->adapter.ind_offset = ue->u.adapter.ind_offset;
2117		e->adapter.adapter_id = ue->u.adapter.adapter_id;
2118		ret = 0;
2119		break;
2120	default:
2121		ret = -EINVAL;
2122	}
2123
2124	return ret;
2125}
2126
2127int kvm_set_msi(struct kvm_kernel_irq_routing_entry *e, struct kvm *kvm,
2128		int irq_source_id, int level, bool line_status)
2129{
2130	return -EINVAL;
2131}
2132
2133int kvm_s390_set_irq_state(struct kvm_vcpu *vcpu, void __user *irqstate, int len)
2134{
2135	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
2136	struct kvm_s390_irq *buf;
2137	int r = 0;
2138	int n;
2139
2140	buf = vmalloc(len);
2141	if (!buf)
2142		return -ENOMEM;
2143
2144	if (copy_from_user((void *) buf, irqstate, len)) {
2145		r = -EFAULT;
2146		goto out_free;
2147	}
2148
2149	/*
2150	 * Don't allow setting the interrupt state
2151	 * when there are already interrupts pending
2152	 */
2153	spin_lock(&li->lock);
2154	if (li->pending_irqs) {
2155		r = -EBUSY;
2156		goto out_unlock;
2157	}
2158
2159	for (n = 0; n < len / sizeof(*buf); n++) {
2160		r = do_inject_vcpu(vcpu, &buf[n]);
2161		if (r)
2162			break;
2163	}
2164
2165out_unlock:
2166	spin_unlock(&li->lock);
2167out_free:
2168	vfree(buf);
2169
2170	return r;
2171}
2172
2173static void store_local_irq(struct kvm_s390_local_interrupt *li,
2174			    struct kvm_s390_irq *irq,
2175			    unsigned long irq_type)
2176{
2177	switch (irq_type) {
2178	case IRQ_PEND_MCHK_EX:
2179	case IRQ_PEND_MCHK_REP:
2180		irq->type = KVM_S390_MCHK;
2181		irq->u.mchk = li->irq.mchk;
2182		break;
2183	case IRQ_PEND_PROG:
2184		irq->type = KVM_S390_PROGRAM_INT;
2185		irq->u.pgm = li->irq.pgm;
2186		break;
2187	case IRQ_PEND_PFAULT_INIT:
2188		irq->type = KVM_S390_INT_PFAULT_INIT;
2189		irq->u.ext = li->irq.ext;
2190		break;
2191	case IRQ_PEND_EXT_EXTERNAL:
2192		irq->type = KVM_S390_INT_EXTERNAL_CALL;
2193		irq->u.extcall = li->irq.extcall;
2194		break;
2195	case IRQ_PEND_EXT_CLOCK_COMP:
2196		irq->type = KVM_S390_INT_CLOCK_COMP;
2197		break;
2198	case IRQ_PEND_EXT_CPU_TIMER:
2199		irq->type = KVM_S390_INT_CPU_TIMER;
2200		break;
2201	case IRQ_PEND_SIGP_STOP:
2202		irq->type = KVM_S390_SIGP_STOP;
2203		irq->u.stop = li->irq.stop;
2204		break;
2205	case IRQ_PEND_RESTART:
2206		irq->type = KVM_S390_RESTART;
2207		break;
2208	case IRQ_PEND_SET_PREFIX:
2209		irq->type = KVM_S390_SIGP_SET_PREFIX;
2210		irq->u.prefix = li->irq.prefix;
2211		break;
2212	}
2213}
2214
2215int kvm_s390_get_irq_state(struct kvm_vcpu *vcpu, __u8 __user *buf, int len)
2216{
2217	uint8_t sigp_ctrl = vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].sigp_ctrl;
2218	unsigned long sigp_emerg_pending[BITS_TO_LONGS(KVM_MAX_VCPUS)];
2219	struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
2220	unsigned long pending_irqs;
2221	struct kvm_s390_irq irq;
2222	unsigned long irq_type;
2223	int cpuaddr;
2224	int n = 0;
2225
2226	spin_lock(&li->lock);
2227	pending_irqs = li->pending_irqs;
2228	memcpy(&sigp_emerg_pending, &li->sigp_emerg_pending,
2229	       sizeof(sigp_emerg_pending));
2230	spin_unlock(&li->lock);
2231
2232	for_each_set_bit(irq_type, &pending_irqs, IRQ_PEND_COUNT) {
2233		memset(&irq, 0, sizeof(irq));
2234		if (irq_type == IRQ_PEND_EXT_EMERGENCY)
2235			continue;
2236		if (n + sizeof(irq) > len)
2237			return -ENOBUFS;
2238		store_local_irq(&vcpu->arch.local_int, &irq, irq_type);
2239		if (copy_to_user(&buf[n], &irq, sizeof(irq)))
2240			return -EFAULT;
2241		n += sizeof(irq);
2242	}
2243
2244	if (test_bit(IRQ_PEND_EXT_EMERGENCY, &pending_irqs)) {
2245		for_each_set_bit(cpuaddr, sigp_emerg_pending, KVM_MAX_VCPUS) {
2246			memset(&irq, 0, sizeof(irq));
2247			if (n + sizeof(irq) > len)
2248				return -ENOBUFS;
2249			irq.type = KVM_S390_INT_EMERGENCY;
2250			irq.u.emerg.code = cpuaddr;
2251			if (copy_to_user(&buf[n], &irq, sizeof(irq)))
2252				return -EFAULT;
2253			n += sizeof(irq);
2254		}
2255	}
2256
2257	if ((sigp_ctrl & SIGP_CTRL_C) &&
2258	    (atomic_read(&vcpu->arch.sie_block->cpuflags) &
2259	     CPUSTAT_ECALL_PEND)) {
2260		if (n + sizeof(irq) > len)
2261			return -ENOBUFS;
2262		memset(&irq, 0, sizeof(irq));
2263		irq.type = KVM_S390_INT_EXTERNAL_CALL;
2264		irq.u.extcall.code = sigp_ctrl & SIGP_CTRL_SCN_MASK;
2265		if (copy_to_user(&buf[n], &irq, sizeof(irq)))
2266			return -EFAULT;
2267		n += sizeof(irq);
2268	}
2269
2270	return n;
2271}
2272