2 * handling kvm guest interrupts
4 * Copyright IBM Corp. 2008, 2015
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License (version 2 only)
8 * as published by the Free Software Foundation.
10 * Author(s): Carsten Otte <cotte@de.ibm.com>
13 #include <linux/interrupt.h>
14 #include <linux/kvm_host.h>
15 #include <linux/hrtimer.h>
16 #include <linux/mmu_context.h>
17 #include <linux/signal.h>
18 #include <linux/slab.h>
19 #include <linux/bitmap.h>
20 #include <linux/vmalloc.h>
21 #include <asm/asm-offsets.h>
23 #include <asm/uaccess.h>
29 #include "trace-s390.h"
31 #define IOINT_SCHID_MASK 0x0000ffff
32 #define IOINT_SSID_MASK 0x00030000
33 #define IOINT_CSSID_MASK 0x03fc0000
34 #define PFAULT_INIT 0x0600
35 #define PFAULT_DONE 0x0680
36 #define VIRTIO_PARAM 0x0d00
38 /* handle external calls via sigp interpretation facility */
39 static int sca_ext_call_pending(struct kvm_vcpu
*vcpu
, int *src_id
)
43 if (!(atomic_read(&vcpu
->arch
.sie_block
->cpuflags
) & CPUSTAT_ECALL_PEND
))
46 read_lock(&vcpu
->kvm
->arch
.sca_lock
);
47 if (vcpu
->kvm
->arch
.use_esca
) {
48 struct esca_block
*sca
= vcpu
->kvm
->arch
.sca
;
49 union esca_sigp_ctrl sigp_ctrl
=
50 sca
->cpu
[vcpu
->vcpu_id
].sigp_ctrl
;
55 struct bsca_block
*sca
= vcpu
->kvm
->arch
.sca
;
56 union bsca_sigp_ctrl sigp_ctrl
=
57 sca
->cpu
[vcpu
->vcpu_id
].sigp_ctrl
;
62 read_unlock(&vcpu
->kvm
->arch
.sca_lock
);
70 static int sca_inject_ext_call(struct kvm_vcpu
*vcpu
, int src_id
)
74 read_lock(&vcpu
->kvm
->arch
.sca_lock
);
75 if (vcpu
->kvm
->arch
.use_esca
) {
76 struct esca_block
*sca
= vcpu
->kvm
->arch
.sca
;
77 union esca_sigp_ctrl
*sigp_ctrl
=
78 &(sca
->cpu
[vcpu
->vcpu_id
].sigp_ctrl
);
79 union esca_sigp_ctrl new_val
= {0}, old_val
= *sigp_ctrl
;
85 expect
= old_val
.value
;
86 rc
= cmpxchg(&sigp_ctrl
->value
, old_val
.value
, new_val
.value
);
88 struct bsca_block
*sca
= vcpu
->kvm
->arch
.sca
;
89 union bsca_sigp_ctrl
*sigp_ctrl
=
90 &(sca
->cpu
[vcpu
->vcpu_id
].sigp_ctrl
);
91 union bsca_sigp_ctrl new_val
= {0}, old_val
= *sigp_ctrl
;
97 expect
= old_val
.value
;
98 rc
= cmpxchg(&sigp_ctrl
->value
, old_val
.value
, new_val
.value
);
100 read_unlock(&vcpu
->kvm
->arch
.sca_lock
);
103 /* another external call is pending */
106 atomic_or(CPUSTAT_ECALL_PEND
, &vcpu
->arch
.sie_block
->cpuflags
);
110 static void sca_clear_ext_call(struct kvm_vcpu
*vcpu
)
112 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
115 atomic_andnot(CPUSTAT_ECALL_PEND
, li
->cpuflags
);
116 read_lock(&vcpu
->kvm
->arch
.sca_lock
);
117 if (vcpu
->kvm
->arch
.use_esca
) {
118 struct esca_block
*sca
= vcpu
->kvm
->arch
.sca
;
119 union esca_sigp_ctrl
*sigp_ctrl
=
120 &(sca
->cpu
[vcpu
->vcpu_id
].sigp_ctrl
);
121 union esca_sigp_ctrl old
= *sigp_ctrl
;
124 rc
= cmpxchg(&sigp_ctrl
->value
, old
.value
, 0);
126 struct bsca_block
*sca
= vcpu
->kvm
->arch
.sca
;
127 union bsca_sigp_ctrl
*sigp_ctrl
=
128 &(sca
->cpu
[vcpu
->vcpu_id
].sigp_ctrl
);
129 union bsca_sigp_ctrl old
= *sigp_ctrl
;
132 rc
= cmpxchg(&sigp_ctrl
->value
, old
.value
, 0);
134 read_unlock(&vcpu
->kvm
->arch
.sca_lock
);
135 WARN_ON(rc
!= expect
); /* cannot clear? */
138 int psw_extint_disabled(struct kvm_vcpu
*vcpu
)
140 return !(vcpu
->arch
.sie_block
->gpsw
.mask
& PSW_MASK_EXT
);
143 static int psw_ioint_disabled(struct kvm_vcpu
*vcpu
)
145 return !(vcpu
->arch
.sie_block
->gpsw
.mask
& PSW_MASK_IO
);
148 static int psw_mchk_disabled(struct kvm_vcpu
*vcpu
)
150 return !(vcpu
->arch
.sie_block
->gpsw
.mask
& PSW_MASK_MCHECK
);
153 static int psw_interrupts_disabled(struct kvm_vcpu
*vcpu
)
155 return psw_extint_disabled(vcpu
) &&
156 psw_ioint_disabled(vcpu
) &&
157 psw_mchk_disabled(vcpu
);
160 static int ckc_interrupts_enabled(struct kvm_vcpu
*vcpu
)
162 if (psw_extint_disabled(vcpu
) ||
163 !(vcpu
->arch
.sie_block
->gcr
[0] & 0x800ul
))
165 if (guestdbg_enabled(vcpu
) && guestdbg_sstep_enabled(vcpu
))
166 /* No timer interrupts when single stepping */
171 static int ckc_irq_pending(struct kvm_vcpu
*vcpu
)
173 if (vcpu
->arch
.sie_block
->ckc
>= kvm_s390_get_tod_clock_fast(vcpu
->kvm
))
175 return ckc_interrupts_enabled(vcpu
);
178 static int cpu_timer_interrupts_enabled(struct kvm_vcpu
*vcpu
)
180 return !psw_extint_disabled(vcpu
) &&
181 (vcpu
->arch
.sie_block
->gcr
[0] & 0x400ul
);
184 static int cpu_timer_irq_pending(struct kvm_vcpu
*vcpu
)
186 return (vcpu
->arch
.sie_block
->cputm
>> 63) &&
187 cpu_timer_interrupts_enabled(vcpu
);
190 static inline int is_ioirq(unsigned long irq_type
)
192 return ((irq_type
>= IRQ_PEND_IO_ISC_0
) &&
193 (irq_type
<= IRQ_PEND_IO_ISC_7
));
196 static uint64_t isc_to_isc_bits(int isc
)
198 return (0x80 >> isc
) << 24;
201 static inline u8
int_word_to_isc(u32 int_word
)
203 return (int_word
& 0x38000000) >> 27;
206 static inline unsigned long pending_irqs(struct kvm_vcpu
*vcpu
)
208 return vcpu
->kvm
->arch
.float_int
.pending_irqs
|
209 vcpu
->arch
.local_int
.pending_irqs
;
212 static unsigned long disable_iscs(struct kvm_vcpu
*vcpu
,
213 unsigned long active_mask
)
217 for (i
= 0; i
<= MAX_ISC
; i
++)
218 if (!(vcpu
->arch
.sie_block
->gcr
[6] & isc_to_isc_bits(i
)))
219 active_mask
&= ~(1UL << (IRQ_PEND_IO_ISC_0
+ i
));
224 static unsigned long deliverable_irqs(struct kvm_vcpu
*vcpu
)
226 unsigned long active_mask
;
228 active_mask
= pending_irqs(vcpu
);
232 if (psw_extint_disabled(vcpu
))
233 active_mask
&= ~IRQ_PEND_EXT_MASK
;
234 if (psw_ioint_disabled(vcpu
))
235 active_mask
&= ~IRQ_PEND_IO_MASK
;
237 active_mask
= disable_iscs(vcpu
, active_mask
);
238 if (!(vcpu
->arch
.sie_block
->gcr
[0] & 0x2000ul
))
239 __clear_bit(IRQ_PEND_EXT_EXTERNAL
, &active_mask
);
240 if (!(vcpu
->arch
.sie_block
->gcr
[0] & 0x4000ul
))
241 __clear_bit(IRQ_PEND_EXT_EMERGENCY
, &active_mask
);
242 if (!(vcpu
->arch
.sie_block
->gcr
[0] & 0x800ul
))
243 __clear_bit(IRQ_PEND_EXT_CLOCK_COMP
, &active_mask
);
244 if (!(vcpu
->arch
.sie_block
->gcr
[0] & 0x400ul
))
245 __clear_bit(IRQ_PEND_EXT_CPU_TIMER
, &active_mask
);
246 if (!(vcpu
->arch
.sie_block
->gcr
[0] & 0x200ul
))
247 __clear_bit(IRQ_PEND_EXT_SERVICE
, &active_mask
);
248 if (psw_mchk_disabled(vcpu
))
249 active_mask
&= ~IRQ_PEND_MCHK_MASK
;
250 if (!(vcpu
->arch
.sie_block
->gcr
[14] &
251 vcpu
->kvm
->arch
.float_int
.mchk
.cr14
))
252 __clear_bit(IRQ_PEND_MCHK_REP
, &active_mask
);
255 * STOP irqs will never be actively delivered. They are triggered via
256 * intercept requests and cleared when the stop intercept is performed.
258 __clear_bit(IRQ_PEND_SIGP_STOP
, &active_mask
);
263 static void __set_cpu_idle(struct kvm_vcpu
*vcpu
)
265 atomic_or(CPUSTAT_WAIT
, &vcpu
->arch
.sie_block
->cpuflags
);
266 set_bit(vcpu
->vcpu_id
, vcpu
->arch
.local_int
.float_int
->idle_mask
);
269 static void __unset_cpu_idle(struct kvm_vcpu
*vcpu
)
271 atomic_andnot(CPUSTAT_WAIT
, &vcpu
->arch
.sie_block
->cpuflags
);
272 clear_bit(vcpu
->vcpu_id
, vcpu
->arch
.local_int
.float_int
->idle_mask
);
275 static void __reset_intercept_indicators(struct kvm_vcpu
*vcpu
)
277 atomic_andnot(CPUSTAT_IO_INT
| CPUSTAT_EXT_INT
| CPUSTAT_STOP_INT
,
278 &vcpu
->arch
.sie_block
->cpuflags
);
279 vcpu
->arch
.sie_block
->lctl
= 0x0000;
280 vcpu
->arch
.sie_block
->ictl
&= ~(ICTL_LPSW
| ICTL_STCTL
| ICTL_PINT
);
282 if (guestdbg_enabled(vcpu
)) {
283 vcpu
->arch
.sie_block
->lctl
|= (LCTL_CR0
| LCTL_CR9
|
284 LCTL_CR10
| LCTL_CR11
);
285 vcpu
->arch
.sie_block
->ictl
|= (ICTL_STCTL
| ICTL_PINT
);
289 static void __set_cpuflag(struct kvm_vcpu
*vcpu
, u32 flag
)
291 atomic_or(flag
, &vcpu
->arch
.sie_block
->cpuflags
);
294 static void set_intercept_indicators_io(struct kvm_vcpu
*vcpu
)
296 if (!(pending_irqs(vcpu
) & IRQ_PEND_IO_MASK
))
298 else if (psw_ioint_disabled(vcpu
))
299 __set_cpuflag(vcpu
, CPUSTAT_IO_INT
);
301 vcpu
->arch
.sie_block
->lctl
|= LCTL_CR6
;
304 static void set_intercept_indicators_ext(struct kvm_vcpu
*vcpu
)
306 if (!(pending_irqs(vcpu
) & IRQ_PEND_EXT_MASK
))
308 if (psw_extint_disabled(vcpu
))
309 __set_cpuflag(vcpu
, CPUSTAT_EXT_INT
);
311 vcpu
->arch
.sie_block
->lctl
|= LCTL_CR0
;
314 static void set_intercept_indicators_mchk(struct kvm_vcpu
*vcpu
)
316 if (!(pending_irqs(vcpu
) & IRQ_PEND_MCHK_MASK
))
318 if (psw_mchk_disabled(vcpu
))
319 vcpu
->arch
.sie_block
->ictl
|= ICTL_LPSW
;
321 vcpu
->arch
.sie_block
->lctl
|= LCTL_CR14
;
324 static void set_intercept_indicators_stop(struct kvm_vcpu
*vcpu
)
326 if (kvm_s390_is_stop_irq_pending(vcpu
))
327 __set_cpuflag(vcpu
, CPUSTAT_STOP_INT
);
330 /* Set interception request for non-deliverable interrupts */
331 static void set_intercept_indicators(struct kvm_vcpu
*vcpu
)
333 set_intercept_indicators_io(vcpu
);
334 set_intercept_indicators_ext(vcpu
);
335 set_intercept_indicators_mchk(vcpu
);
336 set_intercept_indicators_stop(vcpu
);
339 static u16
get_ilc(struct kvm_vcpu
*vcpu
)
341 switch (vcpu
->arch
.sie_block
->icptcode
) {
347 /* last instruction only stored for these icptcodes */
348 return insn_length(vcpu
->arch
.sie_block
->ipa
>> 8);
350 return vcpu
->arch
.sie_block
->pgmilc
;
356 static int __must_check
__deliver_cpu_timer(struct kvm_vcpu
*vcpu
)
358 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
361 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
, KVM_S390_INT_CPU_TIMER
,
364 rc
= put_guest_lc(vcpu
, EXT_IRQ_CPU_TIMER
,
365 (u16
*)__LC_EXT_INT_CODE
);
366 rc
|= put_guest_lc(vcpu
, 0, (u16
*)__LC_EXT_CPU_ADDR
);
367 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
368 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
369 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
,
370 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
371 clear_bit(IRQ_PEND_EXT_CPU_TIMER
, &li
->pending_irqs
);
372 return rc
? -EFAULT
: 0;
375 static int __must_check
__deliver_ckc(struct kvm_vcpu
*vcpu
)
377 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
380 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
, KVM_S390_INT_CLOCK_COMP
,
383 rc
= put_guest_lc(vcpu
, EXT_IRQ_CLK_COMP
,
384 (u16 __user
*)__LC_EXT_INT_CODE
);
385 rc
|= put_guest_lc(vcpu
, 0, (u16
*)__LC_EXT_CPU_ADDR
);
386 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
387 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
388 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
,
389 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
390 clear_bit(IRQ_PEND_EXT_CLOCK_COMP
, &li
->pending_irqs
);
391 return rc
? -EFAULT
: 0;
394 static int __must_check
__deliver_pfault_init(struct kvm_vcpu
*vcpu
)
396 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
397 struct kvm_s390_ext_info ext
;
400 spin_lock(&li
->lock
);
402 clear_bit(IRQ_PEND_PFAULT_INIT
, &li
->pending_irqs
);
403 li
->irq
.ext
.ext_params2
= 0;
404 spin_unlock(&li
->lock
);
406 VCPU_EVENT(vcpu
, 4, "deliver: pfault init token 0x%llx",
408 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
,
409 KVM_S390_INT_PFAULT_INIT
,
412 rc
= put_guest_lc(vcpu
, EXT_IRQ_CP_SERVICE
, (u16
*) __LC_EXT_INT_CODE
);
413 rc
|= put_guest_lc(vcpu
, PFAULT_INIT
, (u16
*) __LC_EXT_CPU_ADDR
);
414 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
415 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
416 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
,
417 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
418 rc
|= put_guest_lc(vcpu
, ext
.ext_params2
, (u64
*) __LC_EXT_PARAMS2
);
419 return rc
? -EFAULT
: 0;
422 static int __must_check
__deliver_machine_check(struct kvm_vcpu
*vcpu
)
424 struct kvm_s390_float_interrupt
*fi
= &vcpu
->kvm
->arch
.float_int
;
425 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
426 struct kvm_s390_mchk_info mchk
= {};
427 unsigned long adtl_status_addr
;
431 spin_lock(&fi
->lock
);
432 spin_lock(&li
->lock
);
433 if (test_bit(IRQ_PEND_MCHK_EX
, &li
->pending_irqs
) ||
434 test_bit(IRQ_PEND_MCHK_REP
, &li
->pending_irqs
)) {
436 * If there was an exigent machine check pending, then any
437 * repressible machine checks that might have been pending
438 * are indicated along with it, so always clear bits for
439 * repressible and exigent interrupts
442 clear_bit(IRQ_PEND_MCHK_EX
, &li
->pending_irqs
);
443 clear_bit(IRQ_PEND_MCHK_REP
, &li
->pending_irqs
);
444 memset(&li
->irq
.mchk
, 0, sizeof(mchk
));
448 * We indicate floating repressible conditions along with
449 * other pending conditions. Channel Report Pending and Channel
450 * Subsystem damage are the only two and and are indicated by
451 * bits in mcic and masked in cr14.
453 if (test_and_clear_bit(IRQ_PEND_MCHK_REP
, &fi
->pending_irqs
)) {
454 mchk
.mcic
|= fi
->mchk
.mcic
;
455 mchk
.cr14
|= fi
->mchk
.cr14
;
456 memset(&fi
->mchk
, 0, sizeof(mchk
));
459 spin_unlock(&li
->lock
);
460 spin_unlock(&fi
->lock
);
463 VCPU_EVENT(vcpu
, 3, "deliver: machine check mcic 0x%llx",
465 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
,
467 mchk
.cr14
, mchk
.mcic
);
469 rc
= kvm_s390_vcpu_store_status(vcpu
,
470 KVM_S390_STORE_STATUS_PREFIXED
);
471 rc
|= read_guest_lc(vcpu
, __LC_VX_SAVE_AREA_ADDR
,
473 sizeof(unsigned long));
474 rc
|= kvm_s390_vcpu_store_adtl_status(vcpu
,
476 rc
|= put_guest_lc(vcpu
, mchk
.mcic
,
477 (u64 __user
*) __LC_MCCK_CODE
);
478 rc
|= put_guest_lc(vcpu
, mchk
.failing_storage_address
,
479 (u64 __user
*) __LC_MCCK_FAIL_STOR_ADDR
);
480 rc
|= write_guest_lc(vcpu
, __LC_PSW_SAVE_AREA
,
482 sizeof(mchk
.fixed_logout
));
483 rc
|= write_guest_lc(vcpu
, __LC_MCK_OLD_PSW
,
484 &vcpu
->arch
.sie_block
->gpsw
,
486 rc
|= read_guest_lc(vcpu
, __LC_MCK_NEW_PSW
,
487 &vcpu
->arch
.sie_block
->gpsw
,
490 return rc
? -EFAULT
: 0;
493 static int __must_check
__deliver_restart(struct kvm_vcpu
*vcpu
)
495 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
498 VCPU_EVENT(vcpu
, 3, "%s", "deliver: cpu restart");
499 vcpu
->stat
.deliver_restart_signal
++;
500 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
, KVM_S390_RESTART
, 0, 0);
502 rc
= write_guest_lc(vcpu
,
503 offsetof(struct lowcore
, restart_old_psw
),
504 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
505 rc
|= read_guest_lc(vcpu
, offsetof(struct lowcore
, restart_psw
),
506 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
507 clear_bit(IRQ_PEND_RESTART
, &li
->pending_irqs
);
508 return rc
? -EFAULT
: 0;
511 static int __must_check
__deliver_set_prefix(struct kvm_vcpu
*vcpu
)
513 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
514 struct kvm_s390_prefix_info prefix
;
516 spin_lock(&li
->lock
);
517 prefix
= li
->irq
.prefix
;
518 li
->irq
.prefix
.address
= 0;
519 clear_bit(IRQ_PEND_SET_PREFIX
, &li
->pending_irqs
);
520 spin_unlock(&li
->lock
);
522 vcpu
->stat
.deliver_prefix_signal
++;
523 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
,
524 KVM_S390_SIGP_SET_PREFIX
,
527 kvm_s390_set_prefix(vcpu
, prefix
.address
);
531 static int __must_check
__deliver_emergency_signal(struct kvm_vcpu
*vcpu
)
533 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
537 spin_lock(&li
->lock
);
538 cpu_addr
= find_first_bit(li
->sigp_emerg_pending
, KVM_MAX_VCPUS
);
539 clear_bit(cpu_addr
, li
->sigp_emerg_pending
);
540 if (bitmap_empty(li
->sigp_emerg_pending
, KVM_MAX_VCPUS
))
541 clear_bit(IRQ_PEND_EXT_EMERGENCY
, &li
->pending_irqs
);
542 spin_unlock(&li
->lock
);
544 VCPU_EVENT(vcpu
, 4, "%s", "deliver: sigp emerg");
545 vcpu
->stat
.deliver_emergency_signal
++;
546 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
, KVM_S390_INT_EMERGENCY
,
549 rc
= put_guest_lc(vcpu
, EXT_IRQ_EMERGENCY_SIG
,
550 (u16
*)__LC_EXT_INT_CODE
);
551 rc
|= put_guest_lc(vcpu
, cpu_addr
, (u16
*)__LC_EXT_CPU_ADDR
);
552 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
553 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
554 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
,
555 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
556 return rc
? -EFAULT
: 0;
559 static int __must_check
__deliver_external_call(struct kvm_vcpu
*vcpu
)
561 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
562 struct kvm_s390_extcall_info extcall
;
565 spin_lock(&li
->lock
);
566 extcall
= li
->irq
.extcall
;
567 li
->irq
.extcall
.code
= 0;
568 clear_bit(IRQ_PEND_EXT_EXTERNAL
, &li
->pending_irqs
);
569 spin_unlock(&li
->lock
);
571 VCPU_EVENT(vcpu
, 4, "%s", "deliver: sigp ext call");
572 vcpu
->stat
.deliver_external_call
++;
573 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
,
574 KVM_S390_INT_EXTERNAL_CALL
,
577 rc
= put_guest_lc(vcpu
, EXT_IRQ_EXTERNAL_CALL
,
578 (u16
*)__LC_EXT_INT_CODE
);
579 rc
|= put_guest_lc(vcpu
, extcall
.code
, (u16
*)__LC_EXT_CPU_ADDR
);
580 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
581 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
582 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
, &vcpu
->arch
.sie_block
->gpsw
,
584 return rc
? -EFAULT
: 0;
587 static int __must_check
__deliver_prog(struct kvm_vcpu
*vcpu
)
589 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
590 struct kvm_s390_pgm_info pgm_info
;
591 int rc
= 0, nullifying
= false;
592 u16 ilc
= get_ilc(vcpu
);
594 spin_lock(&li
->lock
);
595 pgm_info
= li
->irq
.pgm
;
596 clear_bit(IRQ_PEND_PROG
, &li
->pending_irqs
);
597 memset(&li
->irq
.pgm
, 0, sizeof(pgm_info
));
598 spin_unlock(&li
->lock
);
600 VCPU_EVENT(vcpu
, 3, "deliver: program irq code 0x%x, ilc:%d",
602 vcpu
->stat
.deliver_program_int
++;
603 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
, KVM_S390_PROGRAM_INT
,
606 switch (pgm_info
.code
& ~PGM_PER
) {
607 case PGM_AFX_TRANSLATION
:
608 case PGM_ASX_TRANSLATION
:
609 case PGM_EX_TRANSLATION
:
610 case PGM_LFX_TRANSLATION
:
611 case PGM_LSTE_SEQUENCE
:
612 case PGM_LSX_TRANSLATION
:
613 case PGM_LX_TRANSLATION
:
614 case PGM_PRIMARY_AUTHORITY
:
615 case PGM_SECONDARY_AUTHORITY
:
618 case PGM_SPACE_SWITCH
:
619 rc
= put_guest_lc(vcpu
, pgm_info
.trans_exc_code
,
620 (u64
*)__LC_TRANS_EXC_CODE
);
622 case PGM_ALEN_TRANSLATION
:
623 case PGM_ALE_SEQUENCE
:
624 case PGM_ASTE_INSTANCE
:
625 case PGM_ASTE_SEQUENCE
:
626 case PGM_ASTE_VALIDITY
:
627 case PGM_EXTENDED_AUTHORITY
:
628 rc
= put_guest_lc(vcpu
, pgm_info
.exc_access_id
,
629 (u8
*)__LC_EXC_ACCESS_ID
);
633 case PGM_PAGE_TRANSLATION
:
634 case PGM_REGION_FIRST_TRANS
:
635 case PGM_REGION_SECOND_TRANS
:
636 case PGM_REGION_THIRD_TRANS
:
637 case PGM_SEGMENT_TRANSLATION
:
638 rc
= put_guest_lc(vcpu
, pgm_info
.trans_exc_code
,
639 (u64
*)__LC_TRANS_EXC_CODE
);
640 rc
|= put_guest_lc(vcpu
, pgm_info
.exc_access_id
,
641 (u8
*)__LC_EXC_ACCESS_ID
);
642 rc
|= put_guest_lc(vcpu
, pgm_info
.op_access_id
,
643 (u8
*)__LC_OP_ACCESS_ID
);
647 rc
= put_guest_lc(vcpu
, pgm_info
.mon_class_nr
,
648 (u16
*)__LC_MON_CLASS_NR
);
649 rc
|= put_guest_lc(vcpu
, pgm_info
.mon_code
,
650 (u64
*)__LC_MON_CODE
);
652 case PGM_VECTOR_PROCESSING
:
654 rc
= put_guest_lc(vcpu
, pgm_info
.data_exc_code
,
655 (u32
*)__LC_DATA_EXC_CODE
);
658 rc
= put_guest_lc(vcpu
, pgm_info
.trans_exc_code
,
659 (u64
*)__LC_TRANS_EXC_CODE
);
660 rc
|= put_guest_lc(vcpu
, pgm_info
.exc_access_id
,
661 (u8
*)__LC_EXC_ACCESS_ID
);
664 case PGM_STACK_EMPTY
:
665 case PGM_STACK_SPECIFICATION
:
667 case PGM_STACK_OPERATION
:
668 case PGM_TRACE_TABEL
:
669 case PGM_CRYPTO_OPERATION
:
674 if (pgm_info
.code
& PGM_PER
) {
675 rc
|= put_guest_lc(vcpu
, pgm_info
.per_code
,
676 (u8
*) __LC_PER_CODE
);
677 rc
|= put_guest_lc(vcpu
, pgm_info
.per_atmid
,
678 (u8
*)__LC_PER_ATMID
);
679 rc
|= put_guest_lc(vcpu
, pgm_info
.per_address
,
680 (u64
*) __LC_PER_ADDRESS
);
681 rc
|= put_guest_lc(vcpu
, pgm_info
.per_access_id
,
682 (u8
*) __LC_PER_ACCESS_ID
);
685 if (nullifying
&& vcpu
->arch
.sie_block
->icptcode
== ICPT_INST
)
686 kvm_s390_rewind_psw(vcpu
, ilc
);
688 rc
|= put_guest_lc(vcpu
, ilc
, (u16
*) __LC_PGM_ILC
);
689 rc
|= put_guest_lc(vcpu
, vcpu
->arch
.sie_block
->gbea
,
690 (u64
*) __LC_LAST_BREAK
);
691 rc
|= put_guest_lc(vcpu
, pgm_info
.code
,
692 (u16
*)__LC_PGM_INT_CODE
);
693 rc
|= write_guest_lc(vcpu
, __LC_PGM_OLD_PSW
,
694 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
695 rc
|= read_guest_lc(vcpu
, __LC_PGM_NEW_PSW
,
696 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
697 return rc
? -EFAULT
: 0;
700 static int __must_check
__deliver_service(struct kvm_vcpu
*vcpu
)
702 struct kvm_s390_float_interrupt
*fi
= &vcpu
->kvm
->arch
.float_int
;
703 struct kvm_s390_ext_info ext
;
706 spin_lock(&fi
->lock
);
707 if (!(test_bit(IRQ_PEND_EXT_SERVICE
, &fi
->pending_irqs
))) {
708 spin_unlock(&fi
->lock
);
711 ext
= fi
->srv_signal
;
712 memset(&fi
->srv_signal
, 0, sizeof(ext
));
713 clear_bit(IRQ_PEND_EXT_SERVICE
, &fi
->pending_irqs
);
714 spin_unlock(&fi
->lock
);
716 VCPU_EVENT(vcpu
, 4, "deliver: sclp parameter 0x%x",
718 vcpu
->stat
.deliver_service_signal
++;
719 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
, KVM_S390_INT_SERVICE
,
722 rc
= put_guest_lc(vcpu
, EXT_IRQ_SERVICE_SIG
, (u16
*)__LC_EXT_INT_CODE
);
723 rc
|= put_guest_lc(vcpu
, 0, (u16
*)__LC_EXT_CPU_ADDR
);
724 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
725 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
726 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
,
727 &vcpu
->arch
.sie_block
->gpsw
, sizeof(psw_t
));
728 rc
|= put_guest_lc(vcpu
, ext
.ext_params
,
729 (u32
*)__LC_EXT_PARAMS
);
731 return rc
? -EFAULT
: 0;
734 static int __must_check
__deliver_pfault_done(struct kvm_vcpu
*vcpu
)
736 struct kvm_s390_float_interrupt
*fi
= &vcpu
->kvm
->arch
.float_int
;
737 struct kvm_s390_interrupt_info
*inti
;
740 spin_lock(&fi
->lock
);
741 inti
= list_first_entry_or_null(&fi
->lists
[FIRQ_LIST_PFAULT
],
742 struct kvm_s390_interrupt_info
,
745 list_del(&inti
->list
);
746 fi
->counters
[FIRQ_CNTR_PFAULT
] -= 1;
748 if (list_empty(&fi
->lists
[FIRQ_LIST_PFAULT
]))
749 clear_bit(IRQ_PEND_PFAULT_DONE
, &fi
->pending_irqs
);
750 spin_unlock(&fi
->lock
);
753 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
,
754 KVM_S390_INT_PFAULT_DONE
, 0,
755 inti
->ext
.ext_params2
);
756 VCPU_EVENT(vcpu
, 4, "deliver: pfault done token 0x%llx",
757 inti
->ext
.ext_params2
);
759 rc
= put_guest_lc(vcpu
, EXT_IRQ_CP_SERVICE
,
760 (u16
*)__LC_EXT_INT_CODE
);
761 rc
|= put_guest_lc(vcpu
, PFAULT_DONE
,
762 (u16
*)__LC_EXT_CPU_ADDR
);
763 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
764 &vcpu
->arch
.sie_block
->gpsw
,
766 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
,
767 &vcpu
->arch
.sie_block
->gpsw
,
769 rc
|= put_guest_lc(vcpu
, inti
->ext
.ext_params2
,
770 (u64
*)__LC_EXT_PARAMS2
);
773 return rc
? -EFAULT
: 0;
776 static int __must_check
__deliver_virtio(struct kvm_vcpu
*vcpu
)
778 struct kvm_s390_float_interrupt
*fi
= &vcpu
->kvm
->arch
.float_int
;
779 struct kvm_s390_interrupt_info
*inti
;
782 spin_lock(&fi
->lock
);
783 inti
= list_first_entry_or_null(&fi
->lists
[FIRQ_LIST_VIRTIO
],
784 struct kvm_s390_interrupt_info
,
788 "deliver: virtio parm: 0x%x,parm64: 0x%llx",
789 inti
->ext
.ext_params
, inti
->ext
.ext_params2
);
790 vcpu
->stat
.deliver_virtio_interrupt
++;
791 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
,
793 inti
->ext
.ext_params
,
794 inti
->ext
.ext_params2
);
795 list_del(&inti
->list
);
796 fi
->counters
[FIRQ_CNTR_VIRTIO
] -= 1;
798 if (list_empty(&fi
->lists
[FIRQ_LIST_VIRTIO
]))
799 clear_bit(IRQ_PEND_VIRTIO
, &fi
->pending_irqs
);
800 spin_unlock(&fi
->lock
);
803 rc
= put_guest_lc(vcpu
, EXT_IRQ_CP_SERVICE
,
804 (u16
*)__LC_EXT_INT_CODE
);
805 rc
|= put_guest_lc(vcpu
, VIRTIO_PARAM
,
806 (u16
*)__LC_EXT_CPU_ADDR
);
807 rc
|= write_guest_lc(vcpu
, __LC_EXT_OLD_PSW
,
808 &vcpu
->arch
.sie_block
->gpsw
,
810 rc
|= read_guest_lc(vcpu
, __LC_EXT_NEW_PSW
,
811 &vcpu
->arch
.sie_block
->gpsw
,
813 rc
|= put_guest_lc(vcpu
, inti
->ext
.ext_params
,
814 (u32
*)__LC_EXT_PARAMS
);
815 rc
|= put_guest_lc(vcpu
, inti
->ext
.ext_params2
,
816 (u64
*)__LC_EXT_PARAMS2
);
819 return rc
? -EFAULT
: 0;
822 static int __must_check
__deliver_io(struct kvm_vcpu
*vcpu
,
823 unsigned long irq_type
)
825 struct list_head
*isc_list
;
826 struct kvm_s390_float_interrupt
*fi
;
827 struct kvm_s390_interrupt_info
*inti
= NULL
;
830 fi
= &vcpu
->kvm
->arch
.float_int
;
832 spin_lock(&fi
->lock
);
833 isc_list
= &fi
->lists
[irq_type
- IRQ_PEND_IO_ISC_0
];
834 inti
= list_first_entry_or_null(isc_list
,
835 struct kvm_s390_interrupt_info
,
838 VCPU_EVENT(vcpu
, 4, "deliver: I/O 0x%llx", inti
->type
);
839 vcpu
->stat
.deliver_io_int
++;
840 trace_kvm_s390_deliver_interrupt(vcpu
->vcpu_id
,
842 ((__u32
)inti
->io
.subchannel_id
<< 16) |
843 inti
->io
.subchannel_nr
,
844 ((__u64
)inti
->io
.io_int_parm
<< 32) |
845 inti
->io
.io_int_word
);
846 list_del(&inti
->list
);
847 fi
->counters
[FIRQ_CNTR_IO
] -= 1;
849 if (list_empty(isc_list
))
850 clear_bit(irq_type
, &fi
->pending_irqs
);
851 spin_unlock(&fi
->lock
);
854 rc
= put_guest_lc(vcpu
, inti
->io
.subchannel_id
,
855 (u16
*)__LC_SUBCHANNEL_ID
);
856 rc
|= put_guest_lc(vcpu
, inti
->io
.subchannel_nr
,
857 (u16
*)__LC_SUBCHANNEL_NR
);
858 rc
|= put_guest_lc(vcpu
, inti
->io
.io_int_parm
,
859 (u32
*)__LC_IO_INT_PARM
);
860 rc
|= put_guest_lc(vcpu
, inti
->io
.io_int_word
,
861 (u32
*)__LC_IO_INT_WORD
);
862 rc
|= write_guest_lc(vcpu
, __LC_IO_OLD_PSW
,
863 &vcpu
->arch
.sie_block
->gpsw
,
865 rc
|= read_guest_lc(vcpu
, __LC_IO_NEW_PSW
,
866 &vcpu
->arch
.sie_block
->gpsw
,
871 return rc
? -EFAULT
: 0;
874 typedef int (*deliver_irq_t
)(struct kvm_vcpu
*vcpu
);
876 static const deliver_irq_t deliver_irq_funcs
[] = {
877 [IRQ_PEND_MCHK_EX
] = __deliver_machine_check
,
878 [IRQ_PEND_MCHK_REP
] = __deliver_machine_check
,
879 [IRQ_PEND_PROG
] = __deliver_prog
,
880 [IRQ_PEND_EXT_EMERGENCY
] = __deliver_emergency_signal
,
881 [IRQ_PEND_EXT_EXTERNAL
] = __deliver_external_call
,
882 [IRQ_PEND_EXT_CLOCK_COMP
] = __deliver_ckc
,
883 [IRQ_PEND_EXT_CPU_TIMER
] = __deliver_cpu_timer
,
884 [IRQ_PEND_RESTART
] = __deliver_restart
,
885 [IRQ_PEND_SET_PREFIX
] = __deliver_set_prefix
,
886 [IRQ_PEND_PFAULT_INIT
] = __deliver_pfault_init
,
887 [IRQ_PEND_EXT_SERVICE
] = __deliver_service
,
888 [IRQ_PEND_PFAULT_DONE
] = __deliver_pfault_done
,
889 [IRQ_PEND_VIRTIO
] = __deliver_virtio
,
892 /* Check whether an external call is pending (deliverable or not) */
893 int kvm_s390_ext_call_pending(struct kvm_vcpu
*vcpu
)
895 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
897 if (!sclp
.has_sigpif
)
898 return test_bit(IRQ_PEND_EXT_EXTERNAL
, &li
->pending_irqs
);
900 return sca_ext_call_pending(vcpu
, NULL
);
903 int kvm_s390_vcpu_has_irq(struct kvm_vcpu
*vcpu
, int exclude_stop
)
905 if (deliverable_irqs(vcpu
))
908 if (kvm_cpu_has_pending_timer(vcpu
))
911 /* external call pending and deliverable */
912 if (kvm_s390_ext_call_pending(vcpu
) &&
913 !psw_extint_disabled(vcpu
) &&
914 (vcpu
->arch
.sie_block
->gcr
[0] & 0x2000ul
))
917 if (!exclude_stop
&& kvm_s390_is_stop_irq_pending(vcpu
))
922 int kvm_cpu_has_pending_timer(struct kvm_vcpu
*vcpu
)
924 return ckc_irq_pending(vcpu
) || cpu_timer_irq_pending(vcpu
);
927 int kvm_s390_handle_wait(struct kvm_vcpu
*vcpu
)
931 vcpu
->stat
.exit_wait_state
++;
934 if (kvm_arch_vcpu_runnable(vcpu
))
937 if (psw_interrupts_disabled(vcpu
)) {
938 VCPU_EVENT(vcpu
, 3, "%s", "disabled wait");
939 return -EOPNOTSUPP
; /* disabled wait */
942 if (!ckc_interrupts_enabled(vcpu
)) {
943 VCPU_EVENT(vcpu
, 3, "%s", "enabled wait w/o timer");
944 __set_cpu_idle(vcpu
);
948 now
= kvm_s390_get_tod_clock_fast(vcpu
->kvm
);
949 sltime
= tod_to_ns(vcpu
->arch
.sie_block
->ckc
- now
);
952 if (vcpu
->arch
.sie_block
->ckc
< now
)
955 __set_cpu_idle(vcpu
);
956 hrtimer_start(&vcpu
->arch
.ckc_timer
, ktime_set (0, sltime
) , HRTIMER_MODE_REL
);
957 VCPU_EVENT(vcpu
, 4, "enabled wait via clock comparator: %llu ns", sltime
);
959 srcu_read_unlock(&vcpu
->kvm
->srcu
, vcpu
->srcu_idx
);
960 kvm_vcpu_block(vcpu
);
961 __unset_cpu_idle(vcpu
);
962 vcpu
->srcu_idx
= srcu_read_lock(&vcpu
->kvm
->srcu
);
964 hrtimer_cancel(&vcpu
->arch
.ckc_timer
);
968 void kvm_s390_vcpu_wakeup(struct kvm_vcpu
*vcpu
)
970 if (waitqueue_active(&vcpu
->wq
)) {
972 * The vcpu gave up the cpu voluntarily, mark it as a good
975 vcpu
->preempted
= true;
976 wake_up_interruptible(&vcpu
->wq
);
977 vcpu
->stat
.halt_wakeup
++;
981 enum hrtimer_restart
kvm_s390_idle_wakeup(struct hrtimer
*timer
)
983 struct kvm_vcpu
*vcpu
;
986 vcpu
= container_of(timer
, struct kvm_vcpu
, arch
.ckc_timer
);
987 now
= kvm_s390_get_tod_clock_fast(vcpu
->kvm
);
988 sltime
= tod_to_ns(vcpu
->arch
.sie_block
->ckc
- now
);
991 * If the monotonic clock runs faster than the tod clock we might be
992 * woken up too early and have to go back to sleep to avoid deadlocks.
994 if (vcpu
->arch
.sie_block
->ckc
> now
&&
995 hrtimer_forward_now(timer
, ns_to_ktime(sltime
)))
996 return HRTIMER_RESTART
;
997 kvm_s390_vcpu_wakeup(vcpu
);
998 return HRTIMER_NORESTART
;
1001 void kvm_s390_clear_local_irqs(struct kvm_vcpu
*vcpu
)
1003 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1005 spin_lock(&li
->lock
);
1006 li
->pending_irqs
= 0;
1007 bitmap_zero(li
->sigp_emerg_pending
, KVM_MAX_VCPUS
);
1008 memset(&li
->irq
, 0, sizeof(li
->irq
));
1009 spin_unlock(&li
->lock
);
1011 sca_clear_ext_call(vcpu
);
1014 int __must_check
kvm_s390_deliver_pending_interrupts(struct kvm_vcpu
*vcpu
)
1016 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1019 unsigned long irq_type
;
1022 __reset_intercept_indicators(vcpu
);
1024 /* pending ckc conditions might have been invalidated */
1025 clear_bit(IRQ_PEND_EXT_CLOCK_COMP
, &li
->pending_irqs
);
1026 if (ckc_irq_pending(vcpu
))
1027 set_bit(IRQ_PEND_EXT_CLOCK_COMP
, &li
->pending_irqs
);
1029 /* pending cpu timer conditions might have been invalidated */
1030 clear_bit(IRQ_PEND_EXT_CPU_TIMER
, &li
->pending_irqs
);
1031 if (cpu_timer_irq_pending(vcpu
))
1032 set_bit(IRQ_PEND_EXT_CPU_TIMER
, &li
->pending_irqs
);
1034 while ((irqs
= deliverable_irqs(vcpu
)) && !rc
) {
1035 /* bits are in the order of interrupt priority */
1036 irq_type
= find_first_bit(&irqs
, IRQ_PEND_COUNT
);
1037 if (is_ioirq(irq_type
)) {
1038 rc
= __deliver_io(vcpu
, irq_type
);
1040 func
= deliver_irq_funcs
[irq_type
];
1042 WARN_ON_ONCE(func
== NULL
);
1043 clear_bit(irq_type
, &li
->pending_irqs
);
1050 set_intercept_indicators(vcpu
);
1055 static int __inject_prog(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1057 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1059 VCPU_EVENT(vcpu
, 3, "inject: program irq code 0x%x", irq
->u
.pgm
.code
);
1060 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_PROGRAM_INT
,
1061 irq
->u
.pgm
.code
, 0);
1063 if (irq
->u
.pgm
.code
== PGM_PER
) {
1064 li
->irq
.pgm
.code
|= PGM_PER
;
1065 /* only modify PER related information */
1066 li
->irq
.pgm
.per_address
= irq
->u
.pgm
.per_address
;
1067 li
->irq
.pgm
.per_code
= irq
->u
.pgm
.per_code
;
1068 li
->irq
.pgm
.per_atmid
= irq
->u
.pgm
.per_atmid
;
1069 li
->irq
.pgm
.per_access_id
= irq
->u
.pgm
.per_access_id
;
1070 } else if (!(irq
->u
.pgm
.code
& PGM_PER
)) {
1071 li
->irq
.pgm
.code
= (li
->irq
.pgm
.code
& PGM_PER
) |
1073 /* only modify non-PER information */
1074 li
->irq
.pgm
.trans_exc_code
= irq
->u
.pgm
.trans_exc_code
;
1075 li
->irq
.pgm
.mon_code
= irq
->u
.pgm
.mon_code
;
1076 li
->irq
.pgm
.data_exc_code
= irq
->u
.pgm
.data_exc_code
;
1077 li
->irq
.pgm
.mon_class_nr
= irq
->u
.pgm
.mon_class_nr
;
1078 li
->irq
.pgm
.exc_access_id
= irq
->u
.pgm
.exc_access_id
;
1079 li
->irq
.pgm
.op_access_id
= irq
->u
.pgm
.op_access_id
;
1081 li
->irq
.pgm
= irq
->u
.pgm
;
1083 set_bit(IRQ_PEND_PROG
, &li
->pending_irqs
);
1087 static int __inject_pfault_init(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1089 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1091 VCPU_EVENT(vcpu
, 4, "inject: pfault init parameter block at 0x%llx",
1092 irq
->u
.ext
.ext_params2
);
1093 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_INT_PFAULT_INIT
,
1094 irq
->u
.ext
.ext_params
,
1095 irq
->u
.ext
.ext_params2
);
1097 li
->irq
.ext
= irq
->u
.ext
;
1098 set_bit(IRQ_PEND_PFAULT_INIT
, &li
->pending_irqs
);
1099 atomic_or(CPUSTAT_EXT_INT
, li
->cpuflags
);
1103 static int __inject_extcall(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1105 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1106 struct kvm_s390_extcall_info
*extcall
= &li
->irq
.extcall
;
1107 uint16_t src_id
= irq
->u
.extcall
.code
;
1109 VCPU_EVENT(vcpu
, 4, "inject: external call source-cpu:%u",
1111 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_INT_EXTERNAL_CALL
,
1114 /* sending vcpu invalid */
1115 if (kvm_get_vcpu_by_id(vcpu
->kvm
, src_id
) == NULL
)
1118 if (sclp
.has_sigpif
)
1119 return sca_inject_ext_call(vcpu
, src_id
);
1121 if (test_and_set_bit(IRQ_PEND_EXT_EXTERNAL
, &li
->pending_irqs
))
1123 *extcall
= irq
->u
.extcall
;
1124 atomic_or(CPUSTAT_EXT_INT
, li
->cpuflags
);
1128 static int __inject_set_prefix(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1130 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1131 struct kvm_s390_prefix_info
*prefix
= &li
->irq
.prefix
;
1133 VCPU_EVENT(vcpu
, 3, "inject: set prefix to %x",
1134 irq
->u
.prefix
.address
);
1135 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_SIGP_SET_PREFIX
,
1136 irq
->u
.prefix
.address
, 0);
1138 if (!is_vcpu_stopped(vcpu
))
1141 *prefix
= irq
->u
.prefix
;
1142 set_bit(IRQ_PEND_SET_PREFIX
, &li
->pending_irqs
);
1146 #define KVM_S390_STOP_SUPP_FLAGS (KVM_S390_STOP_FLAG_STORE_STATUS)
1147 static int __inject_sigp_stop(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1149 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1150 struct kvm_s390_stop_info
*stop
= &li
->irq
.stop
;
1153 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_SIGP_STOP
, 0, 0);
1155 if (irq
->u
.stop
.flags
& ~KVM_S390_STOP_SUPP_FLAGS
)
1158 if (is_vcpu_stopped(vcpu
)) {
1159 if (irq
->u
.stop
.flags
& KVM_S390_STOP_FLAG_STORE_STATUS
)
1160 rc
= kvm_s390_store_status_unloaded(vcpu
,
1161 KVM_S390_STORE_STATUS_NOADDR
);
1165 if (test_and_set_bit(IRQ_PEND_SIGP_STOP
, &li
->pending_irqs
))
1167 stop
->flags
= irq
->u
.stop
.flags
;
1168 __set_cpuflag(vcpu
, CPUSTAT_STOP_INT
);
1172 static int __inject_sigp_restart(struct kvm_vcpu
*vcpu
,
1173 struct kvm_s390_irq
*irq
)
1175 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1177 VCPU_EVENT(vcpu
, 3, "%s", "inject: restart int");
1178 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_RESTART
, 0, 0);
1180 set_bit(IRQ_PEND_RESTART
, &li
->pending_irqs
);
1184 static int __inject_sigp_emergency(struct kvm_vcpu
*vcpu
,
1185 struct kvm_s390_irq
*irq
)
1187 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1189 VCPU_EVENT(vcpu
, 4, "inject: emergency from cpu %u",
1191 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_INT_EMERGENCY
,
1192 irq
->u
.emerg
.code
, 0);
1194 /* sending vcpu invalid */
1195 if (kvm_get_vcpu_by_id(vcpu
->kvm
, irq
->u
.emerg
.code
) == NULL
)
1198 set_bit(irq
->u
.emerg
.code
, li
->sigp_emerg_pending
);
1199 set_bit(IRQ_PEND_EXT_EMERGENCY
, &li
->pending_irqs
);
1200 atomic_or(CPUSTAT_EXT_INT
, li
->cpuflags
);
1204 static int __inject_mchk(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1206 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1207 struct kvm_s390_mchk_info
*mchk
= &li
->irq
.mchk
;
1209 VCPU_EVENT(vcpu
, 3, "inject: machine check mcic 0x%llx",
1211 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_MCHK
, 0,
1215 * Because repressible machine checks can be indicated along with
1216 * exigent machine checks (PoP, Chapter 11, Interruption action)
1217 * we need to combine cr14, mcic and external damage code.
1218 * Failing storage address and the logout area should not be or'ed
1219 * together, we just indicate the last occurrence of the corresponding
1222 mchk
->cr14
|= irq
->u
.mchk
.cr14
;
1223 mchk
->mcic
|= irq
->u
.mchk
.mcic
;
1224 mchk
->ext_damage_code
|= irq
->u
.mchk
.ext_damage_code
;
1225 mchk
->failing_storage_address
= irq
->u
.mchk
.failing_storage_address
;
1226 memcpy(&mchk
->fixed_logout
, &irq
->u
.mchk
.fixed_logout
,
1227 sizeof(mchk
->fixed_logout
));
1228 if (mchk
->mcic
& MCHK_EX_MASK
)
1229 set_bit(IRQ_PEND_MCHK_EX
, &li
->pending_irqs
);
1230 else if (mchk
->mcic
& MCHK_REP_MASK
)
1231 set_bit(IRQ_PEND_MCHK_REP
, &li
->pending_irqs
);
1235 static int __inject_ckc(struct kvm_vcpu
*vcpu
)
1237 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1239 VCPU_EVENT(vcpu
, 3, "%s", "inject: clock comparator external");
1240 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_INT_CLOCK_COMP
,
1243 set_bit(IRQ_PEND_EXT_CLOCK_COMP
, &li
->pending_irqs
);
1244 atomic_or(CPUSTAT_EXT_INT
, li
->cpuflags
);
1248 static int __inject_cpu_timer(struct kvm_vcpu
*vcpu
)
1250 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1252 VCPU_EVENT(vcpu
, 3, "%s", "inject: cpu timer external");
1253 trace_kvm_s390_inject_vcpu(vcpu
->vcpu_id
, KVM_S390_INT_CPU_TIMER
,
1256 set_bit(IRQ_PEND_EXT_CPU_TIMER
, &li
->pending_irqs
);
1257 atomic_or(CPUSTAT_EXT_INT
, li
->cpuflags
);
1261 static struct kvm_s390_interrupt_info
*get_io_int(struct kvm
*kvm
,
1264 struct kvm_s390_float_interrupt
*fi
= &kvm
->arch
.float_int
;
1265 struct list_head
*isc_list
= &fi
->lists
[FIRQ_LIST_IO_ISC_0
+ isc
];
1266 struct kvm_s390_interrupt_info
*iter
;
1267 u16 id
= (schid
& 0xffff0000U
) >> 16;
1268 u16 nr
= schid
& 0x0000ffffU
;
1270 spin_lock(&fi
->lock
);
1271 list_for_each_entry(iter
, isc_list
, list
) {
1272 if (schid
&& (id
!= iter
->io
.subchannel_id
||
1273 nr
!= iter
->io
.subchannel_nr
))
1275 /* found an appropriate entry */
1276 list_del_init(&iter
->list
);
1277 fi
->counters
[FIRQ_CNTR_IO
] -= 1;
1278 if (list_empty(isc_list
))
1279 clear_bit(IRQ_PEND_IO_ISC_0
+ isc
, &fi
->pending_irqs
);
1280 spin_unlock(&fi
->lock
);
1283 spin_unlock(&fi
->lock
);
1288 * Dequeue and return an I/O interrupt matching any of the interruption
1289 * subclasses as designated by the isc mask in cr6 and the schid (if != 0).
1291 struct kvm_s390_interrupt_info
*kvm_s390_get_io_int(struct kvm
*kvm
,
1292 u64 isc_mask
, u32 schid
)
1294 struct kvm_s390_interrupt_info
*inti
= NULL
;
1297 for (isc
= 0; isc
<= MAX_ISC
&& !inti
; isc
++) {
1298 if (isc_mask
& isc_to_isc_bits(isc
))
1299 inti
= get_io_int(kvm
, isc
, schid
);
1304 #define SCCB_MASK 0xFFFFFFF8
1305 #define SCCB_EVENT_PENDING 0x3
1307 static int __inject_service(struct kvm
*kvm
,
1308 struct kvm_s390_interrupt_info
*inti
)
1310 struct kvm_s390_float_interrupt
*fi
= &kvm
->arch
.float_int
;
1312 spin_lock(&fi
->lock
);
1313 fi
->srv_signal
.ext_params
|= inti
->ext
.ext_params
& SCCB_EVENT_PENDING
;
1315 * Early versions of the QEMU s390 bios will inject several
1316 * service interrupts after another without handling a
1317 * condition code indicating busy.
1318 * We will silently ignore those superfluous sccb values.
1319 * A future version of QEMU will take care of serialization
1322 if (fi
->srv_signal
.ext_params
& SCCB_MASK
)
1324 fi
->srv_signal
.ext_params
|= inti
->ext
.ext_params
& SCCB_MASK
;
1325 set_bit(IRQ_PEND_EXT_SERVICE
, &fi
->pending_irqs
);
1327 spin_unlock(&fi
->lock
);
1332 static int __inject_virtio(struct kvm
*kvm
,
1333 struct kvm_s390_interrupt_info
*inti
)
1335 struct kvm_s390_float_interrupt
*fi
= &kvm
->arch
.float_int
;
1337 spin_lock(&fi
->lock
);
1338 if (fi
->counters
[FIRQ_CNTR_VIRTIO
] >= KVM_S390_MAX_VIRTIO_IRQS
) {
1339 spin_unlock(&fi
->lock
);
1342 fi
->counters
[FIRQ_CNTR_VIRTIO
] += 1;
1343 list_add_tail(&inti
->list
, &fi
->lists
[FIRQ_LIST_VIRTIO
]);
1344 set_bit(IRQ_PEND_VIRTIO
, &fi
->pending_irqs
);
1345 spin_unlock(&fi
->lock
);
1349 static int __inject_pfault_done(struct kvm
*kvm
,
1350 struct kvm_s390_interrupt_info
*inti
)
1352 struct kvm_s390_float_interrupt
*fi
= &kvm
->arch
.float_int
;
1354 spin_lock(&fi
->lock
);
1355 if (fi
->counters
[FIRQ_CNTR_PFAULT
] >=
1356 (ASYNC_PF_PER_VCPU
* KVM_MAX_VCPUS
)) {
1357 spin_unlock(&fi
->lock
);
1360 fi
->counters
[FIRQ_CNTR_PFAULT
] += 1;
1361 list_add_tail(&inti
->list
, &fi
->lists
[FIRQ_LIST_PFAULT
]);
1362 set_bit(IRQ_PEND_PFAULT_DONE
, &fi
->pending_irqs
);
1363 spin_unlock(&fi
->lock
);
1367 #define CR_PENDING_SUBCLASS 28
1368 static int __inject_float_mchk(struct kvm
*kvm
,
1369 struct kvm_s390_interrupt_info
*inti
)
1371 struct kvm_s390_float_interrupt
*fi
= &kvm
->arch
.float_int
;
1373 spin_lock(&fi
->lock
);
1374 fi
->mchk
.cr14
|= inti
->mchk
.cr14
& (1UL << CR_PENDING_SUBCLASS
);
1375 fi
->mchk
.mcic
|= inti
->mchk
.mcic
;
1376 set_bit(IRQ_PEND_MCHK_REP
, &fi
->pending_irqs
);
1377 spin_unlock(&fi
->lock
);
1382 static int __inject_io(struct kvm
*kvm
, struct kvm_s390_interrupt_info
*inti
)
1384 struct kvm_s390_float_interrupt
*fi
;
1385 struct list_head
*list
;
1388 fi
= &kvm
->arch
.float_int
;
1389 spin_lock(&fi
->lock
);
1390 if (fi
->counters
[FIRQ_CNTR_IO
] >= KVM_S390_MAX_FLOAT_IRQS
) {
1391 spin_unlock(&fi
->lock
);
1394 fi
->counters
[FIRQ_CNTR_IO
] += 1;
1396 isc
= int_word_to_isc(inti
->io
.io_int_word
);
1397 list
= &fi
->lists
[FIRQ_LIST_IO_ISC_0
+ isc
];
1398 list_add_tail(&inti
->list
, list
);
1399 set_bit(IRQ_PEND_IO_ISC_0
+ isc
, &fi
->pending_irqs
);
1400 spin_unlock(&fi
->lock
);
1405 * Find a destination VCPU for a floating irq and kick it.
1407 static void __floating_irq_kick(struct kvm
*kvm
, u64 type
)
1409 struct kvm_s390_float_interrupt
*fi
= &kvm
->arch
.float_int
;
1410 struct kvm_s390_local_interrupt
*li
;
1411 struct kvm_vcpu
*dst_vcpu
;
1412 int sigcpu
, online_vcpus
, nr_tries
= 0;
1414 online_vcpus
= atomic_read(&kvm
->online_vcpus
);
1418 /* find idle VCPUs first, then round robin */
1419 sigcpu
= find_first_bit(fi
->idle_mask
, online_vcpus
);
1420 if (sigcpu
== online_vcpus
) {
1422 sigcpu
= fi
->next_rr_cpu
;
1423 fi
->next_rr_cpu
= (fi
->next_rr_cpu
+ 1) % online_vcpus
;
1424 /* avoid endless loops if all vcpus are stopped */
1425 if (nr_tries
++ >= online_vcpus
)
1427 } while (is_vcpu_stopped(kvm_get_vcpu(kvm
, sigcpu
)));
1429 dst_vcpu
= kvm_get_vcpu(kvm
, sigcpu
);
1431 /* make the VCPU drop out of the SIE, or wake it up if sleeping */
1432 li
= &dst_vcpu
->arch
.local_int
;
1433 spin_lock(&li
->lock
);
1436 atomic_or(CPUSTAT_STOP_INT
, li
->cpuflags
);
1438 case KVM_S390_INT_IO_MIN
...KVM_S390_INT_IO_MAX
:
1439 atomic_or(CPUSTAT_IO_INT
, li
->cpuflags
);
1442 atomic_or(CPUSTAT_EXT_INT
, li
->cpuflags
);
1445 spin_unlock(&li
->lock
);
1446 kvm_s390_vcpu_wakeup(dst_vcpu
);
1449 static int __inject_vm(struct kvm
*kvm
, struct kvm_s390_interrupt_info
*inti
)
1451 u64 type
= READ_ONCE(inti
->type
);
1456 rc
= __inject_float_mchk(kvm
, inti
);
1458 case KVM_S390_INT_VIRTIO
:
1459 rc
= __inject_virtio(kvm
, inti
);
1461 case KVM_S390_INT_SERVICE
:
1462 rc
= __inject_service(kvm
, inti
);
1464 case KVM_S390_INT_PFAULT_DONE
:
1465 rc
= __inject_pfault_done(kvm
, inti
);
1467 case KVM_S390_INT_IO_MIN
...KVM_S390_INT_IO_MAX
:
1468 rc
= __inject_io(kvm
, inti
);
1476 __floating_irq_kick(kvm
, type
);
1480 int kvm_s390_inject_vm(struct kvm
*kvm
,
1481 struct kvm_s390_interrupt
*s390int
)
1483 struct kvm_s390_interrupt_info
*inti
;
1486 inti
= kzalloc(sizeof(*inti
), GFP_KERNEL
);
1490 inti
->type
= s390int
->type
;
1491 switch (inti
->type
) {
1492 case KVM_S390_INT_VIRTIO
:
1493 VM_EVENT(kvm
, 5, "inject: virtio parm:%x,parm64:%llx",
1494 s390int
->parm
, s390int
->parm64
);
1495 inti
->ext
.ext_params
= s390int
->parm
;
1496 inti
->ext
.ext_params2
= s390int
->parm64
;
1498 case KVM_S390_INT_SERVICE
:
1499 VM_EVENT(kvm
, 4, "inject: sclp parm:%x", s390int
->parm
);
1500 inti
->ext
.ext_params
= s390int
->parm
;
1502 case KVM_S390_INT_PFAULT_DONE
:
1503 inti
->ext
.ext_params2
= s390int
->parm64
;
1506 VM_EVENT(kvm
, 3, "inject: machine check mcic 0x%llx",
1508 inti
->mchk
.cr14
= s390int
->parm
; /* upper bits are not used */
1509 inti
->mchk
.mcic
= s390int
->parm64
;
1511 case KVM_S390_INT_IO_MIN
...KVM_S390_INT_IO_MAX
:
1512 if (inti
->type
& KVM_S390_INT_IO_AI_MASK
)
1513 VM_EVENT(kvm
, 5, "%s", "inject: I/O (AI)");
1515 VM_EVENT(kvm
, 5, "inject: I/O css %x ss %x schid %04x",
1516 s390int
->type
& IOINT_CSSID_MASK
,
1517 s390int
->type
& IOINT_SSID_MASK
,
1518 s390int
->type
& IOINT_SCHID_MASK
);
1519 inti
->io
.subchannel_id
= s390int
->parm
>> 16;
1520 inti
->io
.subchannel_nr
= s390int
->parm
& 0x0000ffffu
;
1521 inti
->io
.io_int_parm
= s390int
->parm64
>> 32;
1522 inti
->io
.io_int_word
= s390int
->parm64
& 0x00000000ffffffffull
;
1528 trace_kvm_s390_inject_vm(s390int
->type
, s390int
->parm
, s390int
->parm64
,
1531 rc
= __inject_vm(kvm
, inti
);
1537 int kvm_s390_reinject_io_int(struct kvm
*kvm
,
1538 struct kvm_s390_interrupt_info
*inti
)
1540 return __inject_vm(kvm
, inti
);
1543 int s390int_to_s390irq(struct kvm_s390_interrupt
*s390int
,
1544 struct kvm_s390_irq
*irq
)
1546 irq
->type
= s390int
->type
;
1547 switch (irq
->type
) {
1548 case KVM_S390_PROGRAM_INT
:
1549 if (s390int
->parm
& 0xffff0000)
1551 irq
->u
.pgm
.code
= s390int
->parm
;
1553 case KVM_S390_SIGP_SET_PREFIX
:
1554 irq
->u
.prefix
.address
= s390int
->parm
;
1556 case KVM_S390_SIGP_STOP
:
1557 irq
->u
.stop
.flags
= s390int
->parm
;
1559 case KVM_S390_INT_EXTERNAL_CALL
:
1560 if (s390int
->parm
& 0xffff0000)
1562 irq
->u
.extcall
.code
= s390int
->parm
;
1564 case KVM_S390_INT_EMERGENCY
:
1565 if (s390int
->parm
& 0xffff0000)
1567 irq
->u
.emerg
.code
= s390int
->parm
;
1570 irq
->u
.mchk
.mcic
= s390int
->parm64
;
1576 int kvm_s390_is_stop_irq_pending(struct kvm_vcpu
*vcpu
)
1578 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1580 return test_bit(IRQ_PEND_SIGP_STOP
, &li
->pending_irqs
);
1583 void kvm_s390_clear_stop_irq(struct kvm_vcpu
*vcpu
)
1585 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1587 spin_lock(&li
->lock
);
1588 li
->irq
.stop
.flags
= 0;
1589 clear_bit(IRQ_PEND_SIGP_STOP
, &li
->pending_irqs
);
1590 spin_unlock(&li
->lock
);
1593 static int do_inject_vcpu(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1597 switch (irq
->type
) {
1598 case KVM_S390_PROGRAM_INT
:
1599 rc
= __inject_prog(vcpu
, irq
);
1601 case KVM_S390_SIGP_SET_PREFIX
:
1602 rc
= __inject_set_prefix(vcpu
, irq
);
1604 case KVM_S390_SIGP_STOP
:
1605 rc
= __inject_sigp_stop(vcpu
, irq
);
1607 case KVM_S390_RESTART
:
1608 rc
= __inject_sigp_restart(vcpu
, irq
);
1610 case KVM_S390_INT_CLOCK_COMP
:
1611 rc
= __inject_ckc(vcpu
);
1613 case KVM_S390_INT_CPU_TIMER
:
1614 rc
= __inject_cpu_timer(vcpu
);
1616 case KVM_S390_INT_EXTERNAL_CALL
:
1617 rc
= __inject_extcall(vcpu
, irq
);
1619 case KVM_S390_INT_EMERGENCY
:
1620 rc
= __inject_sigp_emergency(vcpu
, irq
);
1623 rc
= __inject_mchk(vcpu
, irq
);
1625 case KVM_S390_INT_PFAULT_INIT
:
1626 rc
= __inject_pfault_init(vcpu
, irq
);
1628 case KVM_S390_INT_VIRTIO
:
1629 case KVM_S390_INT_SERVICE
:
1630 case KVM_S390_INT_IO_MIN
...KVM_S390_INT_IO_MAX
:
1638 int kvm_s390_inject_vcpu(struct kvm_vcpu
*vcpu
, struct kvm_s390_irq
*irq
)
1640 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
1643 spin_lock(&li
->lock
);
1644 rc
= do_inject_vcpu(vcpu
, irq
);
1645 spin_unlock(&li
->lock
);
1647 kvm_s390_vcpu_wakeup(vcpu
);
1651 static inline void clear_irq_list(struct list_head
*_list
)
1653 struct kvm_s390_interrupt_info
*inti
, *n
;
1655 list_for_each_entry_safe(inti
, n
, _list
, list
) {
1656 list_del(&inti
->list
);
1661 static void inti_to_irq(struct kvm_s390_interrupt_info
*inti
,
1662 struct kvm_s390_irq
*irq
)
1664 irq
->type
= inti
->type
;
1665 switch (inti
->type
) {
1666 case KVM_S390_INT_PFAULT_INIT
:
1667 case KVM_S390_INT_PFAULT_DONE
:
1668 case KVM_S390_INT_VIRTIO
:
1669 irq
->u
.ext
= inti
->ext
;
1671 case KVM_S390_INT_IO_MIN
...KVM_S390_INT_IO_MAX
:
1672 irq
->u
.io
= inti
->io
;
1677 void kvm_s390_clear_float_irqs(struct kvm
*kvm
)
1679 struct kvm_s390_float_interrupt
*fi
= &kvm
->arch
.float_int
;
1682 spin_lock(&fi
->lock
);
1683 fi
->pending_irqs
= 0;
1684 memset(&fi
->srv_signal
, 0, sizeof(fi
->srv_signal
));
1685 memset(&fi
->mchk
, 0, sizeof(fi
->mchk
));
1686 for (i
= 0; i
< FIRQ_LIST_COUNT
; i
++)
1687 clear_irq_list(&fi
->lists
[i
]);
1688 for (i
= 0; i
< FIRQ_MAX_COUNT
; i
++)
1689 fi
->counters
[i
] = 0;
1690 spin_unlock(&fi
->lock
);
1693 static int get_all_floating_irqs(struct kvm
*kvm
, u8 __user
*usrbuf
, u64 len
)
1695 struct kvm_s390_interrupt_info
*inti
;
1696 struct kvm_s390_float_interrupt
*fi
;
1697 struct kvm_s390_irq
*buf
;
1698 struct kvm_s390_irq
*irq
;
1704 if (len
> KVM_S390_FLIC_MAX_BUFFER
|| len
== 0)
1708 * We are already using -ENOMEM to signal
1709 * userspace it may retry with a bigger buffer,
1710 * so we need to use something else for this case
1716 max_irqs
= len
/ sizeof(struct kvm_s390_irq
);
1718 fi
= &kvm
->arch
.float_int
;
1719 spin_lock(&fi
->lock
);
1720 for (i
= 0; i
< FIRQ_LIST_COUNT
; i
++) {
1721 list_for_each_entry(inti
, &fi
->lists
[i
], list
) {
1722 if (n
== max_irqs
) {
1723 /* signal userspace to try again */
1727 inti_to_irq(inti
, &buf
[n
]);
1731 if (test_bit(IRQ_PEND_EXT_SERVICE
, &fi
->pending_irqs
)) {
1732 if (n
== max_irqs
) {
1733 /* signal userspace to try again */
1737 irq
= (struct kvm_s390_irq
*) &buf
[n
];
1738 irq
->type
= KVM_S390_INT_SERVICE
;
1739 irq
->u
.ext
= fi
->srv_signal
;
1742 if (test_bit(IRQ_PEND_MCHK_REP
, &fi
->pending_irqs
)) {
1743 if (n
== max_irqs
) {
1744 /* signal userspace to try again */
1748 irq
= (struct kvm_s390_irq
*) &buf
[n
];
1749 irq
->type
= KVM_S390_MCHK
;
1750 irq
->u
.mchk
= fi
->mchk
;
1755 spin_unlock(&fi
->lock
);
1756 if (!ret
&& n
> 0) {
1757 if (copy_to_user(usrbuf
, buf
, sizeof(struct kvm_s390_irq
) * n
))
1762 return ret
< 0 ? ret
: n
;
1765 static int flic_get_attr(struct kvm_device
*dev
, struct kvm_device_attr
*attr
)
1769 switch (attr
->group
) {
1770 case KVM_DEV_FLIC_GET_ALL_IRQS
:
1771 r
= get_all_floating_irqs(dev
->kvm
, (u8 __user
*) attr
->addr
,
1781 static inline int copy_irq_from_user(struct kvm_s390_interrupt_info
*inti
,
1784 struct kvm_s390_irq __user
*uptr
= (struct kvm_s390_irq __user
*) addr
;
1785 void *target
= NULL
;
1786 void __user
*source
;
1789 if (get_user(inti
->type
, (u64 __user
*)addr
))
1792 switch (inti
->type
) {
1793 case KVM_S390_INT_PFAULT_INIT
:
1794 case KVM_S390_INT_PFAULT_DONE
:
1795 case KVM_S390_INT_VIRTIO
:
1796 case KVM_S390_INT_SERVICE
:
1797 target
= (void *) &inti
->ext
;
1798 source
= &uptr
->u
.ext
;
1799 size
= sizeof(inti
->ext
);
1801 case KVM_S390_INT_IO_MIN
...KVM_S390_INT_IO_MAX
:
1802 target
= (void *) &inti
->io
;
1803 source
= &uptr
->u
.io
;
1804 size
= sizeof(inti
->io
);
1807 target
= (void *) &inti
->mchk
;
1808 source
= &uptr
->u
.mchk
;
1809 size
= sizeof(inti
->mchk
);
1815 if (copy_from_user(target
, source
, size
))
1821 static int enqueue_floating_irq(struct kvm_device
*dev
,
1822 struct kvm_device_attr
*attr
)
1824 struct kvm_s390_interrupt_info
*inti
= NULL
;
1826 int len
= attr
->attr
;
1828 if (len
% sizeof(struct kvm_s390_irq
) != 0)
1830 else if (len
> KVM_S390_FLIC_MAX_BUFFER
)
1833 while (len
>= sizeof(struct kvm_s390_irq
)) {
1834 inti
= kzalloc(sizeof(*inti
), GFP_KERNEL
);
1838 r
= copy_irq_from_user(inti
, attr
->addr
);
1843 r
= __inject_vm(dev
->kvm
, inti
);
1848 len
-= sizeof(struct kvm_s390_irq
);
1849 attr
->addr
+= sizeof(struct kvm_s390_irq
);
1855 static struct s390_io_adapter
*get_io_adapter(struct kvm
*kvm
, unsigned int id
)
1857 if (id
>= MAX_S390_IO_ADAPTERS
)
1859 return kvm
->arch
.adapters
[id
];
1862 static int register_io_adapter(struct kvm_device
*dev
,
1863 struct kvm_device_attr
*attr
)
1865 struct s390_io_adapter
*adapter
;
1866 struct kvm_s390_io_adapter adapter_info
;
1868 if (copy_from_user(&adapter_info
,
1869 (void __user
*)attr
->addr
, sizeof(adapter_info
)))
1872 if ((adapter_info
.id
>= MAX_S390_IO_ADAPTERS
) ||
1873 (dev
->kvm
->arch
.adapters
[adapter_info
.id
] != NULL
))
1876 adapter
= kzalloc(sizeof(*adapter
), GFP_KERNEL
);
1880 INIT_LIST_HEAD(&adapter
->maps
);
1881 init_rwsem(&adapter
->maps_lock
);
1882 atomic_set(&adapter
->nr_maps
, 0);
1883 adapter
->id
= adapter_info
.id
;
1884 adapter
->isc
= adapter_info
.isc
;
1885 adapter
->maskable
= adapter_info
.maskable
;
1886 adapter
->masked
= false;
1887 adapter
->swap
= adapter_info
.swap
;
1888 dev
->kvm
->arch
.adapters
[adapter
->id
] = adapter
;
1893 int kvm_s390_mask_adapter(struct kvm
*kvm
, unsigned int id
, bool masked
)
1896 struct s390_io_adapter
*adapter
= get_io_adapter(kvm
, id
);
1898 if (!adapter
|| !adapter
->maskable
)
1900 ret
= adapter
->masked
;
1901 adapter
->masked
= masked
;
1905 static int kvm_s390_adapter_map(struct kvm
*kvm
, unsigned int id
, __u64 addr
)
1907 struct s390_io_adapter
*adapter
= get_io_adapter(kvm
, id
);
1908 struct s390_map_info
*map
;
1911 if (!adapter
|| !addr
)
1914 map
= kzalloc(sizeof(*map
), GFP_KERNEL
);
1919 INIT_LIST_HEAD(&map
->list
);
1920 map
->guest_addr
= addr
;
1921 map
->addr
= gmap_translate(kvm
->arch
.gmap
, addr
);
1922 if (map
->addr
== -EFAULT
) {
1926 ret
= get_user_pages_fast(map
->addr
, 1, 1, &map
->page
);
1930 down_write(&adapter
->maps_lock
);
1931 if (atomic_inc_return(&adapter
->nr_maps
) < MAX_S390_ADAPTER_MAPS
) {
1932 list_add_tail(&map
->list
, &adapter
->maps
);
1935 put_page(map
->page
);
1938 up_write(&adapter
->maps_lock
);
1945 static int kvm_s390_adapter_unmap(struct kvm
*kvm
, unsigned int id
, __u64 addr
)
1947 struct s390_io_adapter
*adapter
= get_io_adapter(kvm
, id
);
1948 struct s390_map_info
*map
, *tmp
;
1951 if (!adapter
|| !addr
)
1954 down_write(&adapter
->maps_lock
);
1955 list_for_each_entry_safe(map
, tmp
, &adapter
->maps
, list
) {
1956 if (map
->guest_addr
== addr
) {
1958 atomic_dec(&adapter
->nr_maps
);
1959 list_del(&map
->list
);
1960 put_page(map
->page
);
1965 up_write(&adapter
->maps_lock
);
1967 return found
? 0 : -EINVAL
;
1970 void kvm_s390_destroy_adapters(struct kvm
*kvm
)
1973 struct s390_map_info
*map
, *tmp
;
1975 for (i
= 0; i
< MAX_S390_IO_ADAPTERS
; i
++) {
1976 if (!kvm
->arch
.adapters
[i
])
1978 list_for_each_entry_safe(map
, tmp
,
1979 &kvm
->arch
.adapters
[i
]->maps
, list
) {
1980 list_del(&map
->list
);
1981 put_page(map
->page
);
1984 kfree(kvm
->arch
.adapters
[i
]);
1988 static int modify_io_adapter(struct kvm_device
*dev
,
1989 struct kvm_device_attr
*attr
)
1991 struct kvm_s390_io_adapter_req req
;
1992 struct s390_io_adapter
*adapter
;
1995 if (copy_from_user(&req
, (void __user
*)attr
->addr
, sizeof(req
)))
1998 adapter
= get_io_adapter(dev
->kvm
, req
.id
);
2002 case KVM_S390_IO_ADAPTER_MASK
:
2003 ret
= kvm_s390_mask_adapter(dev
->kvm
, req
.id
, req
.mask
);
2007 case KVM_S390_IO_ADAPTER_MAP
:
2008 ret
= kvm_s390_adapter_map(dev
->kvm
, req
.id
, req
.addr
);
2010 case KVM_S390_IO_ADAPTER_UNMAP
:
2011 ret
= kvm_s390_adapter_unmap(dev
->kvm
, req
.id
, req
.addr
);
2020 static int flic_set_attr(struct kvm_device
*dev
, struct kvm_device_attr
*attr
)
2024 struct kvm_vcpu
*vcpu
;
2026 switch (attr
->group
) {
2027 case KVM_DEV_FLIC_ENQUEUE
:
2028 r
= enqueue_floating_irq(dev
, attr
);
2030 case KVM_DEV_FLIC_CLEAR_IRQS
:
2031 kvm_s390_clear_float_irqs(dev
->kvm
);
2033 case KVM_DEV_FLIC_APF_ENABLE
:
2034 dev
->kvm
->arch
.gmap
->pfault_enabled
= 1;
2036 case KVM_DEV_FLIC_APF_DISABLE_WAIT
:
2037 dev
->kvm
->arch
.gmap
->pfault_enabled
= 0;
2039 * Make sure no async faults are in transition when
2040 * clearing the queues. So we don't need to worry
2041 * about late coming workers.
2043 synchronize_srcu(&dev
->kvm
->srcu
);
2044 kvm_for_each_vcpu(i
, vcpu
, dev
->kvm
)
2045 kvm_clear_async_pf_completion_queue(vcpu
);
2047 case KVM_DEV_FLIC_ADAPTER_REGISTER
:
2048 r
= register_io_adapter(dev
, attr
);
2050 case KVM_DEV_FLIC_ADAPTER_MODIFY
:
2051 r
= modify_io_adapter(dev
, attr
);
2060 static int flic_create(struct kvm_device
*dev
, u32 type
)
2064 if (dev
->kvm
->arch
.flic
)
2066 dev
->kvm
->arch
.flic
= dev
;
2070 static void flic_destroy(struct kvm_device
*dev
)
2072 dev
->kvm
->arch
.flic
= NULL
;
2076 /* s390 floating irq controller (flic) */
2077 struct kvm_device_ops kvm_flic_ops
= {
2079 .get_attr
= flic_get_attr
,
2080 .set_attr
= flic_set_attr
,
2081 .create
= flic_create
,
2082 .destroy
= flic_destroy
,
2085 static unsigned long get_ind_bit(__u64 addr
, unsigned long bit_nr
, bool swap
)
2089 bit
= bit_nr
+ (addr
% PAGE_SIZE
) * 8;
2091 return swap
? (bit
^ (BITS_PER_LONG
- 1)) : bit
;
2094 static struct s390_map_info
*get_map_info(struct s390_io_adapter
*adapter
,
2097 struct s390_map_info
*map
;
2102 list_for_each_entry(map
, &adapter
->maps
, list
) {
2103 if (map
->guest_addr
== addr
)
2109 static int adapter_indicators_set(struct kvm
*kvm
,
2110 struct s390_io_adapter
*adapter
,
2111 struct kvm_s390_adapter_int
*adapter_int
)
2114 int summary_set
, idx
;
2115 struct s390_map_info
*info
;
2118 info
= get_map_info(adapter
, adapter_int
->ind_addr
);
2121 map
= page_address(info
->page
);
2122 bit
= get_ind_bit(info
->addr
, adapter_int
->ind_offset
, adapter
->swap
);
2124 idx
= srcu_read_lock(&kvm
->srcu
);
2125 mark_page_dirty(kvm
, info
->guest_addr
>> PAGE_SHIFT
);
2126 set_page_dirty_lock(info
->page
);
2127 info
= get_map_info(adapter
, adapter_int
->summary_addr
);
2129 srcu_read_unlock(&kvm
->srcu
, idx
);
2132 map
= page_address(info
->page
);
2133 bit
= get_ind_bit(info
->addr
, adapter_int
->summary_offset
,
2135 summary_set
= test_and_set_bit(bit
, map
);
2136 mark_page_dirty(kvm
, info
->guest_addr
>> PAGE_SHIFT
);
2137 set_page_dirty_lock(info
->page
);
2138 srcu_read_unlock(&kvm
->srcu
, idx
);
2139 return summary_set
? 0 : 1;
2143 * < 0 - not injected due to error
2144 * = 0 - coalesced, summary indicator already active
2145 * > 0 - injected interrupt
2147 static int set_adapter_int(struct kvm_kernel_irq_routing_entry
*e
,
2148 struct kvm
*kvm
, int irq_source_id
, int level
,
2152 struct s390_io_adapter
*adapter
;
2154 /* We're only interested in the 0->1 transition. */
2157 adapter
= get_io_adapter(kvm
, e
->adapter
.adapter_id
);
2160 down_read(&adapter
->maps_lock
);
2161 ret
= adapter_indicators_set(kvm
, adapter
, &e
->adapter
);
2162 up_read(&adapter
->maps_lock
);
2163 if ((ret
> 0) && !adapter
->masked
) {
2164 struct kvm_s390_interrupt s390int
= {
2165 .type
= KVM_S390_INT_IO(1, 0, 0, 0),
2167 .parm64
= (adapter
->isc
<< 27) | 0x80000000,
2169 ret
= kvm_s390_inject_vm(kvm
, &s390int
);
2176 int kvm_set_routing_entry(struct kvm_kernel_irq_routing_entry
*e
,
2177 const struct kvm_irq_routing_entry
*ue
)
2182 case KVM_IRQ_ROUTING_S390_ADAPTER
:
2183 e
->set
= set_adapter_int
;
2184 e
->adapter
.summary_addr
= ue
->u
.adapter
.summary_addr
;
2185 e
->adapter
.ind_addr
= ue
->u
.adapter
.ind_addr
;
2186 e
->adapter
.summary_offset
= ue
->u
.adapter
.summary_offset
;
2187 e
->adapter
.ind_offset
= ue
->u
.adapter
.ind_offset
;
2188 e
->adapter
.adapter_id
= ue
->u
.adapter
.adapter_id
;
2198 int kvm_set_msi(struct kvm_kernel_irq_routing_entry
*e
, struct kvm
*kvm
,
2199 int irq_source_id
, int level
, bool line_status
)
2204 int kvm_s390_set_irq_state(struct kvm_vcpu
*vcpu
, void __user
*irqstate
, int len
)
2206 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
2207 struct kvm_s390_irq
*buf
;
2215 if (copy_from_user((void *) buf
, irqstate
, len
)) {
2221 * Don't allow setting the interrupt state
2222 * when there are already interrupts pending
2224 spin_lock(&li
->lock
);
2225 if (li
->pending_irqs
) {
2230 for (n
= 0; n
< len
/ sizeof(*buf
); n
++) {
2231 r
= do_inject_vcpu(vcpu
, &buf
[n
]);
2237 spin_unlock(&li
->lock
);
2244 static void store_local_irq(struct kvm_s390_local_interrupt
*li
,
2245 struct kvm_s390_irq
*irq
,
2246 unsigned long irq_type
)
2249 case IRQ_PEND_MCHK_EX
:
2250 case IRQ_PEND_MCHK_REP
:
2251 irq
->type
= KVM_S390_MCHK
;
2252 irq
->u
.mchk
= li
->irq
.mchk
;
2255 irq
->type
= KVM_S390_PROGRAM_INT
;
2256 irq
->u
.pgm
= li
->irq
.pgm
;
2258 case IRQ_PEND_PFAULT_INIT
:
2259 irq
->type
= KVM_S390_INT_PFAULT_INIT
;
2260 irq
->u
.ext
= li
->irq
.ext
;
2262 case IRQ_PEND_EXT_EXTERNAL
:
2263 irq
->type
= KVM_S390_INT_EXTERNAL_CALL
;
2264 irq
->u
.extcall
= li
->irq
.extcall
;
2266 case IRQ_PEND_EXT_CLOCK_COMP
:
2267 irq
->type
= KVM_S390_INT_CLOCK_COMP
;
2269 case IRQ_PEND_EXT_CPU_TIMER
:
2270 irq
->type
= KVM_S390_INT_CPU_TIMER
;
2272 case IRQ_PEND_SIGP_STOP
:
2273 irq
->type
= KVM_S390_SIGP_STOP
;
2274 irq
->u
.stop
= li
->irq
.stop
;
2276 case IRQ_PEND_RESTART
:
2277 irq
->type
= KVM_S390_RESTART
;
2279 case IRQ_PEND_SET_PREFIX
:
2280 irq
->type
= KVM_S390_SIGP_SET_PREFIX
;
2281 irq
->u
.prefix
= li
->irq
.prefix
;
2286 int kvm_s390_get_irq_state(struct kvm_vcpu
*vcpu
, __u8 __user
*buf
, int len
)
2289 unsigned long sigp_emerg_pending
[BITS_TO_LONGS(KVM_MAX_VCPUS
)];
2290 struct kvm_s390_local_interrupt
*li
= &vcpu
->arch
.local_int
;
2291 unsigned long pending_irqs
;
2292 struct kvm_s390_irq irq
;
2293 unsigned long irq_type
;
2297 spin_lock(&li
->lock
);
2298 pending_irqs
= li
->pending_irqs
;
2299 memcpy(&sigp_emerg_pending
, &li
->sigp_emerg_pending
,
2300 sizeof(sigp_emerg_pending
));
2301 spin_unlock(&li
->lock
);
2303 for_each_set_bit(irq_type
, &pending_irqs
, IRQ_PEND_COUNT
) {
2304 memset(&irq
, 0, sizeof(irq
));
2305 if (irq_type
== IRQ_PEND_EXT_EMERGENCY
)
2307 if (n
+ sizeof(irq
) > len
)
2309 store_local_irq(&vcpu
->arch
.local_int
, &irq
, irq_type
);
2310 if (copy_to_user(&buf
[n
], &irq
, sizeof(irq
)))
2315 if (test_bit(IRQ_PEND_EXT_EMERGENCY
, &pending_irqs
)) {
2316 for_each_set_bit(cpuaddr
, sigp_emerg_pending
, KVM_MAX_VCPUS
) {
2317 memset(&irq
, 0, sizeof(irq
));
2318 if (n
+ sizeof(irq
) > len
)
2320 irq
.type
= KVM_S390_INT_EMERGENCY
;
2321 irq
.u
.emerg
.code
= cpuaddr
;
2322 if (copy_to_user(&buf
[n
], &irq
, sizeof(irq
)))
2328 if (sca_ext_call_pending(vcpu
, &scn
)) {
2329 if (n
+ sizeof(irq
) > len
)
2331 memset(&irq
, 0, sizeof(irq
));
2332 irq
.type
= KVM_S390_INT_EXTERNAL_CALL
;
2333 irq
.u
.extcall
.code
= scn
;
2334 if (copy_to_user(&buf
[n
], &irq
, sizeof(irq
)))