/*
 * hosting zSeries kernel virtual machines
 *
 * Copyright IBM Corp. 2008, 2009
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License (version 2 only)
 * as published by the Free Software Foundation.
 *
 *    Author(s): Carsten Otte <cotte@de.ibm.com>
 *               Christian Borntraeger <borntraeger@de.ibm.com>
 *               Heiko Carstens <heiko.carstens@de.ibm.com>
 *               Christian Ehrhardt <ehrhardt@de.ibm.com>
 *               Jason J. Herne <jjherne@us.ibm.com>
 */

#include <linux/compiler.h>
#include <linux/err.h>
#include <linux/fs.h>
#include <linux/hrtimer.h>
#include <linux/init.h>
#include <linux/kvm.h>
#include <linux/kvm_host.h>
#include <linux/module.h>
#include <linux/random.h>
#include <linux/slab.h>
#include <linux/timer.h>
#include <linux/vmalloc.h>
#include <asm/asm-offsets.h>
#include <asm/lowcore.h>
#include <asm/pgtable.h>
#include <asm/nmi.h>
#include <asm/switch_to.h>
#include <asm/isc.h>
#include <asm/sclp.h>
#include "kvm-s390.h"
#include "gaccess.h"

#define CREATE_TRACE_POINTS
#include "trace.h"
#include "trace-s390.h"

#define MEM_OP_MAX_SIZE 65536	/* Maximum transfer size for KVM_S390_MEM_OP */
#define LOCAL_IRQS 32
#define VCPU_IRQS_MAX_BUF (sizeof(struct kvm_s390_irq) * \
			   (KVM_MAX_VCPUS + LOCAL_IRQS))

#define VCPU_STAT(x) offsetof(struct kvm_vcpu, stat.x), KVM_STAT_VCPU

struct kvm_stats_debugfs_item debugfs_entries[] = {
	{ "userspace_handled", VCPU_STAT(exit_userspace) },
	{ "exit_null", VCPU_STAT(exit_null) },
	{ "exit_validity", VCPU_STAT(exit_validity) },
	{ "exit_stop_request", VCPU_STAT(exit_stop_request) },
	{ "exit_external_request", VCPU_STAT(exit_external_request) },
	{ "exit_external_interrupt", VCPU_STAT(exit_external_interrupt) },
	{ "exit_instruction", VCPU_STAT(exit_instruction) },
	{ "exit_program_interruption", VCPU_STAT(exit_program_interruption) },
	{ "exit_instr_and_program_int", VCPU_STAT(exit_instr_and_program) },
	{ "halt_successful_poll", VCPU_STAT(halt_successful_poll) },
	{ "halt_wakeup", VCPU_STAT(halt_wakeup) },
	{ "instruction_lctlg", VCPU_STAT(instruction_lctlg) },
	{ "instruction_lctl", VCPU_STAT(instruction_lctl) },
	{ "instruction_stctl", VCPU_STAT(instruction_stctl) },
	{ "instruction_stctg", VCPU_STAT(instruction_stctg) },
	{ "deliver_emergency_signal", VCPU_STAT(deliver_emergency_signal) },
	{ "deliver_external_call", VCPU_STAT(deliver_external_call) },
	{ "deliver_service_signal", VCPU_STAT(deliver_service_signal) },
	{ "deliver_virtio_interrupt", VCPU_STAT(deliver_virtio_interrupt) },
	{ "deliver_stop_signal", VCPU_STAT(deliver_stop_signal) },
	{ "deliver_prefix_signal", VCPU_STAT(deliver_prefix_signal) },
	{ "deliver_restart_signal", VCPU_STAT(deliver_restart_signal) },
	{ "deliver_program_interruption", VCPU_STAT(deliver_program_int) },
	{ "exit_wait_state", VCPU_STAT(exit_wait_state) },
	{ "instruction_pfmf", VCPU_STAT(instruction_pfmf) },
	{ "instruction_stidp", VCPU_STAT(instruction_stidp) },
	{ "instruction_spx", VCPU_STAT(instruction_spx) },
	{ "instruction_stpx", VCPU_STAT(instruction_stpx) },
	{ "instruction_stap", VCPU_STAT(instruction_stap) },
	{ "instruction_storage_key", VCPU_STAT(instruction_storage_key) },
	{ "instruction_ipte_interlock", VCPU_STAT(instruction_ipte_interlock) },
	{ "instruction_stsch", VCPU_STAT(instruction_stsch) },
	{ "instruction_chsc", VCPU_STAT(instruction_chsc) },
	{ "instruction_essa", VCPU_STAT(instruction_essa) },
	{ "instruction_stsi", VCPU_STAT(instruction_stsi) },
	{ "instruction_stfl", VCPU_STAT(instruction_stfl) },
	{ "instruction_tprot", VCPU_STAT(instruction_tprot) },
	{ "instruction_sigp_sense", VCPU_STAT(instruction_sigp_sense) },
	{ "instruction_sigp_sense_running", VCPU_STAT(instruction_sigp_sense_running) },
	{ "instruction_sigp_external_call", VCPU_STAT(instruction_sigp_external_call) },
	{ "instruction_sigp_emergency", VCPU_STAT(instruction_sigp_emergency) },
	{ "instruction_sigp_cond_emergency", VCPU_STAT(instruction_sigp_cond_emergency) },
	{ "instruction_sigp_start", VCPU_STAT(instruction_sigp_start) },
	{ "instruction_sigp_stop", VCPU_STAT(instruction_sigp_stop) },
	{ "instruction_sigp_stop_store_status", VCPU_STAT(instruction_sigp_stop_store_status) },
	{ "instruction_sigp_store_status", VCPU_STAT(instruction_sigp_store_status) },
	{ "instruction_sigp_store_adtl_status", VCPU_STAT(instruction_sigp_store_adtl_status) },
	{ "instruction_sigp_set_arch", VCPU_STAT(instruction_sigp_arch) },
	{ "instruction_sigp_set_prefix", VCPU_STAT(instruction_sigp_prefix) },
	{ "instruction_sigp_restart", VCPU_STAT(instruction_sigp_restart) },
	{ "instruction_sigp_cpu_reset", VCPU_STAT(instruction_sigp_cpu_reset) },
	{ "instruction_sigp_init_cpu_reset", VCPU_STAT(instruction_sigp_init_cpu_reset) },
	{ "instruction_sigp_unknown", VCPU_STAT(instruction_sigp_unknown) },
	{ "diagnose_10", VCPU_STAT(diagnose_10) },
	{ "diagnose_44", VCPU_STAT(diagnose_44) },
	{ "diagnose_9c", VCPU_STAT(diagnose_9c) },
	{ NULL }
};

/* upper facilities limit for kvm */
unsigned long kvm_s390_fac_list_mask[] = {
	0xffe6fffbfcfdfc40UL,
	0x005c800000000000UL,
};

unsigned long kvm_s390_fac_list_mask_size(void)
{
	BUILD_BUG_ON(ARRAY_SIZE(kvm_s390_fac_list_mask) > S390_ARCH_FAC_MASK_SIZE_U64);
	return ARRAY_SIZE(kvm_s390_fac_list_mask);
}

static struct gmap_notifier gmap_notifier;

/* Section: not file related */
int kvm_arch_hardware_enable(void)
{
	/* every s390 is virtualization enabled ;-) */
	return 0;
}

static void kvm_gmap_notifier(struct gmap *gmap, unsigned long address);

int kvm_arch_hardware_setup(void)
{
	gmap_notifier.notifier_call = kvm_gmap_notifier;
	gmap_register_ipte_notifier(&gmap_notifier);
	return 0;
}

void kvm_arch_hardware_unsetup(void)
{
	gmap_unregister_ipte_notifier(&gmap_notifier);
}

int kvm_arch_init(void *opaque)
{
	/* Register floating interrupt controller interface. */
	return kvm_register_device_ops(&kvm_flic_ops, KVM_DEV_TYPE_FLIC);
}

/* Section: device related */
long kvm_arch_dev_ioctl(struct file *filp,
			unsigned int ioctl, unsigned long arg)
{
	if (ioctl == KVM_S390_ENABLE_SIE)
		return s390_enable_sie();
	return -EINVAL;
}

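/*
 * Report which optional KVM capabilities this VM supports. Most s390
 * capabilities are static; a few depend on machine facilities (ESOP for
 * KVM_CAP_S390_COW, the vector facility for vector registers) or return
 * a limit instead of a boolean (KVM_CAP_S390_MEM_OP, KVM_CAP_NR_VCPUS).
 */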
int kvm_vm_ioctl_check_extension(struct kvm *kvm, long ext)
{
	int r;

	switch (ext) {
	case KVM_CAP_S390_PSW:
	case KVM_CAP_S390_GMAP:
	case KVM_CAP_SYNC_MMU:
#ifdef CONFIG_KVM_S390_UCONTROL
	case KVM_CAP_S390_UCONTROL:
#endif
	case KVM_CAP_ASYNC_PF:
	case KVM_CAP_SYNC_REGS:
	case KVM_CAP_ONE_REG:
	case KVM_CAP_ENABLE_CAP:
	case KVM_CAP_S390_CSS_SUPPORT:
	case KVM_CAP_IOEVENTFD:
	case KVM_CAP_DEVICE_CTRL:
	case KVM_CAP_ENABLE_CAP_VM:
	case KVM_CAP_S390_IRQCHIP:
	case KVM_CAP_VM_ATTRIBUTES:
	case KVM_CAP_MP_STATE:
	case KVM_CAP_S390_INJECT_IRQ:
	case KVM_CAP_S390_USER_SIGP:
	case KVM_CAP_S390_USER_STSI:
	case KVM_CAP_S390_SKEYS:
	case KVM_CAP_S390_IRQ_STATE:
		r = 1;
		break;
	case KVM_CAP_S390_MEM_OP:
		r = MEM_OP_MAX_SIZE;
		break;
	case KVM_CAP_NR_VCPUS:
	case KVM_CAP_MAX_VCPUS:
		r = KVM_MAX_VCPUS;
		break;
	case KVM_CAP_NR_MEMSLOTS:
		r = KVM_USER_MEM_SLOTS;
		break;
	case KVM_CAP_S390_COW:
		r = MACHINE_HAS_ESOP;
		break;
	case KVM_CAP_S390_VECTOR_REGISTERS:
		r = MACHINE_HAS_VX;
		break;
	default:
		r = 0;
	}
	return r;
}

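/*
 * Transfer dirty information from the gmap (guest address space) into the
 * memslot's dirty bitmap: walk every page of the slot and mark those whose
 * gmap dirty state was set since the last synchronization.
 */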
static void kvm_s390_sync_dirty_log(struct kvm *kvm,
				    struct kvm_memory_slot *memslot)
{
	gfn_t cur_gfn, last_gfn;
	unsigned long address;
	struct gmap *gmap = kvm->arch.gmap;

	down_read(&gmap->mm->mmap_sem);
	/* Loop over all guest pages; last_gfn is one past the end */
	last_gfn = memslot->base_gfn + memslot->npages;
	for (cur_gfn = memslot->base_gfn; cur_gfn < last_gfn; cur_gfn++) {
		address = gfn_to_hva_memslot(memslot, cur_gfn);

		if (gmap_test_and_clear_dirty(address, gmap))
			mark_page_dirty(kvm, cur_gfn);
	}
	up_read(&gmap->mm->mmap_sem);
}

/* Section: vm related */
/*
 * Get (and clear) the dirty memory log for a memory slot.
 */
int kvm_vm_ioctl_get_dirty_log(struct kvm *kvm,
			       struct kvm_dirty_log *log)
{
	int r;
	unsigned long n;
	struct kvm_memory_slot *memslot;
	int is_dirty = 0;

	mutex_lock(&kvm->slots_lock);

	r = -EINVAL;
	if (log->slot >= KVM_USER_MEM_SLOTS)
		goto out;

	memslot = id_to_memslot(kvm->memslots, log->slot);
	r = -ENOENT;
	if (!memslot->dirty_bitmap)
		goto out;

	kvm_s390_sync_dirty_log(kvm, memslot);
	r = kvm_get_dirty_log(kvm, log, &is_dirty);
	if (r)
		goto out;

	/* Clear the dirty log */
	if (is_dirty) {
		n = kvm_dirty_bitmap_bytes(memslot);
		memset(memslot->dirty_bitmap, 0, n);
	}
	r = 0;
out:
	mutex_unlock(&kvm->slots_lock);
	return r;
}

static int kvm_vm_ioctl_enable_cap(struct kvm *kvm, struct kvm_enable_cap *cap)
{
	int r;

	if (cap->flags)
		return -EINVAL;

	switch (cap->cap) {
	case KVM_CAP_S390_IRQCHIP:
		kvm->arch.use_irqchip = 1;
		r = 0;
		break;
	case KVM_CAP_S390_USER_SIGP:
		kvm->arch.user_sigp = 1;
		r = 0;
		break;
	case KVM_CAP_S390_VECTOR_REGISTERS:
		if (MACHINE_HAS_VX) {
			set_kvm_facility(kvm->arch.model.fac->mask, 129);
			set_kvm_facility(kvm->arch.model.fac->list, 129);
			r = 0;
		} else
			r = -EINVAL;
		break;
	case KVM_CAP_S390_USER_STSI:
		kvm->arch.user_stsi = 1;
		r = 0;
		break;
	default:
		r = -EINVAL;
		break;
	}
	return r;
}

static int kvm_s390_get_mem_control(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret;

	switch (attr->attr) {
	case KVM_S390_VM_MEM_LIMIT_SIZE:
		ret = 0;
		if (put_user(kvm->arch.gmap->asce_end, (u64 __user *)attr->addr))
			ret = -EFAULT;
		break;
	default:
		ret = -ENXIO;
		break;
	}
	return ret;
}

static int kvm_s390_set_mem_control(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret;
	unsigned int idx;
	switch (attr->attr) {
	case KVM_S390_VM_MEM_ENABLE_CMMA:
		ret = -EBUSY;
		mutex_lock(&kvm->lock);
		if (atomic_read(&kvm->online_vcpus) == 0) {
			kvm->arch.use_cmma = 1;
			ret = 0;
		}
		mutex_unlock(&kvm->lock);
		break;
	case KVM_S390_VM_MEM_CLR_CMMA:
		mutex_lock(&kvm->lock);
		idx = srcu_read_lock(&kvm->srcu);
		s390_reset_cmma(kvm->arch.gmap->mm);
		srcu_read_unlock(&kvm->srcu, idx);
		mutex_unlock(&kvm->lock);
		ret = 0;
		break;
	case KVM_S390_VM_MEM_LIMIT_SIZE: {
		unsigned long new_limit;

		if (kvm_is_ucontrol(kvm))
			return -EINVAL;

		if (get_user(new_limit, (u64 __user *)attr->addr))
			return -EFAULT;

		if (new_limit > kvm->arch.gmap->asce_end)
			return -E2BIG;

		ret = -EBUSY;
		mutex_lock(&kvm->lock);
		if (atomic_read(&kvm->online_vcpus) == 0) {
			/* gmap_alloc will round the limit up */
			struct gmap *new = gmap_alloc(current->mm, new_limit);

			if (!new) {
				ret = -ENOMEM;
			} else {
				gmap_free(kvm->arch.gmap);
				new->private = kvm;
				kvm->arch.gmap = new;
				ret = 0;
			}
		}
		mutex_unlock(&kvm->lock);
		break;
	}
	default:
		ret = -ENXIO;
		break;
	}
	return ret;
}

static void kvm_s390_vcpu_crypto_setup(struct kvm_vcpu *vcpu);

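/*
 * Toggle AES/DEA protected-key wrapping for the whole VM. Enabling a
 * wrapping mode generates a fresh random wrapping key mask in the CRYCB;
 * disabling clears it. Every vcpu is kicked out of SIE afterwards so the
 * new crypto control block settings take effect immediately.
 */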
static int kvm_s390_vm_set_crypto(struct kvm *kvm, struct kvm_device_attr *attr)
{
	struct kvm_vcpu *vcpu;
	int i;

	if (!test_kvm_facility(kvm, 76))
		return -EINVAL;

	mutex_lock(&kvm->lock);
	switch (attr->attr) {
	case KVM_S390_VM_CRYPTO_ENABLE_AES_KW:
		get_random_bytes(
			kvm->arch.crypto.crycb->aes_wrapping_key_mask,
			sizeof(kvm->arch.crypto.crycb->aes_wrapping_key_mask));
		kvm->arch.crypto.aes_kw = 1;
		break;
	case KVM_S390_VM_CRYPTO_ENABLE_DEA_KW:
		get_random_bytes(
			kvm->arch.crypto.crycb->dea_wrapping_key_mask,
			sizeof(kvm->arch.crypto.crycb->dea_wrapping_key_mask));
		kvm->arch.crypto.dea_kw = 1;
		break;
	case KVM_S390_VM_CRYPTO_DISABLE_AES_KW:
		kvm->arch.crypto.aes_kw = 0;
		memset(kvm->arch.crypto.crycb->aes_wrapping_key_mask, 0,
			sizeof(kvm->arch.crypto.crycb->aes_wrapping_key_mask));
		break;
	case KVM_S390_VM_CRYPTO_DISABLE_DEA_KW:
		kvm->arch.crypto.dea_kw = 0;
		memset(kvm->arch.crypto.crycb->dea_wrapping_key_mask, 0,
			sizeof(kvm->arch.crypto.crycb->dea_wrapping_key_mask));
		break;
	default:
		mutex_unlock(&kvm->lock);
		return -ENXIO;
	}

	kvm_for_each_vcpu(i, vcpu, kvm) {
		kvm_s390_vcpu_crypto_setup(vcpu);
		exit_sie(vcpu);
	}
	mutex_unlock(&kvm->lock);
	return 0;
}

static int kvm_s390_set_tod_high(struct kvm *kvm, struct kvm_device_attr *attr)
{
	u8 gtod_high;

	if (copy_from_user(&gtod_high, (void __user *)attr->addr,
			   sizeof(gtod_high)))
		return -EFAULT;

	if (gtod_high != 0)
		return -EINVAL;

	return 0;
}

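/*
 * The guest TOD clock is implemented as a delta: kvm->arch.epoch holds
 * "guest TOD - host TOD". Setting the clock therefore just stores that
 * difference and forces each vcpu out of SIE so the updated epoch in the
 * SIE block is picked up on reentry.
 */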
static int kvm_s390_set_tod_low(struct kvm *kvm, struct kvm_device_attr *attr)
{
	struct kvm_vcpu *cur_vcpu;
	unsigned int vcpu_idx;
	u64 host_tod, gtod;
	int r;

	if (copy_from_user(&gtod, (void __user *)attr->addr, sizeof(gtod)))
		return -EFAULT;

	r = store_tod_clock(&host_tod);
	if (r)
		return r;

	mutex_lock(&kvm->lock);
	kvm->arch.epoch = gtod - host_tod;
	kvm_for_each_vcpu(vcpu_idx, cur_vcpu, kvm) {
		cur_vcpu->arch.sie_block->epoch = kvm->arch.epoch;
		exit_sie(cur_vcpu);
	}
	mutex_unlock(&kvm->lock);
	return 0;
}

static int kvm_s390_set_tod(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret;

	if (attr->flags)
		return -EINVAL;

	switch (attr->attr) {
	case KVM_S390_VM_TOD_HIGH:
		ret = kvm_s390_set_tod_high(kvm, attr);
		break;
	case KVM_S390_VM_TOD_LOW:
		ret = kvm_s390_set_tod_low(kvm, attr);
		break;
	default:
		ret = -ENXIO;
		break;
	}
	return ret;
}

static int kvm_s390_get_tod_high(struct kvm *kvm, struct kvm_device_attr *attr)
{
	u8 gtod_high = 0;

	if (copy_to_user((void __user *)attr->addr, &gtod_high,
			 sizeof(gtod_high)))
		return -EFAULT;

	return 0;
}

static int kvm_s390_get_tod_low(struct kvm *kvm, struct kvm_device_attr *attr)
{
	u64 host_tod, gtod;
	int r;

	r = store_tod_clock(&host_tod);
	if (r)
		return r;

	gtod = host_tod + kvm->arch.epoch;
	if (copy_to_user((void __user *)attr->addr, &gtod, sizeof(gtod)))
		return -EFAULT;

	return 0;
}

static int kvm_s390_get_tod(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret;

	if (attr->flags)
		return -EINVAL;

	switch (attr->attr) {
	case KVM_S390_VM_TOD_HIGH:
		ret = kvm_s390_get_tod_high(kvm, attr);
		break;
	case KVM_S390_VM_TOD_LOW:
		ret = kvm_s390_get_tod_low(kvm, attr);
		break;
	default:
		ret = -ENXIO;
		break;
	}
	return ret;
}

static int kvm_s390_set_processor(struct kvm *kvm, struct kvm_device_attr *attr)
{
	struct kvm_s390_vm_cpu_processor *proc;
	int ret = 0;

	mutex_lock(&kvm->lock);
	if (atomic_read(&kvm->online_vcpus)) {
		ret = -EBUSY;
		goto out;
	}
	proc = kzalloc(sizeof(*proc), GFP_KERNEL);
	if (!proc) {
		ret = -ENOMEM;
		goto out;
	}
	if (!copy_from_user(proc, (void __user *)attr->addr,
			    sizeof(*proc))) {
		memcpy(&kvm->arch.model.cpu_id, &proc->cpuid,
		       sizeof(struct cpuid));
		kvm->arch.model.ibc = proc->ibc;
		memcpy(kvm->arch.model.fac->list, proc->fac_list,
		       S390_ARCH_FAC_LIST_SIZE_BYTE);
	} else
		ret = -EFAULT;
	kfree(proc);
out:
	mutex_unlock(&kvm->lock);
	return ret;
}

static int kvm_s390_set_cpu_model(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret = -ENXIO;

	switch (attr->attr) {
	case KVM_S390_VM_CPU_PROCESSOR:
		ret = kvm_s390_set_processor(kvm, attr);
		break;
	}
	return ret;
}

static int kvm_s390_get_processor(struct kvm *kvm, struct kvm_device_attr *attr)
{
	struct kvm_s390_vm_cpu_processor *proc;
	int ret = 0;

	proc = kzalloc(sizeof(*proc), GFP_KERNEL);
	if (!proc) {
		ret = -ENOMEM;
		goto out;
	}
	memcpy(&proc->cpuid, &kvm->arch.model.cpu_id, sizeof(struct cpuid));
	proc->ibc = kvm->arch.model.ibc;
	memcpy(&proc->fac_list, kvm->arch.model.fac->list, S390_ARCH_FAC_LIST_SIZE_BYTE);
	if (copy_to_user((void __user *)attr->addr, proc, sizeof(*proc)))
		ret = -EFAULT;
	kfree(proc);
out:
	return ret;
}

static int kvm_s390_get_machine(struct kvm *kvm, struct kvm_device_attr *attr)
{
	struct kvm_s390_vm_cpu_machine *mach;
	int ret = 0;

	mach = kzalloc(sizeof(*mach), GFP_KERNEL);
	if (!mach) {
		ret = -ENOMEM;
		goto out;
	}
	get_cpu_id((struct cpuid *) &mach->cpuid);
	mach->ibc = sclp.ibc;
	memcpy(&mach->fac_mask, kvm->arch.model.fac->mask,
	       S390_ARCH_FAC_LIST_SIZE_BYTE);
	memcpy((unsigned long *)&mach->fac_list, S390_lowcore.stfle_fac_list,
	       S390_ARCH_FAC_LIST_SIZE_BYTE);
	if (copy_to_user((void __user *)attr->addr, mach, sizeof(*mach)))
		ret = -EFAULT;
	kfree(mach);
out:
	return ret;
}

static int kvm_s390_get_cpu_model(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret = -ENXIO;

	switch (attr->attr) {
	case KVM_S390_VM_CPU_PROCESSOR:
		ret = kvm_s390_get_processor(kvm, attr);
		break;
	case KVM_S390_VM_CPU_MACHINE:
		ret = kvm_s390_get_machine(kvm, attr);
		break;
	}
	return ret;
}

static int kvm_s390_vm_set_attr(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret;

	switch (attr->group) {
	case KVM_S390_VM_MEM_CTRL:
		ret = kvm_s390_set_mem_control(kvm, attr);
		break;
	case KVM_S390_VM_TOD:
		ret = kvm_s390_set_tod(kvm, attr);
		break;
	case KVM_S390_VM_CPU_MODEL:
		ret = kvm_s390_set_cpu_model(kvm, attr);
		break;
	case KVM_S390_VM_CRYPTO:
		ret = kvm_s390_vm_set_crypto(kvm, attr);
		break;
	default:
		ret = -ENXIO;
		break;
	}

	return ret;
}

static int kvm_s390_vm_get_attr(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret;

	switch (attr->group) {
	case KVM_S390_VM_MEM_CTRL:
		ret = kvm_s390_get_mem_control(kvm, attr);
		break;
	case KVM_S390_VM_TOD:
		ret = kvm_s390_get_tod(kvm, attr);
		break;
	case KVM_S390_VM_CPU_MODEL:
		ret = kvm_s390_get_cpu_model(kvm, attr);
		break;
	default:
		ret = -ENXIO;
		break;
	}

	return ret;
}

static int kvm_s390_vm_has_attr(struct kvm *kvm, struct kvm_device_attr *attr)
{
	int ret;

	switch (attr->group) {
	case KVM_S390_VM_MEM_CTRL:
		switch (attr->attr) {
		case KVM_S390_VM_MEM_ENABLE_CMMA:
		case KVM_S390_VM_MEM_CLR_CMMA:
		case KVM_S390_VM_MEM_LIMIT_SIZE:
			ret = 0;
			break;
		default:
			ret = -ENXIO;
			break;
		}
		break;
	case KVM_S390_VM_TOD:
		switch (attr->attr) {
		case KVM_S390_VM_TOD_LOW:
		case KVM_S390_VM_TOD_HIGH:
			ret = 0;
			break;
		default:
			ret = -ENXIO;
			break;
		}
		break;
	case KVM_S390_VM_CPU_MODEL:
		switch (attr->attr) {
		case KVM_S390_VM_CPU_PROCESSOR:
		case KVM_S390_VM_CPU_MACHINE:
			ret = 0;
			break;
		default:
			ret = -ENXIO;
			break;
		}
		break;
	case KVM_S390_VM_CRYPTO:
		switch (attr->attr) {
		case KVM_S390_VM_CRYPTO_ENABLE_AES_KW:
		case KVM_S390_VM_CRYPTO_ENABLE_DEA_KW:
		case KVM_S390_VM_CRYPTO_DISABLE_AES_KW:
		case KVM_S390_VM_CRYPTO_DISABLE_DEA_KW:
			ret = 0;
			break;
		default:
			ret = -ENXIO;
			break;
		}
		break;
	default:
		ret = -ENXIO;
		break;
	}

	return ret;
}

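/*
 * Read guest storage keys into a userspace buffer. Illustrative use from
 * userspace (a sketch, not part of this file; "vm_fd", "buf" and "npages"
 * are assumed to exist in the caller):
 *
 *	struct kvm_s390_skeys args = {
 *		.start_gfn = 0,
 *		.count = npages,
 *		.skeydata_addr = (__u64)(unsigned long)buf,
 *	};
 *	ioctl(vm_fd, KVM_S390_GET_SKEYS, &args);
 *
 * A return value of KVM_S390_GET_SKEYS_NONE means the guest does not use
 * storage keys and nothing was copied.
 */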
static long kvm_s390_get_skeys(struct kvm *kvm, struct kvm_s390_skeys *args)
{
	uint8_t *keys;
	uint64_t hva;
	unsigned long curkey;
	int i, r = 0;

	if (args->flags != 0)
		return -EINVAL;

	/* Is this guest using storage keys? */
	if (!mm_use_skey(current->mm))
		return KVM_S390_GET_SKEYS_NONE;

	/* Enforce sane limit on memory allocation */
	if (args->count < 1 || args->count > KVM_S390_SKEYS_MAX)
		return -EINVAL;

	keys = kmalloc_array(args->count, sizeof(uint8_t),
			     GFP_KERNEL | __GFP_NOWARN);
	if (!keys)
		keys = vmalloc(sizeof(uint8_t) * args->count);
	if (!keys)
		return -ENOMEM;

	for (i = 0; i < args->count; i++) {
		hva = gfn_to_hva(kvm, args->start_gfn + i);
		if (kvm_is_error_hva(hva)) {
			r = -EFAULT;
			goto out;
		}

		curkey = get_guest_storage_key(current->mm, hva);
		if (IS_ERR_VALUE(curkey)) {
			r = curkey;
			goto out;
		}
		keys[i] = curkey;
	}

	r = copy_to_user((uint8_t __user *)args->skeydata_addr, keys,
			 sizeof(uint8_t) * args->count);
	if (r)
		r = -EFAULT;
out:
	kvfree(keys);
	return r;
}

static long kvm_s390_set_skeys(struct kvm *kvm, struct kvm_s390_skeys *args)
{
	uint8_t *keys;
	uint64_t hva;
	int i, r = 0;

	if (args->flags != 0)
		return -EINVAL;

	/* Enforce sane limit on memory allocation */
	if (args->count < 1 || args->count > KVM_S390_SKEYS_MAX)
		return -EINVAL;

	keys = kmalloc_array(args->count, sizeof(uint8_t),
			     GFP_KERNEL | __GFP_NOWARN);
	if (!keys)
		keys = vmalloc(sizeof(uint8_t) * args->count);
	if (!keys)
		return -ENOMEM;

	r = copy_from_user(keys, (uint8_t __user *)args->skeydata_addr,
			   sizeof(uint8_t) * args->count);
	if (r) {
		r = -EFAULT;
		goto out;
	}

	/* Enable storage key handling for the guest */
	s390_enable_skey();

	for (i = 0; i < args->count; i++) {
		hva = gfn_to_hva(kvm, args->start_gfn + i);
		if (kvm_is_error_hva(hva)) {
			r = -EFAULT;
			goto out;
		}

		/* Lowest order bit is reserved */
		if (keys[i] & 0x01) {
			r = -EINVAL;
			goto out;
		}

		r = set_guest_storage_key(current->mm, hva,
					  (unsigned long)keys[i], 0);
		if (r)
			goto out;
	}
out:
	kvfree(keys);
	return r;
}

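/*
 * Dispatcher for VM-level ioctls. The device attribute ioctls
 * (KVM_SET/GET/HAS_DEVICE_ATTR) carry a struct kvm_device_attr whose group
 * selects one of the handlers above, e.g. (userspace sketch, assuming an
 * open VM fd):
 *
 *	struct kvm_device_attr attr = {
 *		.group = KVM_S390_VM_MEM_CTRL,
 *		.attr = KVM_S390_VM_MEM_ENABLE_CMMA,
 *	};
 *	ioctl(vm_fd, KVM_SET_DEVICE_ATTR, &attr);
 */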
long kvm_arch_vm_ioctl(struct file *filp,
		       unsigned int ioctl, unsigned long arg)
{
	struct kvm *kvm = filp->private_data;
	void __user *argp = (void __user *)arg;
	struct kvm_device_attr attr;
	int r;

	switch (ioctl) {
	case KVM_S390_INTERRUPT: {
		struct kvm_s390_interrupt s390int;

		r = -EFAULT;
		if (copy_from_user(&s390int, argp, sizeof(s390int)))
			break;
		r = kvm_s390_inject_vm(kvm, &s390int);
		break;
	}
	case KVM_ENABLE_CAP: {
		struct kvm_enable_cap cap;
		r = -EFAULT;
		if (copy_from_user(&cap, argp, sizeof(cap)))
			break;
		r = kvm_vm_ioctl_enable_cap(kvm, &cap);
		break;
	}
	case KVM_CREATE_IRQCHIP: {
		struct kvm_irq_routing_entry routing;

		r = -EINVAL;
		if (kvm->arch.use_irqchip) {
			/* Set up dummy routing. */
			memset(&routing, 0, sizeof(routing));
			kvm_set_irq_routing(kvm, &routing, 0, 0);
			r = 0;
		}
		break;
	}
	case KVM_SET_DEVICE_ATTR: {
		r = -EFAULT;
		if (copy_from_user(&attr, (void __user *)arg, sizeof(attr)))
			break;
		r = kvm_s390_vm_set_attr(kvm, &attr);
		break;
	}
	case KVM_GET_DEVICE_ATTR: {
		r = -EFAULT;
		if (copy_from_user(&attr, (void __user *)arg, sizeof(attr)))
			break;
		r = kvm_s390_vm_get_attr(kvm, &attr);
		break;
	}
	case KVM_HAS_DEVICE_ATTR: {
		r = -EFAULT;
		if (copy_from_user(&attr, (void __user *)arg, sizeof(attr)))
			break;
		r = kvm_s390_vm_has_attr(kvm, &attr);
		break;
	}
	case KVM_S390_GET_SKEYS: {
		struct kvm_s390_skeys args;

		r = -EFAULT;
		if (copy_from_user(&args, argp,
				   sizeof(struct kvm_s390_skeys)))
			break;
		r = kvm_s390_get_skeys(kvm, &args);
		break;
	}
	case KVM_S390_SET_SKEYS: {
		struct kvm_s390_skeys args;

		r = -EFAULT;
		if (copy_from_user(&args, argp,
				   sizeof(struct kvm_s390_skeys)))
			break;
		r = kvm_s390_set_skeys(kvm, &args);
		break;
	}
	default:
		r = -ENOTTY;
	}

	return r;
}

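/*
 * Query the AP (adjunct processor) configuration via PQAP(QCI): the
 * function code is loaded into register 0 and the address of the 128-byte
 * response block into register 2; 0xb2af0000 is the PQAP opcode emitted
 * directly. The condition code is extracted with ipm/srl and returned;
 * the EX_TABLE entry provides the exception fixup for the sequence.
 */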
static int kvm_s390_query_ap_config(u8 *config)
{
	u32 fcn_code = 0x04000000UL;
	u32 cc = 0;

	memset(config, 0, 128);
	asm volatile(
		"lgr 0,%1\n"
		"lgr 2,%2\n"
		".long 0xb2af0000\n"		/* PQAP(QCI) */
		"0: ipm %0\n"
		"srl %0,28\n"
		"1:\n"
		EX_TABLE(0b, 1b)
		: "+r" (cc)
		: "r" (fcn_code), "r" (config)
		: "cc", "0", "2", "memory"
	);

	return cc;
}

static int kvm_s390_apxa_installed(void)
{
	u8 config[128];
	int cc;

	if (test_facility(2) && test_facility(12)) {
		cc = kvm_s390_query_ap_config(config);

		if (cc)
			pr_err("PQAP(QCI) failed with cc=%d", cc);
		else
			return config[0] & 0x40;
	}

	return 0;
}

static void kvm_s390_set_crycb_format(struct kvm *kvm)
{
	kvm->arch.crypto.crycbd = (__u32)(unsigned long) kvm->arch.crypto.crycb;

	if (kvm_s390_apxa_installed())
		kvm->arch.crypto.crycbd |= CRYCB_FORMAT2;
	else
		kvm->arch.crypto.crycbd |= CRYCB_FORMAT1;
}

static void kvm_s390_get_cpu_id(struct cpuid *cpu_id)
{
	get_cpu_id(cpu_id);
	cpu_id->version = 0xff;
}

static int kvm_s390_crypto_init(struct kvm *kvm)
{
	if (!test_kvm_facility(kvm, 76))
		return 0;

	kvm->arch.crypto.crycb = kzalloc(sizeof(*kvm->arch.crypto.crycb),
					 GFP_KERNEL | GFP_DMA);
	if (!kvm->arch.crypto.crycb)
		return -ENOMEM;

	kvm_s390_set_crycb_format(kvm);

	/* Enable AES/DEA protected key functions by default */
	kvm->arch.crypto.aes_kw = 1;
	kvm->arch.crypto.dea_kw = 1;
	get_random_bytes(kvm->arch.crypto.crycb->aes_wrapping_key_mask,
			 sizeof(kvm->arch.crypto.crycb->aes_wrapping_key_mask));
	get_random_bytes(kvm->arch.crypto.crycb->dea_wrapping_key_mask,
			 sizeof(kvm->arch.crypto.crycb->dea_wrapping_key_mask));

	return 0;
}

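/*
 * VM creation. Note the sca_offset game below: the SCA (system control
 * area) is much smaller than a page, so consecutive VMs place their SCA
 * at different 16-byte offsets within their page (wrapping at 0x7f0),
 * presumably to spread the blocks over distinct cache lines.
 */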
int kvm_arch_init_vm(struct kvm *kvm, unsigned long type)
{
	int i, rc;
	char debug_name[16];
	static unsigned long sca_offset;

	rc = -EINVAL;
#ifdef CONFIG_KVM_S390_UCONTROL
	if (type & ~KVM_VM_S390_UCONTROL)
		goto out_err;
	if ((type & KVM_VM_S390_UCONTROL) && (!capable(CAP_SYS_ADMIN)))
		goto out_err;
#else
	if (type)
		goto out_err;
#endif

	rc = s390_enable_sie();
	if (rc)
		goto out_err;

	rc = -ENOMEM;

	kvm->arch.sca = (struct sca_block *) get_zeroed_page(GFP_KERNEL);
	if (!kvm->arch.sca)
		goto out_err;
	spin_lock(&kvm_lock);
	sca_offset = (sca_offset + 16) & 0x7f0;
	kvm->arch.sca = (struct sca_block *) ((char *) kvm->arch.sca + sca_offset);
	spin_unlock(&kvm_lock);

	sprintf(debug_name, "kvm-%u", current->pid);

	kvm->arch.dbf = debug_register(debug_name, 8, 2, 8 * sizeof(long));
	if (!kvm->arch.dbf)
		goto out_err;

	/*
	 * The architectural maximum amount of facilities is 16 kbit. To store
	 * this amount, 2 kbyte of memory is required. Thus we need a full
	 * page to hold the guest facility list (arch.model.fac->list) and the
	 * facility mask (arch.model.fac->mask). Its address size has to be
	 * 31 bits and word aligned.
	 */
	kvm->arch.model.fac =
		(struct kvm_s390_fac *) get_zeroed_page(GFP_KERNEL | GFP_DMA);
	if (!kvm->arch.model.fac)
		goto out_err;

	/* Populate the facility mask initially. */
	memcpy(kvm->arch.model.fac->mask, S390_lowcore.stfle_fac_list,
	       S390_ARCH_FAC_LIST_SIZE_BYTE);
	for (i = 0; i < S390_ARCH_FAC_LIST_SIZE_U64; i++) {
		if (i < kvm_s390_fac_list_mask_size())
			kvm->arch.model.fac->mask[i] &= kvm_s390_fac_list_mask[i];
		else
			kvm->arch.model.fac->mask[i] = 0UL;
	}

	/* Populate the facility list initially. */
	memcpy(kvm->arch.model.fac->list, kvm->arch.model.fac->mask,
	       S390_ARCH_FAC_LIST_SIZE_BYTE);

	kvm_s390_get_cpu_id(&kvm->arch.model.cpu_id);
	kvm->arch.model.ibc = sclp.ibc & 0x0fff;

	if (kvm_s390_crypto_init(kvm) < 0)
		goto out_err;

	spin_lock_init(&kvm->arch.float_int.lock);
	for (i = 0; i < FIRQ_LIST_COUNT; i++)
		INIT_LIST_HEAD(&kvm->arch.float_int.lists[i]);
	init_waitqueue_head(&kvm->arch.ipte_wq);
	mutex_init(&kvm->arch.ipte_mutex);

	debug_register_view(kvm->arch.dbf, &debug_sprintf_view);
	VM_EVENT(kvm, 3, "%s", "vm created");

	if (type & KVM_VM_S390_UCONTROL) {
		kvm->arch.gmap = NULL;
	} else {
		kvm->arch.gmap = gmap_alloc(current->mm, (1UL << 44) - 1);
		if (!kvm->arch.gmap)
			goto out_err;
		kvm->arch.gmap->private = kvm;
		kvm->arch.gmap->pfault_enabled = 0;
	}

	kvm->arch.css_support = 0;
	kvm->arch.use_irqchip = 0;
	kvm->arch.epoch = 0;

	spin_lock_init(&kvm->arch.start_stop_lock);

	return 0;
out_err:
	kfree(kvm->arch.crypto.crycb);
	free_page((unsigned long)kvm->arch.model.fac);
	debug_unregister(kvm->arch.dbf);
	free_page((unsigned long)(kvm->arch.sca));
	return rc;
}

void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu)
{
	VCPU_EVENT(vcpu, 3, "%s", "free cpu");
	trace_kvm_s390_destroy_vcpu(vcpu->vcpu_id);
	kvm_s390_clear_local_irqs(vcpu);
	kvm_clear_async_pf_completion_queue(vcpu);
	if (!kvm_is_ucontrol(vcpu->kvm)) {
		clear_bit(63 - vcpu->vcpu_id,
			  (unsigned long *) &vcpu->kvm->arch.sca->mcn);
		if (vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].sda ==
		    (__u64) vcpu->arch.sie_block)
			vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].sda = 0;
	}
	smp_mb();

	if (kvm_is_ucontrol(vcpu->kvm))
		gmap_free(vcpu->arch.gmap);

	if (kvm_s390_cmma_enabled(vcpu->kvm))
		kvm_s390_vcpu_unsetup_cmma(vcpu);
	free_page((unsigned long)(vcpu->arch.sie_block));

	kvm_vcpu_uninit(vcpu);
	kmem_cache_free(kvm_vcpu_cache, vcpu);
}

static void kvm_free_vcpus(struct kvm *kvm)
{
	unsigned int i;
	struct kvm_vcpu *vcpu;

	kvm_for_each_vcpu(i, vcpu, kvm)
		kvm_arch_vcpu_destroy(vcpu);

	mutex_lock(&kvm->lock);
	for (i = 0; i < atomic_read(&kvm->online_vcpus); i++)
		kvm->vcpus[i] = NULL;

	atomic_set(&kvm->online_vcpus, 0);
	mutex_unlock(&kvm->lock);
}

void kvm_arch_destroy_vm(struct kvm *kvm)
{
	kvm_free_vcpus(kvm);
	free_page((unsigned long)kvm->arch.model.fac);
	free_page((unsigned long)(kvm->arch.sca));
	debug_unregister(kvm->arch.dbf);
	kfree(kvm->arch.crypto.crycb);
	if (!kvm_is_ucontrol(kvm))
		gmap_free(kvm->arch.gmap);
	kvm_s390_destroy_adapters(kvm);
	kvm_s390_clear_float_irqs(kvm);
}

/* Section: vcpu related */
static int __kvm_ucontrol_vcpu_init(struct kvm_vcpu *vcpu)
{
	vcpu->arch.gmap = gmap_alloc(current->mm, -1UL);
	if (!vcpu->arch.gmap)
		return -ENOMEM;
	vcpu->arch.gmap->private = vcpu->kvm;

	return 0;
}

int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu)
{
	vcpu->arch.pfault_token = KVM_S390_PFAULT_TOKEN_INVALID;
	kvm_clear_async_pf_completion_queue(vcpu);
	vcpu->run->kvm_valid_regs = KVM_SYNC_PREFIX |
				    KVM_SYNC_GPRS |
				    KVM_SYNC_ACRS |
				    KVM_SYNC_CRS |
				    KVM_SYNC_ARCH0 |
				    KVM_SYNC_PFAULT;
	if (test_kvm_facility(vcpu->kvm, 129))
		vcpu->run->kvm_valid_regs |= KVM_SYNC_VRS;

	if (kvm_is_ucontrol(vcpu->kvm))
		return __kvm_ucontrol_vcpu_init(vcpu);

	return 0;
}

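/*
 * Context switch to/from the vcpu: load saves the host floating point
 * (or vector, if facility 129 is available) and access registers and
 * installs the guest state; put does the reverse when the vcpu is
 * scheduled out.
 */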
void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu)
{
	save_fp_ctl(&vcpu->arch.host_fpregs.fpc);
	if (test_kvm_facility(vcpu->kvm, 129))
		save_vx_regs((__vector128 *)&vcpu->arch.host_vregs->vrs);
	else
		save_fp_regs(vcpu->arch.host_fpregs.fprs);
	save_access_regs(vcpu->arch.host_acrs);
	if (test_kvm_facility(vcpu->kvm, 129)) {
		restore_fp_ctl(&vcpu->run->s.regs.fpc);
		restore_vx_regs((__vector128 *)&vcpu->run->s.regs.vrs);
	} else {
		restore_fp_ctl(&vcpu->arch.guest_fpregs.fpc);
		restore_fp_regs(vcpu->arch.guest_fpregs.fprs);
	}
	restore_access_regs(vcpu->run->s.regs.acrs);
	gmap_enable(vcpu->arch.gmap);
	atomic_set_mask(CPUSTAT_RUNNING, &vcpu->arch.sie_block->cpuflags);
}

void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu)
{
	atomic_clear_mask(CPUSTAT_RUNNING, &vcpu->arch.sie_block->cpuflags);
	gmap_disable(vcpu->arch.gmap);
	if (test_kvm_facility(vcpu->kvm, 129)) {
		save_fp_ctl(&vcpu->run->s.regs.fpc);
		save_vx_regs((__vector128 *)&vcpu->run->s.regs.vrs);
	} else {
		save_fp_ctl(&vcpu->arch.guest_fpregs.fpc);
		save_fp_regs(vcpu->arch.guest_fpregs.fprs);
	}
	save_access_regs(vcpu->run->s.regs.acrs);
	restore_fp_ctl(&vcpu->arch.host_fpregs.fpc);
	if (test_kvm_facility(vcpu->kvm, 129))
		restore_vx_regs((__vector128 *)&vcpu->arch.host_vregs->vrs);
	else
		restore_fp_regs(vcpu->arch.host_fpregs.fprs);
	restore_access_regs(vcpu->arch.host_acrs);
}

static void kvm_s390_vcpu_initial_reset(struct kvm_vcpu *vcpu)
{
	/* this equals initial cpu reset in pop, but we don't switch to ESA */
	vcpu->arch.sie_block->gpsw.mask = 0UL;
	vcpu->arch.sie_block->gpsw.addr = 0UL;
	kvm_s390_set_prefix(vcpu, 0);
	vcpu->arch.sie_block->cputm = 0UL;
	vcpu->arch.sie_block->ckc = 0UL;
	vcpu->arch.sie_block->todpr = 0;
	memset(vcpu->arch.sie_block->gcr, 0, 16 * sizeof(__u64));
	vcpu->arch.sie_block->gcr[0] = 0xE0UL;
	vcpu->arch.sie_block->gcr[14] = 0xC2000000UL;
	vcpu->arch.guest_fpregs.fpc = 0;
	asm volatile("lfpc %0" : : "Q" (vcpu->arch.guest_fpregs.fpc));
	vcpu->arch.sie_block->gbea = 1;
	vcpu->arch.sie_block->pp = 0;
	vcpu->arch.pfault_token = KVM_S390_PFAULT_TOKEN_INVALID;
	kvm_clear_async_pf_completion_queue(vcpu);
	if (!kvm_s390_user_cpu_state_ctrl(vcpu->kvm))
		kvm_s390_vcpu_stop(vcpu);
	kvm_s390_clear_local_irqs(vcpu);
}

void kvm_arch_vcpu_postcreate(struct kvm_vcpu *vcpu)
{
	mutex_lock(&vcpu->kvm->lock);
	vcpu->arch.sie_block->epoch = vcpu->kvm->arch.epoch;
	mutex_unlock(&vcpu->kvm->lock);
	if (!kvm_is_ucontrol(vcpu->kvm))
		vcpu->arch.gmap = vcpu->kvm->arch.gmap;
}

static void kvm_s390_vcpu_crypto_setup(struct kvm_vcpu *vcpu)
{
	if (!test_kvm_facility(vcpu->kvm, 76))
		return;

	vcpu->arch.sie_block->ecb3 &= ~(ECB3_AES | ECB3_DEA);

	if (vcpu->kvm->arch.crypto.aes_kw)
		vcpu->arch.sie_block->ecb3 |= ECB3_AES;
	if (vcpu->kvm->arch.crypto.dea_kw)
		vcpu->arch.sie_block->ecb3 |= ECB3_DEA;

	vcpu->arch.sie_block->crycbd = vcpu->kvm->arch.crypto.crycbd;
}

void kvm_s390_vcpu_unsetup_cmma(struct kvm_vcpu *vcpu)
{
	free_page(vcpu->arch.sie_block->cbrlo);
	vcpu->arch.sie_block->cbrlo = 0;
}

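/*
 * Allocate the collaborative-memory-management buffer for a vcpu and flip
 * the (unnamed here) ecb2 bits: 0x80 apparently switches CMMA
 * interpretation on, while 0x08 (PFMF interpretation) is switched off.
 */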
int kvm_s390_vcpu_setup_cmma(struct kvm_vcpu *vcpu)
{
	vcpu->arch.sie_block->cbrlo = get_zeroed_page(GFP_KERNEL);
	if (!vcpu->arch.sie_block->cbrlo)
		return -ENOMEM;

	vcpu->arch.sie_block->ecb2 |= 0x80;
	vcpu->arch.sie_block->ecb2 &= ~0x08;
	return 0;
}

static void kvm_s390_vcpu_setup_model(struct kvm_vcpu *vcpu)
{
	struct kvm_s390_cpu_model *model = &vcpu->kvm->arch.model;

	vcpu->arch.cpu_id = model->cpu_id;
	vcpu->arch.sie_block->ibc = model->ibc;
	vcpu->arch.sie_block->fac = (int) (long) model->fac->list;
}

int kvm_arch_vcpu_setup(struct kvm_vcpu *vcpu)
{
	int rc = 0;

	atomic_set(&vcpu->arch.sie_block->cpuflags, CPUSTAT_ZARCH |
						    CPUSTAT_SM |
						    CPUSTAT_STOPPED |
						    CPUSTAT_GED);
	kvm_s390_vcpu_setup_model(vcpu);

	vcpu->arch.sie_block->ecb = 6;
	if (test_kvm_facility(vcpu->kvm, 50) && test_kvm_facility(vcpu->kvm, 73))
		vcpu->arch.sie_block->ecb |= 0x10;

	vcpu->arch.sie_block->ecb2 = 8;
	vcpu->arch.sie_block->eca = 0xC1002000U;
	if (sclp.has_siif)
		vcpu->arch.sie_block->eca |= 1;
	if (sclp.has_sigpif)
		vcpu->arch.sie_block->eca |= 0x10000000U;
	if (test_kvm_facility(vcpu->kvm, 129)) {
		vcpu->arch.sie_block->eca |= 0x00020000;
		vcpu->arch.sie_block->ecd |= 0x20000000;
	}
	vcpu->arch.sie_block->ictl |= ICTL_ISKE | ICTL_SSKE | ICTL_RRBE;

	if (kvm_s390_cmma_enabled(vcpu->kvm)) {
		rc = kvm_s390_vcpu_setup_cmma(vcpu);
		if (rc)
			return rc;
	}
	hrtimer_init(&vcpu->arch.ckc_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
	vcpu->arch.ckc_timer.function = kvm_s390_idle_wakeup;

	kvm_s390_vcpu_crypto_setup(vcpu);

	return rc;
}

struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm,
				      unsigned int id)
{
	struct kvm_vcpu *vcpu;
	struct sie_page *sie_page;
	int rc = -EINVAL;

	if (id >= KVM_MAX_VCPUS)
		goto out;

	rc = -ENOMEM;

	vcpu = kmem_cache_zalloc(kvm_vcpu_cache, GFP_KERNEL);
	if (!vcpu)
		goto out;

	sie_page = (struct sie_page *) get_zeroed_page(GFP_KERNEL);
	if (!sie_page)
		goto out_free_cpu;

	vcpu->arch.sie_block = &sie_page->sie_block;
	vcpu->arch.sie_block->itdba = (unsigned long) &sie_page->itdb;
	vcpu->arch.host_vregs = &sie_page->vregs;

	vcpu->arch.sie_block->icpua = id;
	if (!kvm_is_ucontrol(kvm)) {
		if (!kvm->arch.sca) {
			WARN_ON_ONCE(1);
			goto out_free_cpu;
		}
		if (!kvm->arch.sca->cpu[id].sda)
			kvm->arch.sca->cpu[id].sda =
				(__u64) vcpu->arch.sie_block;
		vcpu->arch.sie_block->scaoh =
			(__u32)(((__u64)kvm->arch.sca) >> 32);
		vcpu->arch.sie_block->scaol = (__u32)(__u64)kvm->arch.sca;
		set_bit(63 - id, (unsigned long *) &kvm->arch.sca->mcn);
	}

	spin_lock_init(&vcpu->arch.local_int.lock);
	vcpu->arch.local_int.float_int = &kvm->arch.float_int;
	vcpu->arch.local_int.wq = &vcpu->wq;
	vcpu->arch.local_int.cpuflags = &vcpu->arch.sie_block->cpuflags;

	rc = kvm_vcpu_init(vcpu, kvm, id);
	if (rc)
		goto out_free_sie_block;
	VM_EVENT(kvm, 3, "create cpu %d at %p, sie block at %p", id, vcpu,
		 vcpu->arch.sie_block);
	trace_kvm_s390_create_vcpu(id, vcpu, vcpu->arch.sie_block);

	return vcpu;
out_free_sie_block:
	free_page((unsigned long)(vcpu->arch.sie_block));
out_free_cpu:
	kmem_cache_free(kvm_vcpu_cache, vcpu);
out:
	return ERR_PTR(rc);
}

int kvm_arch_vcpu_runnable(struct kvm_vcpu *vcpu)
{
	return kvm_s390_vcpu_has_irq(vcpu, 0);
}

void s390_vcpu_block(struct kvm_vcpu *vcpu)
{
	atomic_set_mask(PROG_BLOCK_SIE, &vcpu->arch.sie_block->prog20);
}

void s390_vcpu_unblock(struct kvm_vcpu *vcpu)
{
	atomic_clear_mask(PROG_BLOCK_SIE, &vcpu->arch.sie_block->prog20);
}

/*
 * Kick a guest cpu out of SIE and wait until SIE is not running.
 * If the CPU is not running (e.g. waiting as idle) the function will
 * return immediately.
 */
void exit_sie(struct kvm_vcpu *vcpu)
{
	atomic_set_mask(CPUSTAT_STOP_INT, &vcpu->arch.sie_block->cpuflags);
	while (vcpu->arch.sie_block->prog0c & PROG_IN_SIE)
		cpu_relax();
}

/* Kick a guest cpu out of SIE and prevent SIE-reentry */
void exit_sie_sync(struct kvm_vcpu *vcpu)
{
	s390_vcpu_block(vcpu);
	exit_sie(vcpu);
}

static void kvm_gmap_notifier(struct gmap *gmap, unsigned long address)
{
	int i;
	struct kvm *kvm = gmap->private;
	struct kvm_vcpu *vcpu;

	kvm_for_each_vcpu(i, vcpu, kvm) {
		/* match against both prefix pages */
		if (kvm_s390_get_prefix(vcpu) == (address & ~0x1000UL)) {
			VCPU_EVENT(vcpu, 2, "gmap notifier for %lx", address);
			kvm_make_request(KVM_REQ_MMU_RELOAD, vcpu);
			exit_sie_sync(vcpu);
		}
	}
}

int kvm_arch_vcpu_should_kick(struct kvm_vcpu *vcpu)
{
	/* kvm common code refers to this, but never calls it */
	BUG();
	return 0;
}

static int kvm_arch_vcpu_ioctl_get_one_reg(struct kvm_vcpu *vcpu,
					   struct kvm_one_reg *reg)
{
	int r = -EINVAL;

	switch (reg->id) {
	case KVM_REG_S390_TODPR:
		r = put_user(vcpu->arch.sie_block->todpr,
			     (u32 __user *)reg->addr);
		break;
	case KVM_REG_S390_EPOCHDIFF:
		r = put_user(vcpu->arch.sie_block->epoch,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_CPU_TIMER:
		r = put_user(vcpu->arch.sie_block->cputm,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_CLOCK_COMP:
		r = put_user(vcpu->arch.sie_block->ckc,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_PFTOKEN:
		r = put_user(vcpu->arch.pfault_token,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_PFCOMPARE:
		r = put_user(vcpu->arch.pfault_compare,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_PFSELECT:
		r = put_user(vcpu->arch.pfault_select,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_PP:
		r = put_user(vcpu->arch.sie_block->pp,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_GBEA:
		r = put_user(vcpu->arch.sie_block->gbea,
			     (u64 __user *)reg->addr);
		break;
	default:
		break;
	}

	return r;
}

static int kvm_arch_vcpu_ioctl_set_one_reg(struct kvm_vcpu *vcpu,
					   struct kvm_one_reg *reg)
{
	int r = -EINVAL;

	switch (reg->id) {
	case KVM_REG_S390_TODPR:
		r = get_user(vcpu->arch.sie_block->todpr,
			     (u32 __user *)reg->addr);
		break;
	case KVM_REG_S390_EPOCHDIFF:
		r = get_user(vcpu->arch.sie_block->epoch,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_CPU_TIMER:
		r = get_user(vcpu->arch.sie_block->cputm,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_CLOCK_COMP:
		r = get_user(vcpu->arch.sie_block->ckc,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_PFTOKEN:
		r = get_user(vcpu->arch.pfault_token,
			     (u64 __user *)reg->addr);
		if (vcpu->arch.pfault_token == KVM_S390_PFAULT_TOKEN_INVALID)
			kvm_clear_async_pf_completion_queue(vcpu);
		break;
	case KVM_REG_S390_PFCOMPARE:
		r = get_user(vcpu->arch.pfault_compare,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_PFSELECT:
		r = get_user(vcpu->arch.pfault_select,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_PP:
		r = get_user(vcpu->arch.sie_block->pp,
			     (u64 __user *)reg->addr);
		break;
	case KVM_REG_S390_GBEA:
		r = get_user(vcpu->arch.sie_block->gbea,
			     (u64 __user *)reg->addr);
		break;
	default:
		break;
	}

	return r;
}

static int kvm_arch_vcpu_ioctl_initial_reset(struct kvm_vcpu *vcpu)
{
	kvm_s390_vcpu_initial_reset(vcpu);
	return 0;
}

int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs)
{
	memcpy(&vcpu->run->s.regs.gprs, &regs->gprs, sizeof(regs->gprs));
	return 0;
}

int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs)
{
	memcpy(&regs->gprs, &vcpu->run->s.regs.gprs, sizeof(regs->gprs));
	return 0;
}

int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs)
{
	memcpy(&vcpu->run->s.regs.acrs, &sregs->acrs, sizeof(sregs->acrs));
	memcpy(&vcpu->arch.sie_block->gcr, &sregs->crs, sizeof(sregs->crs));
	restore_access_regs(vcpu->run->s.regs.acrs);
	return 0;
}

int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs)
{
	memcpy(&sregs->acrs, &vcpu->run->s.regs.acrs, sizeof(sregs->acrs));
	memcpy(&sregs->crs, &vcpu->arch.sie_block->gcr, sizeof(sregs->crs));
	return 0;
}

int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu)
{
	if (test_fp_ctl(fpu->fpc))
		return -EINVAL;
	memcpy(&vcpu->arch.guest_fpregs.fprs, &fpu->fprs, sizeof(fpu->fprs));
	vcpu->arch.guest_fpregs.fpc = fpu->fpc;
	restore_fp_ctl(&vcpu->arch.guest_fpregs.fpc);
	restore_fp_regs(vcpu->arch.guest_fpregs.fprs);
	return 0;
}

int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu)
{
	memcpy(&fpu->fprs, &vcpu->arch.guest_fpregs.fprs, sizeof(fpu->fprs));
	fpu->fpc = vcpu->arch.guest_fpregs.fpc;
	return 0;
}

static int kvm_arch_vcpu_ioctl_set_initial_psw(struct kvm_vcpu *vcpu, psw_t psw)
{
	int rc = 0;

	if (!is_vcpu_stopped(vcpu))
		rc = -EBUSY;
	else {
		vcpu->run->psw_mask = psw.mask;
		vcpu->run->psw_addr = psw.addr;
	}
	return rc;
}

int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
				  struct kvm_translation *tr)
{
	return -EINVAL; /* not implemented yet */
}

#define VALID_GUESTDBG_FLAGS (KVM_GUESTDBG_SINGLESTEP | \
			      KVM_GUESTDBG_USE_HW_BP | \
			      KVM_GUESTDBG_ENABLE)

int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
					struct kvm_guest_debug *dbg)
{
	int rc = 0;

	vcpu->guest_debug = 0;
	kvm_s390_clear_bp_data(vcpu);

	if (dbg->control & ~VALID_GUESTDBG_FLAGS)
		return -EINVAL;

	if (dbg->control & KVM_GUESTDBG_ENABLE) {
		vcpu->guest_debug = dbg->control;
		/* enforce guest PER */
		atomic_set_mask(CPUSTAT_P, &vcpu->arch.sie_block->cpuflags);

		if (dbg->control & KVM_GUESTDBG_USE_HW_BP)
			rc = kvm_s390_import_bp_data(vcpu, dbg);
	} else {
		atomic_clear_mask(CPUSTAT_P, &vcpu->arch.sie_block->cpuflags);
		vcpu->arch.guestdbg.last_bp = 0;
	}

	if (rc) {
		vcpu->guest_debug = 0;
		kvm_s390_clear_bp_data(vcpu);
		atomic_clear_mask(CPUSTAT_P, &vcpu->arch.sie_block->cpuflags);
	}

	return rc;
}

int kvm_arch_vcpu_ioctl_get_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state)
{
	/* CHECK_STOP and LOAD are not supported yet */
	return is_vcpu_stopped(vcpu) ? KVM_MP_STATE_STOPPED :
				       KVM_MP_STATE_OPERATING;
}

int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state)
{
	int rc = 0;

	/* user space knows about this interface - let it control the state */
	vcpu->kvm->arch.user_cpu_state_ctrl = 1;

	switch (mp_state->mp_state) {
	case KVM_MP_STATE_STOPPED:
		kvm_s390_vcpu_stop(vcpu);
		break;
	case KVM_MP_STATE_OPERATING:
		kvm_s390_vcpu_start(vcpu);
		break;
	case KVM_MP_STATE_LOAD:
	case KVM_MP_STATE_CHECK_STOP:
		/* fall through - CHECK_STOP and LOAD are not supported yet */
	default:
		rc = -ENXIO;
	}

	return rc;
}

bool kvm_s390_cmma_enabled(struct kvm *kvm)
{
	if (!MACHINE_IS_LPAR)
		return false;
	/* only enable for z10 and later */
	if (!MACHINE_HAS_EDAT1)
		return false;
	if (!kvm->arch.use_cmma)
		return false;
	return true;
}

static bool ibs_enabled(struct kvm_vcpu *vcpu)
{
	return atomic_read(&vcpu->arch.sie_block->cpuflags) & CPUSTAT_IBS;
}

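/*
 * Process pending vcpu requests before (re)entering SIE: re-arm the ipte
 * notifier for the prefix page (see the comment below), flush the TLB,
 * and set or clear the IBS cpuflag on request.
 */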
static int kvm_s390_handle_requests(struct kvm_vcpu *vcpu)
{
retry:
	s390_vcpu_unblock(vcpu);
	/*
	 * We use MMU_RELOAD just to re-arm the ipte notifier for the
	 * guest prefix page. gmap_ipte_notify will wait on the ptl lock.
	 * This ensures that the ipte instruction for this request has
	 * already finished. We might race against a second unmapper that
	 * wants to set the blocking bit. Let's just retry the request loop.
	 */
	if (kvm_check_request(KVM_REQ_MMU_RELOAD, vcpu)) {
		int rc;
		rc = gmap_ipte_notify(vcpu->arch.gmap,
				      kvm_s390_get_prefix(vcpu),
				      PAGE_SIZE * 2);
		if (rc)
			return rc;
		goto retry;
	}

	if (kvm_check_request(KVM_REQ_TLB_FLUSH, vcpu)) {
		vcpu->arch.sie_block->ihcpu = 0xffff;
		goto retry;
	}

	if (kvm_check_request(KVM_REQ_ENABLE_IBS, vcpu)) {
		if (!ibs_enabled(vcpu)) {
			trace_kvm_s390_enable_disable_ibs(vcpu->vcpu_id, 1);
			atomic_set_mask(CPUSTAT_IBS,
					&vcpu->arch.sie_block->cpuflags);
		}
		goto retry;
	}

	if (kvm_check_request(KVM_REQ_DISABLE_IBS, vcpu)) {
		if (ibs_enabled(vcpu)) {
			trace_kvm_s390_enable_disable_ibs(vcpu->vcpu_id, 0);
			atomic_clear_mask(CPUSTAT_IBS,
					  &vcpu->arch.sie_block->cpuflags);
		}
		goto retry;
	}

	/* nothing to do, just clear the request */
	clear_bit(KVM_REQ_UNHALT, &vcpu->requests);

	return 0;
}

/**
 * kvm_arch_fault_in_page - fault-in guest page if necessary
 * @vcpu: The corresponding virtual cpu
 * @gpa: Guest physical address
 * @writable: Whether the page should be writable or not
 *
 * Make sure that a guest page has been faulted-in on the host.
 *
 * Return: Zero on success, negative error code otherwise.
 */
long kvm_arch_fault_in_page(struct kvm_vcpu *vcpu, gpa_t gpa, int writable)
{
	return gmap_fault(vcpu->arch.gmap, gpa,
			  writable ? FAULT_FLAG_WRITE : 0);
}

static void __kvm_inject_pfault_token(struct kvm_vcpu *vcpu, bool start_token,
				      unsigned long token)
{
	struct kvm_s390_interrupt inti;
	struct kvm_s390_irq irq;

	if (start_token) {
		irq.u.ext.ext_params2 = token;
		irq.type = KVM_S390_INT_PFAULT_INIT;
		WARN_ON_ONCE(kvm_s390_inject_vcpu(vcpu, &irq));
	} else {
		inti.type = KVM_S390_INT_PFAULT_DONE;
		inti.parm64 = token;
		WARN_ON_ONCE(kvm_s390_inject_vm(vcpu->kvm, &inti));
	}
}

void kvm_arch_async_page_not_present(struct kvm_vcpu *vcpu,
				     struct kvm_async_pf *work)
{
	trace_kvm_s390_pfault_init(vcpu, work->arch.pfault_token);
	__kvm_inject_pfault_token(vcpu, true, work->arch.pfault_token);
}

void kvm_arch_async_page_present(struct kvm_vcpu *vcpu,
				 struct kvm_async_pf *work)
{
	trace_kvm_s390_pfault_done(vcpu, work->arch.pfault_token);
	__kvm_inject_pfault_token(vcpu, false, work->arch.pfault_token);
}

void kvm_arch_async_page_ready(struct kvm_vcpu *vcpu,
			       struct kvm_async_pf *work)
{
	/* s390 will always inject the page directly */
}

bool kvm_arch_can_inject_async_page_present(struct kvm_vcpu *vcpu)
{
	/*
	 * s390 will always inject the page directly,
	 * but we still want check_async_completion to cleanup
	 */
	return true;
}

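/*
 * Decide whether a host page fault may be handled asynchronously via the
 * pfault mechanism: the guest must have registered a valid pfault token,
 * the current PSW must match the guest's pfault compare/select masks,
 * external interrupts must be enabled and permitted by CR0, no interrupt
 * may already be pending, and pfault must be enabled on the gmap.
 * Returns nonzero if an async pf work item was queued.
 */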
static int kvm_arch_setup_async_pf(struct kvm_vcpu *vcpu)
{
	hva_t hva;
	struct kvm_arch_async_pf arch;
	int rc;

	if (vcpu->arch.pfault_token == KVM_S390_PFAULT_TOKEN_INVALID)
		return 0;
	if ((vcpu->arch.sie_block->gpsw.mask & vcpu->arch.pfault_select) !=
	    vcpu->arch.pfault_compare)
		return 0;
	if (psw_extint_disabled(vcpu))
		return 0;
	if (kvm_s390_vcpu_has_irq(vcpu, 0))
		return 0;
	if (!(vcpu->arch.sie_block->gcr[0] & 0x200ul))
		return 0;
	if (!vcpu->arch.gmap->pfault_enabled)
		return 0;

	hva = gfn_to_hva(vcpu->kvm, gpa_to_gfn(current->thread.gmap_addr));
	hva += current->thread.gmap_addr & ~PAGE_MASK;
	if (read_guest_real(vcpu, vcpu->arch.pfault_token, &arch.pfault_token, 8))
		return 0;

	rc = kvm_setup_async_pf(vcpu, current->thread.gmap_addr, hva, &arch);
	return rc;
}

static int vcpu_pre_run(struct kvm_vcpu *vcpu)
{
	int rc, cpuflags;

	/*
	 * On s390 notifications for arriving pages will be delivered directly
	 * to the guest but the housekeeping for completed pfaults is
	 * handled outside the worker.
	 */
	kvm_check_async_pf_completion(vcpu);

	memcpy(&vcpu->arch.sie_block->gg14, &vcpu->run->s.regs.gprs[14], 16);

	if (need_resched())
		schedule();

	if (test_cpu_flag(CIF_MCCK_PENDING))
		s390_handle_mcck();

	if (!kvm_is_ucontrol(vcpu->kvm)) {
		rc = kvm_s390_deliver_pending_interrupts(vcpu);
		if (rc)
			return rc;
	}

	rc = kvm_s390_handle_requests(vcpu);
	if (rc)
		return rc;

	if (guestdbg_enabled(vcpu)) {
		kvm_s390_backup_guest_per_regs(vcpu);
		kvm_s390_patch_guest_per_regs(vcpu);
	}

	vcpu->arch.sie_block->icptcode = 0;
	cpuflags = atomic_read(&vcpu->arch.sie_block->cpuflags);
	VCPU_EVENT(vcpu, 6, "entering sie flags %x", cpuflags);
	trace_kvm_s390_sie_enter(vcpu, cpuflags);

	return 0;
}

static int vcpu_post_run_fault_in_sie(struct kvm_vcpu *vcpu)
{
	psw_t *psw = &vcpu->arch.sie_block->gpsw;
	u8 opcode;
	int rc;

	VCPU_EVENT(vcpu, 3, "%s", "fault in sie instruction");
	trace_kvm_s390_sie_fault(vcpu);

	/*
	 * We want to inject an addressing exception, which is defined as a
	 * suppressing or terminating exception. However, since we came here
	 * by a DAT access exception, the PSW still points to the faulting
	 * instruction since DAT exceptions are nullifying. So we've got
	 * to look up the current opcode to get the length of the instruction
	 * to be able to forward the PSW.
	 */
	rc = read_guest(vcpu, psw->addr, 0, &opcode, 1);
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);
	psw->addr = __rewind_psw(*psw, -insn_length(opcode));

	return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);
}

static int vcpu_post_run(struct kvm_vcpu *vcpu, int exit_reason)
{
	int rc = -1;

	VCPU_EVENT(vcpu, 6, "exit sie icptcode %d",
		   vcpu->arch.sie_block->icptcode);
	trace_kvm_s390_sie_exit(vcpu, vcpu->arch.sie_block->icptcode);

	if (guestdbg_enabled(vcpu))
		kvm_s390_restore_guest_per_regs(vcpu);

	if (exit_reason >= 0) {
		rc = 0;
	} else if (kvm_is_ucontrol(vcpu->kvm)) {
		vcpu->run->exit_reason = KVM_EXIT_S390_UCONTROL;
		vcpu->run->s390_ucontrol.trans_exc_code =
						current->thread.gmap_addr;
		vcpu->run->s390_ucontrol.pgm_code = 0x10;
		rc = -EREMOTE;

	} else if (current->thread.gmap_pfault) {
		trace_kvm_s390_major_guest_pfault(vcpu);
		current->thread.gmap_pfault = 0;
		if (kvm_arch_setup_async_pf(vcpu)) {
			rc = 0;
		} else {
			gpa_t gpa = current->thread.gmap_addr;
			rc = kvm_arch_fault_in_page(vcpu, gpa, 1);
		}
	}

	if (rc == -1)
		rc = vcpu_post_run_fault_in_sie(vcpu);

	memcpy(&vcpu->run->s.regs.gprs[14], &vcpu->arch.sie_block->gg14, 16);

	if (rc == 0) {
		if (kvm_is_ucontrol(vcpu->kvm))
			/* Don't exit for host interrupts. */
			rc = vcpu->arch.sie_block->icptcode ? -EOPNOTSUPP : 0;
		else
			rc = kvm_handle_sie_intercept(vcpu);
	}

	return rc;
}

static int __vcpu_run(struct kvm_vcpu *vcpu)
{
	int rc, exit_reason;

	/*
	 * We try to hold kvm->srcu during most of vcpu_run (except when run-
	 * ning the guest), so that memslots (and other stuff) are protected
	 */
	vcpu->srcu_idx = srcu_read_lock(&vcpu->kvm->srcu);

	do {
		rc = vcpu_pre_run(vcpu);
		if (rc)
			break;

		srcu_read_unlock(&vcpu->kvm->srcu, vcpu->srcu_idx);
		/*
		 * As PF_VCPU will be used in the fault handler, there must
		 * be no uaccess between guest_enter and guest_exit.
		 */
		preempt_disable();
		kvm_guest_enter();
		preempt_enable();
		exit_reason = sie64a(vcpu->arch.sie_block,
				     vcpu->run->s.regs.gprs);
		kvm_guest_exit();
		vcpu->srcu_idx = srcu_read_lock(&vcpu->kvm->srcu);

		rc = vcpu_post_run(vcpu, exit_reason);
	} while (!signal_pending(current) && !guestdbg_exit_pending(vcpu) && !rc);

	srcu_read_unlock(&vcpu->kvm->srcu, vcpu->srcu_idx);
	return rc;
}

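/*
 * sync_regs/store_regs shuttle the register state that is shared with
 * userspace through kvm_run: sync_regs copies the pieces userspace marked
 * dirty into the SIE block before running, store_regs writes the current
 * state back afterwards.
 */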
2011 static void sync_regs(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run)
2012 {
2013 vcpu->arch.sie_block->gpsw.mask = kvm_run->psw_mask;
2014 vcpu->arch.sie_block->gpsw.addr = kvm_run->psw_addr;
2015 if (kvm_run->kvm_dirty_regs & KVM_SYNC_PREFIX)
2016 kvm_s390_set_prefix(vcpu, kvm_run->s.regs.prefix);
2017 if (kvm_run->kvm_dirty_regs & KVM_SYNC_CRS) {
2018 memcpy(&vcpu->arch.sie_block->gcr, &kvm_run->s.regs.crs, 128);
2019 /* some control register changes require a tlb flush */
2020 kvm_make_request(KVM_REQ_TLB_FLUSH, vcpu);
2021 }
2022 if (kvm_run->kvm_dirty_regs & KVM_SYNC_ARCH0) {
2023 vcpu->arch.sie_block->cputm = kvm_run->s.regs.cputm;
2024 vcpu->arch.sie_block->ckc = kvm_run->s.regs.ckc;
2025 vcpu->arch.sie_block->todpr = kvm_run->s.regs.todpr;
2026 vcpu->arch.sie_block->pp = kvm_run->s.regs.pp;
2027 vcpu->arch.sie_block->gbea = kvm_run->s.regs.gbea;
2028 }
2029 if (kvm_run->kvm_dirty_regs & KVM_SYNC_PFAULT) {
2030 vcpu->arch.pfault_token = kvm_run->s.regs.pft;
2031 vcpu->arch.pfault_select = kvm_run->s.regs.pfs;
2032 vcpu->arch.pfault_compare = kvm_run->s.regs.pfc;
2033 if (vcpu->arch.pfault_token == KVM_S390_PFAULT_TOKEN_INVALID)
2034 kvm_clear_async_pf_completion_queue(vcpu);
2035 }
2036 kvm_run->kvm_dirty_regs = 0;
2037 }
2038
2039 static void store_regs(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run)
2040 {
2041 kvm_run->psw_mask = vcpu->arch.sie_block->gpsw.mask;
2042 kvm_run->psw_addr = vcpu->arch.sie_block->gpsw.addr;
2043 kvm_run->s.regs.prefix = kvm_s390_get_prefix(vcpu);
2044 memcpy(&kvm_run->s.regs.crs, &vcpu->arch.sie_block->gcr, 128);
2045 kvm_run->s.regs.cputm = vcpu->arch.sie_block->cputm;
2046 kvm_run->s.regs.ckc = vcpu->arch.sie_block->ckc;
2047 kvm_run->s.regs.todpr = vcpu->arch.sie_block->todpr;
2048 kvm_run->s.regs.pp = vcpu->arch.sie_block->pp;
2049 kvm_run->s.regs.gbea = vcpu->arch.sie_block->gbea;
2050 kvm_run->s.regs.pft = vcpu->arch.pfault_token;
2051 kvm_run->s.regs.pfs = vcpu->arch.pfault_select;
2052 kvm_run->s.regs.pfc = vcpu->arch.pfault_compare;
2053 }
2054
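/*
 * Hypothetical userspace sketch (vcpu_fd and new_prefix are assumed
 * names): a VMM marks the synced registers it modified so that
 * sync_regs() above copies them into the SIE block on the next
 * KVM_RUN, and store_regs() mirrors the state back afterwards:
 *
 *	struct kvm_run *run;	// mmap'ed per-vcpu run area
 *
 *	run->s.regs.prefix = new_prefix;
 *	run->kvm_dirty_regs |= KVM_SYNC_PREFIX;
 *	ioctl(vcpu_fd, KVM_RUN, 0);
 */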
2055 int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run)
2056 {
2057 int rc;
2058 sigset_t sigsaved;
2059
2060 if (guestdbg_exit_pending(vcpu)) {
2061 kvm_s390_prepare_debug_exit(vcpu);
2062 return 0;
2063 }
2064
2065 if (!kvm_s390_user_cpu_state_ctrl(vcpu->kvm)) {
2066 kvm_s390_vcpu_start(vcpu);
2067 } else if (is_vcpu_stopped(vcpu)) {
2068 pr_err_ratelimited("kvm-s390: can't run stopped vcpu %d\n",
2069 vcpu->vcpu_id);
2070 return -EINVAL;
2071 }
2072 
2073 if (vcpu->sigset_active)
2074 sigprocmask(SIG_SETMASK, &vcpu->sigset, &sigsaved);
2075
2076 sync_regs(vcpu, kvm_run);
2077
2078 might_fault();
2079 rc = __vcpu_run(vcpu);
2080
2081 if (signal_pending(current) && !rc) {
2082 kvm_run->exit_reason = KVM_EXIT_INTR;
2083 rc = -EINTR;
2084 }
2085
2086 if (guestdbg_exit_pending(vcpu) && !rc) {
2087 kvm_s390_prepare_debug_exit(vcpu);
2088 rc = 0;
2089 }
2090
2091 if (rc == -EOPNOTSUPP) {
2092 /* intercept cannot be handled in-kernel, prepare kvm-run */
2093 kvm_run->exit_reason = KVM_EXIT_S390_SIEIC;
2094 kvm_run->s390_sieic.icptcode = vcpu->arch.sie_block->icptcode;
2095 kvm_run->s390_sieic.ipa = vcpu->arch.sie_block->ipa;
2096 kvm_run->s390_sieic.ipb = vcpu->arch.sie_block->ipb;
2097 rc = 0;
2098 }
2099
2100 if (rc == -EREMOTE) {
2101 /* Intercept was handled, but userspace support is needed;
2102 * kvm_run has been prepared by the handler. */
2103 rc = 0;
2104 }
2105
2106 store_regs(vcpu, kvm_run);
2107
2108 if (vcpu->sigset_active)
2109 sigprocmask(SIG_SETMASK, &sigsaved, NULL);
2110
2111 vcpu->stat.exit_userspace++;
2112 return rc;
2113 }
2114
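/*
 * Hypothetical userspace sketch (vcpu_fd, run and handle_sieic() are
 * assumed names): the loop this ioctl serves.  An unhandled intercept
 * (-EOPNOTSUPP above) surfaces as KVM_EXIT_S390_SIEIC with
 * icptcode/ipa/ipb filled in:
 *
 *	for (;;) {
 *		if (ioctl(vcpu_fd, KVM_RUN, 0) < 0)
 *			break;		// e.g. interrupted by a signal
 *		if (run->exit_reason == KVM_EXIT_S390_SIEIC)
 *			handle_sieic(run->s390_sieic.icptcode,
 *				     run->s390_sieic.ipa,
 *				     run->s390_sieic.ipb);
 *	}
 */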
2115 /*
2116 * store status at address
2117 * we have two special cases:
2118 * KVM_S390_STORE_STATUS_NOADDR: -> 0x1200 on 64 bit
2119 * KVM_S390_STORE_STATUS_PREFIXED: -> prefix
2120 */
2121 int kvm_s390_store_status_unloaded(struct kvm_vcpu *vcpu, unsigned long gpa)
2122 {
2123 unsigned char archmode = 1;
2124 unsigned int px;
2125 u64 clkcomp;
2126 int rc;
2127
2128 if (gpa == KVM_S390_STORE_STATUS_NOADDR) {
2129 if (write_guest_abs(vcpu, 163, &archmode, 1))
2130 return -EFAULT;
2131 gpa = SAVE_AREA_BASE;
2132 } else if (gpa == KVM_S390_STORE_STATUS_PREFIXED) {
2133 if (write_guest_real(vcpu, 163, &archmode, 1))
2134 return -EFAULT;
2135 gpa = kvm_s390_real_to_abs(vcpu, SAVE_AREA_BASE);
2136 }
2137 rc = write_guest_abs(vcpu, gpa + offsetof(struct save_area, fp_regs),
2138 vcpu->arch.guest_fpregs.fprs, 128);
2139 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, gp_regs),
2140 vcpu->run->s.regs.gprs, 128);
2141 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, psw),
2142 &vcpu->arch.sie_block->gpsw, 16);
2143 px = kvm_s390_get_prefix(vcpu);
2144 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, pref_reg),
2145 &px, 4);
2146 rc |= write_guest_abs(vcpu,
2147 gpa + offsetof(struct save_area, fp_ctrl_reg),
2148 &vcpu->arch.guest_fpregs.fpc, 4);
2149 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, tod_reg),
2150 &vcpu->arch.sie_block->todpr, 4);
2151 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, timer),
2152 &vcpu->arch.sie_block->cputm, 8);
2153 clkcomp = vcpu->arch.sie_block->ckc >> 8;
2154 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, clk_cmp),
2155 &clkcomp, 8);
2156 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, acc_regs),
2157 &vcpu->run->s.regs.acrs, 64);
2158 rc |= write_guest_abs(vcpu, gpa + offsetof(struct save_area, ctrl_regs),
2159 &vcpu->arch.sie_block->gcr, 128);
2160 return rc ? -EFAULT : 0;
2161 }
2162
2163 int kvm_s390_vcpu_store_status(struct kvm_vcpu *vcpu, unsigned long addr)
2164 {
2165 /*
2166 * The guest FPRS and ACRS are in the host FPRS/ACRS due to the lazy
2167 * copying in vcpu load/put. Let's update our copies before we save
2168 * them into the save area.
2169 */
2170 save_fp_ctl(&vcpu->arch.guest_fpregs.fpc);
2171 save_fp_regs(vcpu->arch.guest_fpregs.fprs);
2172 save_access_regs(vcpu->run->s.regs.acrs);
2173
2174 return kvm_s390_store_status_unloaded(vcpu, addr);
2175 }
2176
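/*
 * Hypothetical userspace sketch: a VMM can request a store into the
 * absolute save area or below the current prefix without computing
 * either address itself, using the two special values (documented as
 * -1ul and -2ul) handled above:
 *
 *	ioctl(vcpu_fd, KVM_S390_STORE_STATUS, KVM_S390_STORE_STATUS_NOADDR);
 *	ioctl(vcpu_fd, KVM_S390_STORE_STATUS, KVM_S390_STORE_STATUS_PREFIXED);
 */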
2177 /*
2178 * store additional status at address
2179 */
2180 int kvm_s390_store_adtl_status_unloaded(struct kvm_vcpu *vcpu,
2181 unsigned long gpa)
2182 {
2183 /* Only bits 0-53 are used for address formation */
2184 if (!(gpa & ~0x3ff))
2185 return 0;
2186
2187 return write_guest_abs(vcpu, gpa & ~0x3ff,
2188 (void *)&vcpu->run->s.regs.vrs, 512);
2189 }
2190
2191 int kvm_s390_vcpu_store_adtl_status(struct kvm_vcpu *vcpu, unsigned long addr)
2192 {
2193 if (!test_kvm_facility(vcpu->kvm, 129))
2194 return 0;
2195
2196 /*
2197 * The guest VXRS are in the host VXRS due to the lazy
2198 * copying in vcpu load/put. Let's update our copies before we save
2199 * them into the save area.
2200 */
2201 save_vx_regs((__vector128 *)&vcpu->run->s.regs.vrs);
2202
2203 return kvm_s390_store_adtl_status_unloaded(vcpu, addr);
2204 }
2205
2206 static void __disable_ibs_on_vcpu(struct kvm_vcpu *vcpu)
2207 {
2208 kvm_check_request(KVM_REQ_ENABLE_IBS, vcpu);
2209 kvm_make_request(KVM_REQ_DISABLE_IBS, vcpu);
2210 exit_sie_sync(vcpu);
2211 }
2212
2213 static void __disable_ibs_on_all_vcpus(struct kvm *kvm)
2214 {
2215 unsigned int i;
2216 struct kvm_vcpu *vcpu;
2217
2218 kvm_for_each_vcpu(i, vcpu, kvm) {
2219 __disable_ibs_on_vcpu(vcpu);
2220 }
2221 }
2222
2223 static void __enable_ibs_on_vcpu(struct kvm_vcpu *vcpu)
2224 {
2225 kvm_check_request(KVM_REQ_DISABLE_IBS, vcpu);
2226 kvm_make_request(KVM_REQ_ENABLE_IBS, vcpu);
2227 exit_sie_sync(vcpu);
2228 }
2229
2230 void kvm_s390_vcpu_start(struct kvm_vcpu *vcpu)
2231 {
2232 int i, online_vcpus, started_vcpus = 0;
2233
2234 if (!is_vcpu_stopped(vcpu))
2235 return;
2236
2237 trace_kvm_s390_vcpu_start_stop(vcpu->vcpu_id, 1);
2238 /* Only one cpu at a time may enter/leave the STOPPED state. */
2239 spin_lock(&vcpu->kvm->arch.start_stop_lock);
2240 online_vcpus = atomic_read(&vcpu->kvm->online_vcpus);
2241
2242 for (i = 0; i < online_vcpus; i++) {
2243 if (!is_vcpu_stopped(vcpu->kvm->vcpus[i]))
2244 started_vcpus++;
2245 }
2246
2247 if (started_vcpus == 0) {
2248 /* we're the only active VCPU -> speed it up */
2249 __enable_ibs_on_vcpu(vcpu);
2250 } else if (started_vcpus == 1) {
2251 /*
2252 * As we are starting a second VCPU, we have to disable
2253 * the IBS facility on all VCPUs to remove potentially
2254 * outstanding ENABLE requests.
2255 */
2256 __disable_ibs_on_all_vcpus(vcpu->kvm);
2257 }
2258
2259 atomic_clear_mask(CPUSTAT_STOPPED, &vcpu->arch.sie_block->cpuflags);
2260 /*
2261 * Another VCPU might have used IBS while we were offline.
2262 * Let's play safe and flush the VCPU at startup.
2263 */
2264 kvm_make_request(KVM_REQ_TLB_FLUSH, vcpu);
2265 spin_unlock(&vcpu->kvm->arch.start_stop_lock);
2266 return;
2267 }
2268
2269 void kvm_s390_vcpu_stop(struct kvm_vcpu *vcpu)
2270 {
2271 int i, online_vcpus, started_vcpus = 0;
2272 struct kvm_vcpu *started_vcpu = NULL;
2273
2274 if (is_vcpu_stopped(vcpu))
2275 return;
2276
2277 trace_kvm_s390_vcpu_start_stop(vcpu->vcpu_id, 0);
2278 /* Only one cpu at a time may enter/leave the STOPPED state. */
2279 spin_lock(&vcpu->kvm->arch.start_stop_lock);
2280 online_vcpus = atomic_read(&vcpu->kvm->online_vcpus);
2281
2282 /* SIGP STOP and SIGP STOP AND STORE STATUS have been fully processed */
2283 kvm_s390_clear_stop_irq(vcpu);
2284
2285 atomic_set_mask(CPUSTAT_STOPPED, &vcpu->arch.sie_block->cpuflags);
2286 __disable_ibs_on_vcpu(vcpu);
2287
2288 for (i = 0; i < online_vcpus; i++) {
2289 if (!is_vcpu_stopped(vcpu->kvm->vcpus[i])) {
2290 started_vcpus++;
2291 started_vcpu = vcpu->kvm->vcpus[i];
2292 }
2293 }
2294
2295 if (started_vcpus == 1) {
2296 /*
2297 * As we only have one VCPU left, we want to enable the
2298 * IBS facility for that VCPU to speed it up.
2299 */
2300 __enable_ibs_on_vcpu(started_vcpu);
2301 }
2302
2303 spin_unlock(&vcpu->kvm->arch.start_stop_lock);
2304 return;
2305 }
2306
2307 static int kvm_vcpu_ioctl_enable_cap(struct kvm_vcpu *vcpu,
2308 struct kvm_enable_cap *cap)
2309 {
2310 int r;
2311
2312 if (cap->flags)
2313 return -EINVAL;
2314
2315 switch (cap->cap) {
2316 case KVM_CAP_S390_CSS_SUPPORT:
2317 if (!vcpu->kvm->arch.css_support) {
2318 vcpu->kvm->arch.css_support = 1;
2319 trace_kvm_s390_enable_css(vcpu->kvm);
2320 }
2321 r = 0;
2322 break;
2323 default:
2324 r = -EINVAL;
2325 break;
2326 }
2327 return r;
2328 }
2329
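/*
 * Hypothetical userspace sketch: enabling the CSS support capability
 * handled above; flags must be zero:
 *
 *	struct kvm_enable_cap cap = {
 *		.cap = KVM_CAP_S390_CSS_SUPPORT,
 *	};
 *
 *	ioctl(vcpu_fd, KVM_ENABLE_CAP, &cap);
 */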
2330 static long kvm_s390_guest_mem_op(struct kvm_vcpu *vcpu,
2331 struct kvm_s390_mem_op *mop)
2332 {
2333 void __user *uaddr = (void __user *)mop->buf;
2334 void *tmpbuf = NULL;
2335 int r, srcu_idx;
2336 const u64 supported_flags = KVM_S390_MEMOP_F_INJECT_EXCEPTION
2337 | KVM_S390_MEMOP_F_CHECK_ONLY;
2338
2339 if (mop->flags & ~supported_flags)
2340 return -EINVAL;
2341
2342 if (mop->size > MEM_OP_MAX_SIZE)
2343 return -E2BIG;
2344
2345 if (!(mop->flags & KVM_S390_MEMOP_F_CHECK_ONLY)) {
2346 tmpbuf = vmalloc(mop->size);
2347 if (!tmpbuf)
2348 return -ENOMEM;
2349 }
2350
2351 srcu_idx = srcu_read_lock(&vcpu->kvm->srcu);
2352
2353 switch (mop->op) {
2354 case KVM_S390_MEMOP_LOGICAL_READ:
2355 if (mop->flags & KVM_S390_MEMOP_F_CHECK_ONLY) {
2356 r = check_gva_range(vcpu, mop->gaddr, mop->ar, mop->size, false);
2357 break;
2358 }
2359 r = read_guest(vcpu, mop->gaddr, mop->ar, tmpbuf, mop->size);
2360 if (r == 0) {
2361 if (copy_to_user(uaddr, tmpbuf, mop->size))
2362 r = -EFAULT;
2363 }
2364 break;
2365 case KVM_S390_MEMOP_LOGICAL_WRITE:
2366 if (mop->flags & KVM_S390_MEMOP_F_CHECK_ONLY) {
2367 r = check_gva_range(vcpu, mop->gaddr, mop->ar, mop->size, true);
2368 break;
2369 }
2370 if (copy_from_user(tmpbuf, uaddr, mop->size)) {
2371 r = -EFAULT;
2372 break;
2373 }
2374 r = write_guest(vcpu, mop->gaddr, mop->ar, tmpbuf, mop->size);
2375 break;
2376 default:
2377 r = -EINVAL;
2378 }
2379
2380 srcu_read_unlock(&vcpu->kvm->srcu, srcu_idx);
2381
2382 if (r > 0 && (mop->flags & KVM_S390_MEMOP_F_INJECT_EXCEPTION) != 0)
2383 kvm_s390_inject_prog_irq(vcpu, &vcpu->arch.pgm);
2384
2385 vfree(tmpbuf);
2386 return r;
2387 }
2388
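/*
 * Hypothetical userspace sketch (vcpu_fd and gaddr are assumed names):
 * reading guest memory through the KVM_S390_MEM_OP ioctl served above.
 * A negative return is an errno; a positive one is the program
 * interruption code of a guest access exception:
 *
 *	__u8 buf[256];
 *	struct kvm_s390_mem_op op = {
 *		.gaddr = gaddr,			// guest logical address
 *		.size  = sizeof(buf),
 *		.op    = KVM_S390_MEMOP_LOGICAL_READ,
 *		.buf   = (__u64)(unsigned long)buf,
 *		.ar    = 0,			// access register number
 *	};
 *
 *	int r = ioctl(vcpu_fd, KVM_S390_MEM_OP, &op);
 */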
2389 long kvm_arch_vcpu_ioctl(struct file *filp,
2390 unsigned int ioctl, unsigned long arg)
2391 {
2392 struct kvm_vcpu *vcpu = filp->private_data;
2393 void __user *argp = (void __user *)arg;
2394 int idx;
2395 long r;
2396
2397 switch (ioctl) {
2398 case KVM_S390_IRQ: {
2399 struct kvm_s390_irq s390irq;
2400
2401 r = -EFAULT;
2402 if (copy_from_user(&s390irq, argp, sizeof(s390irq)))
2403 break;
2404 r = kvm_s390_inject_vcpu(vcpu, &s390irq);
2405 break;
2406 }
2407 case KVM_S390_INTERRUPT: {
2408 struct kvm_s390_interrupt s390int;
2409 struct kvm_s390_irq s390irq;
2410
2411 r = -EFAULT;
2412 if (copy_from_user(&s390int, argp, sizeof(s390int)))
2413 break;
2414 if (s390int_to_s390irq(&s390int, &s390irq))
2415 return -EINVAL;
2416 r = kvm_s390_inject_vcpu(vcpu, &s390irq);
2417 break;
2418 }
2419 case KVM_S390_STORE_STATUS:
2420 idx = srcu_read_lock(&vcpu->kvm->srcu);
2421 r = kvm_s390_vcpu_store_status(vcpu, arg);
2422 srcu_read_unlock(&vcpu->kvm->srcu, idx);
2423 break;
2424 case KVM_S390_SET_INITIAL_PSW: {
2425 psw_t psw;
2426
2427 r = -EFAULT;
2428 if (copy_from_user(&psw, argp, sizeof(psw)))
2429 break;
2430 r = kvm_arch_vcpu_ioctl_set_initial_psw(vcpu, psw);
2431 break;
2432 }
2433 case KVM_S390_INITIAL_RESET:
2434 r = kvm_arch_vcpu_ioctl_initial_reset(vcpu);
2435 break;
2436 case KVM_SET_ONE_REG:
2437 case KVM_GET_ONE_REG: {
2438 struct kvm_one_reg reg;
2439 r = -EFAULT;
2440 if (copy_from_user(&reg, argp, sizeof(reg)))
2441 break;
2442 if (ioctl == KVM_SET_ONE_REG)
2443 r = kvm_arch_vcpu_ioctl_set_one_reg(vcpu, &reg);
2444 else
2445 r = kvm_arch_vcpu_ioctl_get_one_reg(vcpu, &reg);
2446 break;
2447 }
2448 #ifdef CONFIG_KVM_S390_UCONTROL
2449 case KVM_S390_UCAS_MAP: {
2450 struct kvm_s390_ucas_mapping ucasmap;
2451
2452 if (copy_from_user(&ucasmap, argp, sizeof(ucasmap))) {
2453 r = -EFAULT;
2454 break;
2455 }
2456
2457 if (!kvm_is_ucontrol(vcpu->kvm)) {
2458 r = -EINVAL;
2459 break;
2460 }
2461
2462 r = gmap_map_segment(vcpu->arch.gmap, ucasmap.user_addr,
2463 ucasmap.vcpu_addr, ucasmap.length);
2464 break;
2465 }
2466 case KVM_S390_UCAS_UNMAP: {
2467 struct kvm_s390_ucas_mapping ucasmap;
2468
2469 if (copy_from_user(&ucasmap, argp, sizeof(ucasmap))) {
2470 r = -EFAULT;
2471 break;
2472 }
2473
2474 if (!kvm_is_ucontrol(vcpu->kvm)) {
2475 r = -EINVAL;
2476 break;
2477 }
2478
2479 r = gmap_unmap_segment(vcpu->arch.gmap, ucasmap.vcpu_addr,
2480 ucasmap.length);
2481 break;
2482 }
2483 #endif
2484 case KVM_S390_VCPU_FAULT: {
2485 r = gmap_fault(vcpu->arch.gmap, arg, 0);
2486 break;
2487 }
2488 case KVM_ENABLE_CAP:
2489 {
2490 struct kvm_enable_cap cap;
2491 r = -EFAULT;
2492 if (copy_from_user(&cap, argp, sizeof(cap)))
2493 break;
2494 r = kvm_vcpu_ioctl_enable_cap(vcpu, &cap);
2495 break;
2496 }
2497 case KVM_S390_MEM_OP: {
2498 struct kvm_s390_mem_op mem_op;
2499
2500 if (copy_from_user(&mem_op, argp, sizeof(mem_op)) == 0)
2501 r = kvm_s390_guest_mem_op(vcpu, &mem_op);
2502 else
2503 r = -EFAULT;
2504 break;
2505 }
2506 case KVM_S390_SET_IRQ_STATE: {
2507 struct kvm_s390_irq_state irq_state;
2508
2509 r = -EFAULT;
2510 if (copy_from_user(&irq_state, argp, sizeof(irq_state)))
2511 break;
2512 if (irq_state.len > VCPU_IRQS_MAX_BUF ||
2513 irq_state.len == 0 ||
2514 irq_state.len % sizeof(struct kvm_s390_irq) > 0) {
2515 r = -EINVAL;
2516 break;
2517 }
2518 r = kvm_s390_set_irq_state(vcpu,
2519 (void __user *) irq_state.buf,
2520 irq_state.len);
2521 break;
2522 }
2523 case KVM_S390_GET_IRQ_STATE: {
2524 struct kvm_s390_irq_state irq_state;
2525
2526 r = -EFAULT;
2527 if (copy_from_user(&irq_state, argp, sizeof(irq_state)))
2528 break;
2529 if (irq_state.len == 0) {
2530 r = -EINVAL;
2531 break;
2532 }
2533 r = kvm_s390_get_irq_state(vcpu,
2534 (__u8 __user *) irq_state.buf,
2535 irq_state.len);
2536 break;
2537 }
2538 default:
2539 r = -ENOTTY;
2540 }
2541 return r;
2542 }
2543
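/*
 * Hypothetical userspace sketch for the two irq-state ioctls above,
 * e.g. to migrate the local interrupt state; len is in bytes and must
 * be a multiple of sizeof(struct kvm_s390_irq).  GET is assumed here
 * to return the number of bytes stored on success:
 *
 *	struct kvm_s390_irq irqs[64];
 *	struct kvm_s390_irq_state state = {
 *		.buf = (__u64)(unsigned long)irqs,
 *		.len = sizeof(irqs),
 *	};
 *
 *	int n = ioctl(vcpu_fd, KVM_S390_GET_IRQ_STATE, &state);
 *	// ... transfer irqs[] to the target host, then there:
 *	state.len = n;
 *	ioctl(vcpu_fd, KVM_S390_SET_IRQ_STATE, &state);
 */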
2544 int kvm_arch_vcpu_fault(struct kvm_vcpu *vcpu, struct vm_fault *vmf)
2545 {
2546 #ifdef CONFIG_KVM_S390_UCONTROL
2547 if ((vmf->pgoff == KVM_S390_SIE_PAGE_OFFSET)
2548 && (kvm_is_ucontrol(vcpu->kvm))) {
2549 vmf->page = virt_to_page(vcpu->arch.sie_block);
2550 get_page(vmf->page);
2551 return 0;
2552 }
2553 #endif
2554 return VM_FAULT_SIGBUS;
2555 }
2556
2557 int kvm_arch_create_memslot(struct kvm *kvm, struct kvm_memory_slot *slot,
2558 unsigned long npages)
2559 {
2560 return 0;
2561 }
2562
2563 /* Section: memory related */
2564 int kvm_arch_prepare_memory_region(struct kvm *kvm,
2565 struct kvm_memory_slot *memslot,
2566 struct kvm_userspace_memory_region *mem,
2567 enum kvm_mr_change change)
2568 {
2569 /* A few sanity checks. Memory slots have to start and end on a
2570 segment boundary (1 MB). The memory in userland may be fragmented
2571 across different VMAs, and it is fine to mmap() and munmap()
2572 in this slot at any time after this call. */
2573
2574 if (mem->userspace_addr & 0xffffful)
2575 return -EINVAL;
2576
2577 if (mem->memory_size & 0xffffful)
2578 return -EINVAL;
2579
2580 return 0;
2581 }
2582
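/*
 * Hypothetical userspace sketch (vm_fd and mem are assumed names): a
 * slot that passes the 1 MB alignment checks above.  mem must itself
 * point to 1 MB aligned backing, e.g. from a suitably aligned mmap():
 *
 *	struct kvm_userspace_memory_region region = {
 *		.slot            = 0,
 *		.guest_phys_addr = 0,
 *		.memory_size     = 256 << 20,	// multiple of 1 MB
 *		.userspace_addr  = (__u64)(unsigned long)mem,
 *	};
 *
 *	ioctl(vm_fd, KVM_SET_USER_MEMORY_REGION, &region);
 */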
2583 void kvm_arch_commit_memory_region(struct kvm *kvm,
2584 struct kvm_userspace_memory_region *mem,
2585 const struct kvm_memory_slot *old,
2586 enum kvm_mr_change change)
2587 {
2588 int rc;
2589
2590 /* If the basics of the memslot do not change, we do not want
2591 * to update the gmap. Every update causes several unnecessary
2592 * segment translation exceptions. This is usually handled just
2593 * fine by the normal fault handler + gmap, but it will also
2594 * cause faults on the prefix page of running guest CPUs.
2595 */
2596 if (old->userspace_addr == mem->userspace_addr &&
2597 old->base_gfn * PAGE_SIZE == mem->guest_phys_addr &&
2598 old->npages * PAGE_SIZE == mem->memory_size)
2599 return;
2600
2601 rc = gmap_map_segment(kvm->arch.gmap, mem->userspace_addr,
2602 mem->guest_phys_addr, mem->memory_size);
2603 if (rc)
2604 printk(KERN_WARNING "kvm-s390: failed to commit memory region\n");
2605 return;
2606 }
2607
2608 static int __init kvm_s390_init(void)
2609 {
2610 return kvm_init(NULL, sizeof(struct kvm_vcpu), 0, THIS_MODULE);
2611 }
2612
2613 static void __exit kvm_s390_exit(void)
2614 {
2615 kvm_exit();
2616 }
2617
2618 module_init(kvm_s390_init);
2619 module_exit(kvm_s390_exit);
2620
2621 /*
2622 * Enable autoloading of the kvm module.
2623 * Note that we add the module alias here instead of virt/kvm/kvm_main.c
2624 * since x86 takes a different approach.
2625 */
2626 #include <linux/miscdevice.h>
2627 MODULE_ALIAS_MISCDEV(KVM_MINOR);
2628 MODULE_ALIAS("devname:kvm");