KVM: s390: move vcpu wakeup code to a central point
[pandora-kernel.git] / arch / s390 / kvm / interrupt.c
1 /*
2  * handling kvm guest interrupts
3  *
4  * Copyright IBM Corp. 2008,2014
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License (version 2 only)
8  * as published by the Free Software Foundation.
9  *
10  *    Author(s): Carsten Otte <cotte@de.ibm.com>
11  */
12
13 #include <linux/interrupt.h>
14 #include <linux/kvm_host.h>
15 #include <linux/hrtimer.h>
16 #include <linux/mmu_context.h>
17 #include <linux/signal.h>
18 #include <linux/slab.h>
19 #include <asm/asm-offsets.h>
20 #include <asm/uaccess.h>
21 #include "kvm-s390.h"
22 #include "gaccess.h"
23 #include "trace-s390.h"
24
/*
 * Bit masks for I/O interrupt identification.
 * NOTE(review): going by the names these select the subchannel number,
 * subchannel-set id, channel-subsystem id and an adapter-interrupt flag;
 * their users are not visible in this part of the file -- confirm the
 * field layout against the callers.
 */
25 #define IOINT_SCHID_MASK 0x0000ffff
26 #define IOINT_SSID_MASK 0x00030000
27 #define IOINT_CSSID_MASK 0x03fc0000
28 #define IOINT_AI_MASK 0x04000000
29
30 static void deliver_ckc_interrupt(struct kvm_vcpu *vcpu);
31
/*
 * Classify an interrupt type value.
 *
 * Returns 0 when every bit selected by 0xfffe0000 is set in @type and
 * nonzero (1) otherwise; the caller treats the latter as an I/O interrupt.
 */
static int is_ioint(u64 type)
{
	const u64 non_io_pattern = 0xfffe0000u;

	if ((type & non_io_pattern) == non_io_pattern)
		return 0;
	return 1;
}
36
37 int psw_extint_disabled(struct kvm_vcpu *vcpu)
38 {
39         return !(vcpu->arch.sie_block->gpsw.mask & PSW_MASK_EXT);
40 }
41
42 static int psw_ioint_disabled(struct kvm_vcpu *vcpu)
43 {
44         return !(vcpu->arch.sie_block->gpsw.mask & PSW_MASK_IO);
45 }
46
47 static int psw_mchk_disabled(struct kvm_vcpu *vcpu)
48 {
49         return !(vcpu->arch.sie_block->gpsw.mask & PSW_MASK_MCHECK);
50 }
51
52 static int psw_interrupts_disabled(struct kvm_vcpu *vcpu)
53 {
54         if ((vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PER) ||
55             (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_IO) ||
56             (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_EXT))
57                 return 0;
58         return 1;
59 }
60
61 static int ckc_interrupts_enabled(struct kvm_vcpu *vcpu)
62 {
63         if (psw_extint_disabled(vcpu) ||
64             !(vcpu->arch.sie_block->gcr[0] & 0x800ul))
65                 return 0;
66         if (guestdbg_enabled(vcpu) && guestdbg_sstep_enabled(vcpu))
67                 /* No timer interrupts when single stepping */
68                 return 0;
69         return 1;
70 }
71
/*
 * Convert an I/O interruption word into the bit that has to be set in guest
 * CR6 for the interrupt to be enabled.
 *
 * The three bits selected by 0x38000000 form the interruption subclass
 * (isc, 0..7); isc 0 maps to bit 0x80000000, isc 7 to bit 0x01000000.
 *
 * The shift is done on an unsigned 64-bit value: with a plain int,
 * 0x80 << 24 overflows into the sign bit and the result is sign-extended
 * to 0xffffffff80000000 when widened to u64, which would also match bits
 * in the upper half of the control register.
 */
static u64 int_word_to_isc_bits(u32 int_word)
{
	u8 isc = (int_word & 0x38000000) >> 27;

	return (u64)(0x80u >> isc) << 24;
}
78
79 static int __interrupt_is_deliverable(struct kvm_vcpu *vcpu,
80                                       struct kvm_s390_interrupt_info *inti)
81 {
82         switch (inti->type) {
83         case KVM_S390_INT_EXTERNAL_CALL:
84                 if (psw_extint_disabled(vcpu))
85                         return 0;
86                 if (vcpu->arch.sie_block->gcr[0] & 0x2000ul)
87                         return 1;
88         case KVM_S390_INT_EMERGENCY:
89                 if (psw_extint_disabled(vcpu))
90                         return 0;
91                 if (vcpu->arch.sie_block->gcr[0] & 0x4000ul)
92                         return 1;
93                 return 0;
94         case KVM_S390_INT_CLOCK_COMP:
95                 return ckc_interrupts_enabled(vcpu);
96         case KVM_S390_INT_CPU_TIMER:
97                 if (psw_extint_disabled(vcpu))
98                         return 0;
99                 if (vcpu->arch.sie_block->gcr[0] & 0x400ul)
100                         return 1;
101                 return 0;
102         case KVM_S390_INT_SERVICE:
103         case KVM_S390_INT_PFAULT_INIT:
104         case KVM_S390_INT_PFAULT_DONE:
105         case KVM_S390_INT_VIRTIO:
106                 if (psw_extint_disabled(vcpu))
107                         return 0;
108                 if (vcpu->arch.sie_block->gcr[0] & 0x200ul)
109                         return 1;
110                 return 0;
111         case KVM_S390_PROGRAM_INT:
112         case KVM_S390_SIGP_STOP:
113         case KVM_S390_SIGP_SET_PREFIX:
114         case KVM_S390_RESTART:
115                 return 1;
116         case KVM_S390_MCHK:
117                 if (psw_mchk_disabled(vcpu))
118                         return 0;
119                 if (vcpu->arch.sie_block->gcr[14] & inti->mchk.cr14)
120                         return 1;
121                 return 0;
122         case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
123                 if (psw_ioint_disabled(vcpu))
124                         return 0;
125                 if (vcpu->arch.sie_block->gcr[6] &
126                     int_word_to_isc_bits(inti->io.io_int_word))
127                         return 1;
128                 return 0;
129         default:
130                 printk(KERN_WARNING "illegal interrupt type %llx\n",
131                        inti->type);
132                 BUG();
133         }
134         return 0;
135 }
136
137 static void __set_cpu_idle(struct kvm_vcpu *vcpu)
138 {
139         atomic_set_mask(CPUSTAT_WAIT, &vcpu->arch.sie_block->cpuflags);
140         set_bit(vcpu->vcpu_id, vcpu->arch.local_int.float_int->idle_mask);
141 }
142
143 static void __unset_cpu_idle(struct kvm_vcpu *vcpu)
144 {
145         atomic_clear_mask(CPUSTAT_WAIT, &vcpu->arch.sie_block->cpuflags);
146         clear_bit(vcpu->vcpu_id, vcpu->arch.local_int.float_int->idle_mask);
147 }
148
149 static void __reset_intercept_indicators(struct kvm_vcpu *vcpu)
150 {
151         atomic_clear_mask(CPUSTAT_IO_INT | CPUSTAT_EXT_INT | CPUSTAT_STOP_INT,
152                           &vcpu->arch.sie_block->cpuflags);
153         vcpu->arch.sie_block->lctl = 0x0000;
154         vcpu->arch.sie_block->ictl &= ~(ICTL_LPSW | ICTL_STCTL | ICTL_PINT);
155
156         if (guestdbg_enabled(vcpu)) {
157                 vcpu->arch.sie_block->lctl |= (LCTL_CR0 | LCTL_CR9 |
158                                                LCTL_CR10 | LCTL_CR11);
159                 vcpu->arch.sie_block->ictl |= (ICTL_STCTL | ICTL_PINT);
160         }
161 }
162
163 static void __set_cpuflag(struct kvm_vcpu *vcpu, u32 flag)
164 {
165         atomic_set_mask(flag, &vcpu->arch.sie_block->cpuflags);
166 }
167
168 static void __set_intercept_indicator(struct kvm_vcpu *vcpu,
169                                       struct kvm_s390_interrupt_info *inti)
170 {
171         switch (inti->type) {
172         case KVM_S390_INT_EXTERNAL_CALL:
173         case KVM_S390_INT_EMERGENCY:
174         case KVM_S390_INT_SERVICE:
175         case KVM_S390_INT_PFAULT_INIT:
176         case KVM_S390_INT_PFAULT_DONE:
177         case KVM_S390_INT_VIRTIO:
178         case KVM_S390_INT_CLOCK_COMP:
179         case KVM_S390_INT_CPU_TIMER:
180                 if (psw_extint_disabled(vcpu))
181                         __set_cpuflag(vcpu, CPUSTAT_EXT_INT);
182                 else
183                         vcpu->arch.sie_block->lctl |= LCTL_CR0;
184                 break;
185         case KVM_S390_SIGP_STOP:
186                 __set_cpuflag(vcpu, CPUSTAT_STOP_INT);
187                 break;
188         case KVM_S390_MCHK:
189                 if (psw_mchk_disabled(vcpu))
190                         vcpu->arch.sie_block->ictl |= ICTL_LPSW;
191                 else
192                         vcpu->arch.sie_block->lctl |= LCTL_CR14;
193                 break;
194         case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
195                 if (psw_ioint_disabled(vcpu))
196                         __set_cpuflag(vcpu, CPUSTAT_IO_INT);
197                 else
198                         vcpu->arch.sie_block->lctl |= LCTL_CR6;
199                 break;
200         default:
201                 BUG();
202         }
203 }
204
205 static int __deliver_prog_irq(struct kvm_vcpu *vcpu,
206                               struct kvm_s390_pgm_info *pgm_info)
207 {
208         const unsigned short table[] = { 2, 4, 4, 6 };
209         int rc = 0;
210
211         switch (pgm_info->code & ~PGM_PER) {
212         case PGM_AFX_TRANSLATION:
213         case PGM_ASX_TRANSLATION:
214         case PGM_EX_TRANSLATION:
215         case PGM_LFX_TRANSLATION:
216         case PGM_LSTE_SEQUENCE:
217         case PGM_LSX_TRANSLATION:
218         case PGM_LX_TRANSLATION:
219         case PGM_PRIMARY_AUTHORITY:
220         case PGM_SECONDARY_AUTHORITY:
221         case PGM_SPACE_SWITCH:
222                 rc = put_guest_lc(vcpu, pgm_info->trans_exc_code,
223                                   (u64 *)__LC_TRANS_EXC_CODE);
224                 break;
225         case PGM_ALEN_TRANSLATION:
226         case PGM_ALE_SEQUENCE:
227         case PGM_ASTE_INSTANCE:
228         case PGM_ASTE_SEQUENCE:
229         case PGM_ASTE_VALIDITY:
230         case PGM_EXTENDED_AUTHORITY:
231                 rc = put_guest_lc(vcpu, pgm_info->exc_access_id,
232                                   (u8 *)__LC_EXC_ACCESS_ID);
233                 break;
234         case PGM_ASCE_TYPE:
235         case PGM_PAGE_TRANSLATION:
236         case PGM_REGION_FIRST_TRANS:
237         case PGM_REGION_SECOND_TRANS:
238         case PGM_REGION_THIRD_TRANS:
239         case PGM_SEGMENT_TRANSLATION:
240                 rc = put_guest_lc(vcpu, pgm_info->trans_exc_code,
241                                   (u64 *)__LC_TRANS_EXC_CODE);
242                 rc |= put_guest_lc(vcpu, pgm_info->exc_access_id,
243                                    (u8 *)__LC_EXC_ACCESS_ID);
244                 rc |= put_guest_lc(vcpu, pgm_info->op_access_id,
245                                    (u8 *)__LC_OP_ACCESS_ID);
246                 break;
247         case PGM_MONITOR:
248                 rc = put_guest_lc(vcpu, pgm_info->mon_class_nr,
249                                   (u64 *)__LC_MON_CLASS_NR);
250                 rc |= put_guest_lc(vcpu, pgm_info->mon_code,
251                                    (u64 *)__LC_MON_CODE);
252                 break;
253         case PGM_DATA:
254                 rc = put_guest_lc(vcpu, pgm_info->data_exc_code,
255                                   (u32 *)__LC_DATA_EXC_CODE);
256                 break;
257         case PGM_PROTECTION:
258                 rc = put_guest_lc(vcpu, pgm_info->trans_exc_code,
259                                   (u64 *)__LC_TRANS_EXC_CODE);
260                 rc |= put_guest_lc(vcpu, pgm_info->exc_access_id,
261                                    (u8 *)__LC_EXC_ACCESS_ID);
262                 break;
263         }
264
265         if (pgm_info->code & PGM_PER) {
266                 rc |= put_guest_lc(vcpu, pgm_info->per_code,
267                                    (u8 *) __LC_PER_CODE);
268                 rc |= put_guest_lc(vcpu, pgm_info->per_atmid,
269                                    (u8 *)__LC_PER_ATMID);
270                 rc |= put_guest_lc(vcpu, pgm_info->per_address,
271                                    (u64 *) __LC_PER_ADDRESS);
272                 rc |= put_guest_lc(vcpu, pgm_info->per_access_id,
273                                    (u8 *) __LC_PER_ACCESS_ID);
274         }
275
276         switch (vcpu->arch.sie_block->icptcode) {
277         case ICPT_INST:
278         case ICPT_INSTPROGI:
279         case ICPT_OPEREXC:
280         case ICPT_PARTEXEC:
281         case ICPT_IOINST:
282                 /* last instruction only stored for these icptcodes */
283                 rc |= put_guest_lc(vcpu, table[vcpu->arch.sie_block->ipa >> 14],
284                                    (u16 *) __LC_PGM_ILC);
285                 break;
286         case ICPT_PROGI:
287                 rc |= put_guest_lc(vcpu, vcpu->arch.sie_block->pgmilc,
288                                    (u16 *) __LC_PGM_ILC);
289                 break;
290         default:
291                 rc |= put_guest_lc(vcpu, 0,
292                                    (u16 *) __LC_PGM_ILC);
293         }
294
295         rc |= put_guest_lc(vcpu, pgm_info->code,
296                            (u16 *)__LC_PGM_INT_CODE);
297         rc |= write_guest_lc(vcpu, __LC_PGM_OLD_PSW,
298                              &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
299         rc |= read_guest_lc(vcpu, __LC_PGM_NEW_PSW,
300                             &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
301
302         return rc;
303 }
304
305 static void __do_deliver_interrupt(struct kvm_vcpu *vcpu,
306                                    struct kvm_s390_interrupt_info *inti)
307 {
308         const unsigned short table[] = { 2, 4, 4, 6 };
309         int rc = 0;
310
311         switch (inti->type) {
312         case KVM_S390_INT_EMERGENCY:
313                 VCPU_EVENT(vcpu, 4, "%s", "interrupt: sigp emerg");
314                 vcpu->stat.deliver_emergency_signal++;
315                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
316                                                  inti->emerg.code, 0);
317                 rc  = put_guest_lc(vcpu, 0x1201, (u16 *)__LC_EXT_INT_CODE);
318                 rc |= put_guest_lc(vcpu, inti->emerg.code,
319                                    (u16 *)__LC_EXT_CPU_ADDR);
320                 rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
321                                      &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
322                 rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
323                                     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
324                 break;
325         case KVM_S390_INT_EXTERNAL_CALL:
326                 VCPU_EVENT(vcpu, 4, "%s", "interrupt: sigp ext call");
327                 vcpu->stat.deliver_external_call++;
328                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
329                                                  inti->extcall.code, 0);
330                 rc  = put_guest_lc(vcpu, 0x1202, (u16 *)__LC_EXT_INT_CODE);
331                 rc |= put_guest_lc(vcpu, inti->extcall.code,
332                                    (u16 *)__LC_EXT_CPU_ADDR);
333                 rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
334                                      &vcpu->arch.sie_block->gpsw,
335                                      sizeof(psw_t));
336                 rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
337                                     &vcpu->arch.sie_block->gpsw,
338                                     sizeof(psw_t));
339                 break;
340         case KVM_S390_INT_CLOCK_COMP:
341                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
342                                                  inti->ext.ext_params, 0);
343                 deliver_ckc_interrupt(vcpu);
344                 break;
345         case KVM_S390_INT_CPU_TIMER:
346                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
347                                                  inti->ext.ext_params, 0);
348                 rc  = put_guest_lc(vcpu, EXT_IRQ_CPU_TIMER,
349                                    (u16 *)__LC_EXT_INT_CODE);
350                 rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
351                                      &vcpu->arch.sie_block->gpsw,
352                                      sizeof(psw_t));
353                 rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
354                                     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
355                 rc |= put_guest_lc(vcpu, inti->ext.ext_params,
356                                    (u32 *)__LC_EXT_PARAMS);
357                 break;
358         case KVM_S390_INT_SERVICE:
359                 VCPU_EVENT(vcpu, 4, "interrupt: sclp parm:%x",
360                            inti->ext.ext_params);
361                 vcpu->stat.deliver_service_signal++;
362                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
363                                                  inti->ext.ext_params, 0);
364                 rc  = put_guest_lc(vcpu, 0x2401, (u16 *)__LC_EXT_INT_CODE);
365                 rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
366                                      &vcpu->arch.sie_block->gpsw,
367                                      sizeof(psw_t));
368                 rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
369                                     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
370                 rc |= put_guest_lc(vcpu, inti->ext.ext_params,
371                                    (u32 *)__LC_EXT_PARAMS);
372                 break;
373         case KVM_S390_INT_PFAULT_INIT:
374                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type, 0,
375                                                  inti->ext.ext_params2);
376                 rc  = put_guest_lc(vcpu, 0x2603, (u16 *) __LC_EXT_INT_CODE);
377                 rc |= put_guest_lc(vcpu, 0x0600, (u16 *) __LC_EXT_CPU_ADDR);
378                 rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
379                                      &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
380                 rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
381                                     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
382                 rc |= put_guest_lc(vcpu, inti->ext.ext_params2,
383                                    (u64 *) __LC_EXT_PARAMS2);
384                 break;
385         case KVM_S390_INT_PFAULT_DONE:
386                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type, 0,
387                                                  inti->ext.ext_params2);
388                 rc  = put_guest_lc(vcpu, 0x2603, (u16 *)__LC_EXT_INT_CODE);
389                 rc |= put_guest_lc(vcpu, 0x0680, (u16 *)__LC_EXT_CPU_ADDR);
390                 rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
391                                      &vcpu->arch.sie_block->gpsw,
392                                      sizeof(psw_t));
393                 rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
394                                     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
395                 rc |= put_guest_lc(vcpu, inti->ext.ext_params2,
396                                    (u64 *)__LC_EXT_PARAMS2);
397                 break;
398         case KVM_S390_INT_VIRTIO:
399                 VCPU_EVENT(vcpu, 4, "interrupt: virtio parm:%x,parm64:%llx",
400                            inti->ext.ext_params, inti->ext.ext_params2);
401                 vcpu->stat.deliver_virtio_interrupt++;
402                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
403                                                  inti->ext.ext_params,
404                                                  inti->ext.ext_params2);
405                 rc  = put_guest_lc(vcpu, 0x2603, (u16 *)__LC_EXT_INT_CODE);
406                 rc |= put_guest_lc(vcpu, 0x0d00, (u16 *)__LC_EXT_CPU_ADDR);
407                 rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
408                                      &vcpu->arch.sie_block->gpsw,
409                                      sizeof(psw_t));
410                 rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
411                                     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
412                 rc |= put_guest_lc(vcpu, inti->ext.ext_params,
413                                    (u32 *)__LC_EXT_PARAMS);
414                 rc |= put_guest_lc(vcpu, inti->ext.ext_params2,
415                                    (u64 *)__LC_EXT_PARAMS2);
416                 break;
417         case KVM_S390_SIGP_STOP:
418                 VCPU_EVENT(vcpu, 4, "%s", "interrupt: cpu stop");
419                 vcpu->stat.deliver_stop_signal++;
420                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
421                                                  0, 0);
422                 __set_intercept_indicator(vcpu, inti);
423                 break;
424
425         case KVM_S390_SIGP_SET_PREFIX:
426                 VCPU_EVENT(vcpu, 4, "interrupt: set prefix to %x",
427                            inti->prefix.address);
428                 vcpu->stat.deliver_prefix_signal++;
429                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
430                                                  inti->prefix.address, 0);
431                 kvm_s390_set_prefix(vcpu, inti->prefix.address);
432                 break;
433
434         case KVM_S390_RESTART:
435                 VCPU_EVENT(vcpu, 4, "%s", "interrupt: cpu restart");
436                 vcpu->stat.deliver_restart_signal++;
437                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
438                                                  0, 0);
439                 rc  = write_guest_lc(vcpu,
440                                      offsetof(struct _lowcore, restart_old_psw),
441                                      &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
442                 rc |= read_guest_lc(vcpu, offsetof(struct _lowcore, restart_psw),
443                                     &vcpu->arch.sie_block->gpsw,
444                                     sizeof(psw_t));
445                 break;
446         case KVM_S390_PROGRAM_INT:
447                 VCPU_EVENT(vcpu, 4, "interrupt: pgm check code:%x, ilc:%x",
448                            inti->pgm.code,
449                            table[vcpu->arch.sie_block->ipa >> 14]);
450                 vcpu->stat.deliver_program_int++;
451                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
452                                                  inti->pgm.code, 0);
453                 rc = __deliver_prog_irq(vcpu, &inti->pgm);
454                 break;
455
456         case KVM_S390_MCHK:
457                 VCPU_EVENT(vcpu, 4, "interrupt: machine check mcic=%llx",
458                            inti->mchk.mcic);
459                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
460                                                  inti->mchk.cr14,
461                                                  inti->mchk.mcic);
462                 rc  = kvm_s390_vcpu_store_status(vcpu,
463                                                  KVM_S390_STORE_STATUS_PREFIXED);
464                 rc |= put_guest_lc(vcpu, inti->mchk.mcic, (u64 *)__LC_MCCK_CODE);
465                 rc |= write_guest_lc(vcpu, __LC_MCK_OLD_PSW,
466                                      &vcpu->arch.sie_block->gpsw,
467                                      sizeof(psw_t));
468                 rc |= read_guest_lc(vcpu, __LC_MCK_NEW_PSW,
469                                     &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
470                 break;
471
472         case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
473         {
474                 __u32 param0 = ((__u32)inti->io.subchannel_id << 16) |
475                         inti->io.subchannel_nr;
476                 __u64 param1 = ((__u64)inti->io.io_int_parm << 32) |
477                         inti->io.io_int_word;
478                 VCPU_EVENT(vcpu, 4, "interrupt: I/O %llx", inti->type);
479                 vcpu->stat.deliver_io_int++;
480                 trace_kvm_s390_deliver_interrupt(vcpu->vcpu_id, inti->type,
481                                                  param0, param1);
482                 rc  = put_guest_lc(vcpu, inti->io.subchannel_id,
483                                    (u16 *)__LC_SUBCHANNEL_ID);
484                 rc |= put_guest_lc(vcpu, inti->io.subchannel_nr,
485                                    (u16 *)__LC_SUBCHANNEL_NR);
486                 rc |= put_guest_lc(vcpu, inti->io.io_int_parm,
487                                    (u32 *)__LC_IO_INT_PARM);
488                 rc |= put_guest_lc(vcpu, inti->io.io_int_word,
489                                    (u32 *)__LC_IO_INT_WORD);
490                 rc |= write_guest_lc(vcpu, __LC_IO_OLD_PSW,
491                                      &vcpu->arch.sie_block->gpsw,
492                                      sizeof(psw_t));
493                 rc |= read_guest_lc(vcpu, __LC_IO_NEW_PSW,
494                                     &vcpu->arch.sie_block->gpsw,
495                                     sizeof(psw_t));
496                 break;
497         }
498         default:
499                 BUG();
500         }
501         if (rc) {
502                 printk("kvm: The guest lowcore is not mapped during interrupt "
503                        "delivery, killing userspace\n");
504                 do_exit(SIGKILL);
505         }
506 }
507
508 static void deliver_ckc_interrupt(struct kvm_vcpu *vcpu)
509 {
510         int rc;
511
512         rc  = put_guest_lc(vcpu, 0x1004, (u16 __user *)__LC_EXT_INT_CODE);
513         rc |= write_guest_lc(vcpu, __LC_EXT_OLD_PSW,
514                              &vcpu->arch.sie_block->gpsw, sizeof(psw_t));
515         rc |= read_guest_lc(vcpu, __LC_EXT_NEW_PSW,
516                             &vcpu->arch.sie_block->gpsw,
517                             sizeof(psw_t));
518         if (rc) {
519                 printk("kvm: The guest lowcore is not mapped during interrupt "
520                         "delivery, killing userspace\n");
521                 do_exit(SIGKILL);
522         }
523 }
524
525 /* Check whether SIGP interpretation facility has an external call pending */
526 int kvm_s390_si_ext_call_pending(struct kvm_vcpu *vcpu)
527 {
528         atomic_t *sigp_ctrl = &vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].ctrl;
529
530         if (!psw_extint_disabled(vcpu) &&
531             (vcpu->arch.sie_block->gcr[0] & 0x2000ul) &&
532             (atomic_read(sigp_ctrl) & SIGP_CTRL_C) &&
533             (atomic_read(&vcpu->arch.sie_block->cpuflags) & CPUSTAT_ECALL_PEND))
534                 return 1;
535
536         return 0;
537 }
538
539 int kvm_cpu_has_interrupt(struct kvm_vcpu *vcpu)
540 {
541         struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
542         struct kvm_s390_float_interrupt *fi = vcpu->arch.local_int.float_int;
543         struct kvm_s390_interrupt_info  *inti;
544         int rc = 0;
545
546         if (atomic_read(&li->active)) {
547                 spin_lock(&li->lock);
548                 list_for_each_entry(inti, &li->list, list)
549                         if (__interrupt_is_deliverable(vcpu, inti)) {
550                                 rc = 1;
551                                 break;
552                         }
553                 spin_unlock(&li->lock);
554         }
555
556         if ((!rc) && atomic_read(&fi->active)) {
557                 spin_lock(&fi->lock);
558                 list_for_each_entry(inti, &fi->list, list)
559                         if (__interrupt_is_deliverable(vcpu, inti)) {
560                                 rc = 1;
561                                 break;
562                         }
563                 spin_unlock(&fi->lock);
564         }
565
566         if (!rc && kvm_cpu_has_pending_timer(vcpu))
567                 rc = 1;
568
569         if (!rc && kvm_s390_si_ext_call_pending(vcpu))
570                 rc = 1;
571
572         return rc;
573 }
574
575 int kvm_cpu_has_pending_timer(struct kvm_vcpu *vcpu)
576 {
577         if (!(vcpu->arch.sie_block->ckc <
578               get_tod_clock_fast() + vcpu->arch.sie_block->epoch))
579                 return 0;
580         if (!ckc_interrupts_enabled(vcpu))
581                 return 0;
582         return 1;
583 }
584
585 int kvm_s390_handle_wait(struct kvm_vcpu *vcpu)
586 {
587         u64 now, sltime;
588
589         vcpu->stat.exit_wait_state++;
590
591         /* fast path */
592         if (kvm_cpu_has_pending_timer(vcpu) || kvm_arch_vcpu_runnable(vcpu))
593                 return 0;
594
595         if (psw_interrupts_disabled(vcpu)) {
596                 VCPU_EVENT(vcpu, 3, "%s", "disabled wait");
597                 return -EOPNOTSUPP; /* disabled wait */
598         }
599
600         __set_cpu_idle(vcpu);
601         if (!ckc_interrupts_enabled(vcpu)) {
602                 VCPU_EVENT(vcpu, 3, "%s", "enabled wait w/o timer");
603                 goto no_timer;
604         }
605
606         now = get_tod_clock_fast() + vcpu->arch.sie_block->epoch;
607         sltime = tod_to_ns(vcpu->arch.sie_block->ckc - now);
608         hrtimer_start(&vcpu->arch.ckc_timer, ktime_set (0, sltime) , HRTIMER_MODE_REL);
609         VCPU_EVENT(vcpu, 5, "enabled wait via clock comparator: %llx ns", sltime);
610 no_timer:
611         srcu_read_unlock(&vcpu->kvm->srcu, vcpu->srcu_idx);
612         kvm_vcpu_block(vcpu);
613         __unset_cpu_idle(vcpu);
614         vcpu->srcu_idx = srcu_read_lock(&vcpu->kvm->srcu);
615
616         hrtimer_try_to_cancel(&vcpu->arch.ckc_timer);
617         return 0;
618 }
619
620 void kvm_s390_vcpu_wakeup(struct kvm_vcpu *vcpu)
621 {
622         if (waitqueue_active(&vcpu->wq)) {
623                 /*
624                  * The vcpu gave up the cpu voluntarily, mark it as a good
625                  * yield-candidate.
626                  */
627                 vcpu->preempted = true;
628                 wake_up_interruptible(&vcpu->wq);
629         }
630 }
631
/*
 * Tasklet body: @parm carries the vcpu pointer as an unsigned long; the
 * vcpu is woken up via kvm_s390_vcpu_wakeup().
 */
void kvm_s390_tasklet(unsigned long parm)
{
	kvm_s390_vcpu_wakeup((struct kvm_vcpu *) parm);
}
637
638 /*
639  * low level hrtimer wake routine. Because this runs in hardirq context
640  * we schedule a tasklet to do the real work.
641  */
642 enum hrtimer_restart kvm_s390_idle_wakeup(struct hrtimer *timer)
643 {
644         struct kvm_vcpu *vcpu;
645
646         vcpu = container_of(timer, struct kvm_vcpu, arch.ckc_timer);
647         vcpu->preempted = true;
648         tasklet_schedule(&vcpu->arch.tasklet);
649
650         return HRTIMER_NORESTART;
651 }
652
653 void kvm_s390_clear_local_irqs(struct kvm_vcpu *vcpu)
654 {
655         struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
656         struct kvm_s390_interrupt_info  *n, *inti = NULL;
657
658         spin_lock(&li->lock);
659         list_for_each_entry_safe(inti, n, &li->list, list) {
660                 list_del(&inti->list);
661                 kfree(inti);
662         }
663         atomic_set(&li->active, 0);
664         spin_unlock(&li->lock);
665
666         /* clear pending external calls set by sigp interpretation facility */
667         atomic_clear_mask(CPUSTAT_ECALL_PEND, &vcpu->arch.sie_block->cpuflags);
668         atomic_clear_mask(SIGP_CTRL_C,
669                           &vcpu->kvm->arch.sca->cpu[vcpu->vcpu_id].ctrl);
670 }
671
672 void kvm_s390_deliver_pending_interrupts(struct kvm_vcpu *vcpu)
673 {
674         struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
675         struct kvm_s390_float_interrupt *fi = vcpu->arch.local_int.float_int;
676         struct kvm_s390_interrupt_info  *n, *inti = NULL;
677         int deliver;
678
679         __reset_intercept_indicators(vcpu);
680         if (atomic_read(&li->active)) {
681                 do {
682                         deliver = 0;
683                         spin_lock(&li->lock);
684                         list_for_each_entry_safe(inti, n, &li->list, list) {
685                                 if (__interrupt_is_deliverable(vcpu, inti)) {
686                                         list_del(&inti->list);
687                                         deliver = 1;
688                                         break;
689                                 }
690                                 __set_intercept_indicator(vcpu, inti);
691                         }
692                         if (list_empty(&li->list))
693                                 atomic_set(&li->active, 0);
694                         spin_unlock(&li->lock);
695                         if (deliver) {
696                                 __do_deliver_interrupt(vcpu, inti);
697                                 kfree(inti);
698                         }
699                 } while (deliver);
700         }
701
702         if (kvm_cpu_has_pending_timer(vcpu))
703                 deliver_ckc_interrupt(vcpu);
704
705         if (atomic_read(&fi->active)) {
706                 do {
707                         deliver = 0;
708                         spin_lock(&fi->lock);
709                         list_for_each_entry_safe(inti, n, &fi->list, list) {
710                                 if (__interrupt_is_deliverable(vcpu, inti)) {
711                                         list_del(&inti->list);
712                                         fi->irq_count--;
713                                         deliver = 1;
714                                         break;
715                                 }
716                                 __set_intercept_indicator(vcpu, inti);
717                         }
718                         if (list_empty(&fi->list))
719                                 atomic_set(&fi->active, 0);
720                         spin_unlock(&fi->lock);
721                         if (deliver) {
722                                 __do_deliver_interrupt(vcpu, inti);
723                                 kfree(inti);
724                         }
725                 } while (deliver);
726         }
727 }
728
729 void kvm_s390_deliver_pending_machine_checks(struct kvm_vcpu *vcpu)
730 {
731         struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
732         struct kvm_s390_float_interrupt *fi = vcpu->arch.local_int.float_int;
733         struct kvm_s390_interrupt_info  *n, *inti = NULL;
734         int deliver;
735
736         __reset_intercept_indicators(vcpu);
737         if (atomic_read(&li->active)) {
738                 do {
739                         deliver = 0;
740                         spin_lock(&li->lock);
741                         list_for_each_entry_safe(inti, n, &li->list, list) {
742                                 if ((inti->type == KVM_S390_MCHK) &&
743                                     __interrupt_is_deliverable(vcpu, inti)) {
744                                         list_del(&inti->list);
745                                         deliver = 1;
746                                         break;
747                                 }
748                                 __set_intercept_indicator(vcpu, inti);
749                         }
750                         if (list_empty(&li->list))
751                                 atomic_set(&li->active, 0);
752                         spin_unlock(&li->lock);
753                         if (deliver) {
754                                 __do_deliver_interrupt(vcpu, inti);
755                                 kfree(inti);
756                         }
757                 } while (deliver);
758         }
759
760         if (atomic_read(&fi->active)) {
761                 do {
762                         deliver = 0;
763                         spin_lock(&fi->lock);
764                         list_for_each_entry_safe(inti, n, &fi->list, list) {
765                                 if ((inti->type == KVM_S390_MCHK) &&
766                                     __interrupt_is_deliverable(vcpu, inti)) {
767                                         list_del(&inti->list);
768                                         fi->irq_count--;
769                                         deliver = 1;
770                                         break;
771                                 }
772                                 __set_intercept_indicator(vcpu, inti);
773                         }
774                         if (list_empty(&fi->list))
775                                 atomic_set(&fi->active, 0);
776                         spin_unlock(&fi->lock);
777                         if (deliver) {
778                                 __do_deliver_interrupt(vcpu, inti);
779                                 kfree(inti);
780                         }
781                 } while (deliver);
782         }
783 }
784
785 int kvm_s390_inject_program_int(struct kvm_vcpu *vcpu, u16 code)
786 {
787         struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
788         struct kvm_s390_interrupt_info *inti;
789
790         inti = kzalloc(sizeof(*inti), GFP_KERNEL);
791         if (!inti)
792                 return -ENOMEM;
793
794         inti->type = KVM_S390_PROGRAM_INT;
795         inti->pgm.code = code;
796
797         VCPU_EVENT(vcpu, 3, "inject: program check %d (from kernel)", code);
798         trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, inti->type, code, 0, 1);
799         spin_lock(&li->lock);
800         list_add(&inti->list, &li->list);
801         atomic_set(&li->active, 1);
802         BUG_ON(waitqueue_active(li->wq));
803         spin_unlock(&li->lock);
804         return 0;
805 }
806
807 int kvm_s390_inject_prog_irq(struct kvm_vcpu *vcpu,
808                              struct kvm_s390_pgm_info *pgm_info)
809 {
810         struct kvm_s390_local_interrupt *li = &vcpu->arch.local_int;
811         struct kvm_s390_interrupt_info *inti;
812
813         inti = kzalloc(sizeof(*inti), GFP_KERNEL);
814         if (!inti)
815                 return -ENOMEM;
816
817         VCPU_EVENT(vcpu, 3, "inject: prog irq %d (from kernel)",
818                    pgm_info->code);
819         trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, KVM_S390_PROGRAM_INT,
820                                    pgm_info->code, 0, 1);
821
822         inti->type = KVM_S390_PROGRAM_INT;
823         memcpy(&inti->pgm, pgm_info, sizeof(inti->pgm));
824         spin_lock(&li->lock);
825         list_add(&inti->list, &li->list);
826         atomic_set(&li->active, 1);
827         BUG_ON(waitqueue_active(li->wq));
828         spin_unlock(&li->lock);
829         return 0;
830 }
831
832 struct kvm_s390_interrupt_info *kvm_s390_get_io_int(struct kvm *kvm,
833                                                     u64 cr6, u64 schid)
834 {
835         struct kvm_s390_float_interrupt *fi;
836         struct kvm_s390_interrupt_info *inti, *iter;
837
838         if ((!schid && !cr6) || (schid && cr6))
839                 return NULL;
840         mutex_lock(&kvm->lock);
841         fi = &kvm->arch.float_int;
842         spin_lock(&fi->lock);
843         inti = NULL;
844         list_for_each_entry(iter, &fi->list, list) {
845                 if (!is_ioint(iter->type))
846                         continue;
847                 if (cr6 &&
848                     ((cr6 & int_word_to_isc_bits(iter->io.io_int_word)) == 0))
849                         continue;
850                 if (schid) {
851                         if (((schid & 0x00000000ffff0000) >> 16) !=
852                             iter->io.subchannel_id)
853                                 continue;
854                         if ((schid & 0x000000000000ffff) !=
855                             iter->io.subchannel_nr)
856                                 continue;
857                 }
858                 inti = iter;
859                 break;
860         }
861         if (inti) {
862                 list_del_init(&inti->list);
863                 fi->irq_count--;
864         }
865         if (list_empty(&fi->list))
866                 atomic_set(&fi->active, 0);
867         spin_unlock(&fi->lock);
868         mutex_unlock(&kvm->lock);
869         return inti;
870 }
871
872 static int __inject_vm(struct kvm *kvm, struct kvm_s390_interrupt_info *inti)
873 {
874         struct kvm_s390_local_interrupt *li;
875         struct kvm_s390_float_interrupt *fi;
876         struct kvm_s390_interrupt_info *iter;
877         struct kvm_vcpu *dst_vcpu = NULL;
878         int sigcpu;
879         int rc = 0;
880
881         mutex_lock(&kvm->lock);
882         fi = &kvm->arch.float_int;
883         spin_lock(&fi->lock);
884         if (fi->irq_count >= KVM_S390_MAX_FLOAT_IRQS) {
885                 rc = -EINVAL;
886                 goto unlock_fi;
887         }
888         fi->irq_count++;
889         if (!is_ioint(inti->type)) {
890                 list_add_tail(&inti->list, &fi->list);
891         } else {
892                 u64 isc_bits = int_word_to_isc_bits(inti->io.io_int_word);
893
894                 /* Keep I/O interrupts sorted in isc order. */
895                 list_for_each_entry(iter, &fi->list, list) {
896                         if (!is_ioint(iter->type))
897                                 continue;
898                         if (int_word_to_isc_bits(iter->io.io_int_word)
899                             <= isc_bits)
900                                 continue;
901                         break;
902                 }
903                 list_add_tail(&inti->list, &iter->list);
904         }
905         atomic_set(&fi->active, 1);
906         sigcpu = find_first_bit(fi->idle_mask, KVM_MAX_VCPUS);
907         if (sigcpu == KVM_MAX_VCPUS) {
908                 do {
909                         sigcpu = fi->next_rr_cpu++;
910                         if (sigcpu == KVM_MAX_VCPUS)
911                                 sigcpu = fi->next_rr_cpu = 0;
912                 } while (kvm_get_vcpu(kvm, sigcpu) == NULL);
913         }
914         dst_vcpu = kvm_get_vcpu(kvm, sigcpu);
915         li = &dst_vcpu->arch.local_int;
916         spin_lock(&li->lock);
917         atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
918         spin_unlock(&li->lock);
919         kvm_s390_vcpu_wakeup(kvm_get_vcpu(kvm, sigcpu));
920 unlock_fi:
921         spin_unlock(&fi->lock);
922         mutex_unlock(&kvm->lock);
923         return rc;
924 }
925
926 int kvm_s390_inject_vm(struct kvm *kvm,
927                        struct kvm_s390_interrupt *s390int)
928 {
929         struct kvm_s390_interrupt_info *inti;
930
931         inti = kzalloc(sizeof(*inti), GFP_KERNEL);
932         if (!inti)
933                 return -ENOMEM;
934
935         inti->type = s390int->type;
936         switch (inti->type) {
937         case KVM_S390_INT_VIRTIO:
938                 VM_EVENT(kvm, 5, "inject: virtio parm:%x,parm64:%llx",
939                          s390int->parm, s390int->parm64);
940                 inti->ext.ext_params = s390int->parm;
941                 inti->ext.ext_params2 = s390int->parm64;
942                 break;
943         case KVM_S390_INT_SERVICE:
944                 VM_EVENT(kvm, 5, "inject: sclp parm:%x", s390int->parm);
945                 inti->ext.ext_params = s390int->parm;
946                 break;
947         case KVM_S390_INT_PFAULT_DONE:
948                 inti->type = s390int->type;
949                 inti->ext.ext_params2 = s390int->parm64;
950                 break;
951         case KVM_S390_MCHK:
952                 VM_EVENT(kvm, 5, "inject: machine check parm64:%llx",
953                          s390int->parm64);
954                 inti->mchk.cr14 = s390int->parm; /* upper bits are not used */
955                 inti->mchk.mcic = s390int->parm64;
956                 break;
957         case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
958                 if (inti->type & IOINT_AI_MASK)
959                         VM_EVENT(kvm, 5, "%s", "inject: I/O (AI)");
960                 else
961                         VM_EVENT(kvm, 5, "inject: I/O css %x ss %x schid %04x",
962                                  s390int->type & IOINT_CSSID_MASK,
963                                  s390int->type & IOINT_SSID_MASK,
964                                  s390int->type & IOINT_SCHID_MASK);
965                 inti->io.subchannel_id = s390int->parm >> 16;
966                 inti->io.subchannel_nr = s390int->parm & 0x0000ffffu;
967                 inti->io.io_int_parm = s390int->parm64 >> 32;
968                 inti->io.io_int_word = s390int->parm64 & 0x00000000ffffffffull;
969                 break;
970         default:
971                 kfree(inti);
972                 return -EINVAL;
973         }
974         trace_kvm_s390_inject_vm(s390int->type, s390int->parm, s390int->parm64,
975                                  2);
976
977         return __inject_vm(kvm, inti);
978 }
979
/*
 * Put a previously dequeued I/O interrupt back on the floating list.
 *
 * Ownership of @inti passes to this function: it is either queued again
 * or, if __inject_vm() refuses it (floating queue full), freed here. The
 * caller has no way to observe the failure through this void interface
 * and must not touch @inti after the call.
 */
void kvm_s390_reinject_io_int(struct kvm *kvm,
			      struct kvm_s390_interrupt_info *inti)
{
	if (__inject_vm(kvm, inti))
		kfree(inti);
}
985
986 int kvm_s390_inject_vcpu(struct kvm_vcpu *vcpu,
987                          struct kvm_s390_interrupt *s390int)
988 {
989         struct kvm_s390_local_interrupt *li;
990         struct kvm_s390_interrupt_info *inti;
991
992         inti = kzalloc(sizeof(*inti), GFP_KERNEL);
993         if (!inti)
994                 return -ENOMEM;
995
996         switch (s390int->type) {
997         case KVM_S390_PROGRAM_INT:
998                 if (s390int->parm & 0xffff0000) {
999                         kfree(inti);
1000                         return -EINVAL;
1001                 }
1002                 inti->type = s390int->type;
1003                 inti->pgm.code = s390int->parm;
1004                 VCPU_EVENT(vcpu, 3, "inject: program check %d (from user)",
1005                            s390int->parm);
1006                 break;
1007         case KVM_S390_SIGP_SET_PREFIX:
1008                 inti->prefix.address = s390int->parm;
1009                 inti->type = s390int->type;
1010                 VCPU_EVENT(vcpu, 3, "inject: set prefix to %x (from user)",
1011                            s390int->parm);
1012                 break;
1013         case KVM_S390_SIGP_STOP:
1014         case KVM_S390_RESTART:
1015         case KVM_S390_INT_CLOCK_COMP:
1016         case KVM_S390_INT_CPU_TIMER:
1017                 VCPU_EVENT(vcpu, 3, "inject: type %x", s390int->type);
1018                 inti->type = s390int->type;
1019                 break;
1020         case KVM_S390_INT_EXTERNAL_CALL:
1021                 if (s390int->parm & 0xffff0000) {
1022                         kfree(inti);
1023                         return -EINVAL;
1024                 }
1025                 VCPU_EVENT(vcpu, 3, "inject: external call source-cpu:%u",
1026                            s390int->parm);
1027                 inti->type = s390int->type;
1028                 inti->extcall.code = s390int->parm;
1029                 break;
1030         case KVM_S390_INT_EMERGENCY:
1031                 if (s390int->parm & 0xffff0000) {
1032                         kfree(inti);
1033                         return -EINVAL;
1034                 }
1035                 VCPU_EVENT(vcpu, 3, "inject: emergency %u\n", s390int->parm);
1036                 inti->type = s390int->type;
1037                 inti->emerg.code = s390int->parm;
1038                 break;
1039         case KVM_S390_MCHK:
1040                 VCPU_EVENT(vcpu, 5, "inject: machine check parm64:%llx",
1041                            s390int->parm64);
1042                 inti->type = s390int->type;
1043                 inti->mchk.mcic = s390int->parm64;
1044                 break;
1045         case KVM_S390_INT_PFAULT_INIT:
1046                 inti->type = s390int->type;
1047                 inti->ext.ext_params2 = s390int->parm64;
1048                 break;
1049         case KVM_S390_INT_VIRTIO:
1050         case KVM_S390_INT_SERVICE:
1051         case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1052         default:
1053                 kfree(inti);
1054                 return -EINVAL;
1055         }
1056         trace_kvm_s390_inject_vcpu(vcpu->vcpu_id, s390int->type, s390int->parm,
1057                                    s390int->parm64, 2);
1058
1059         mutex_lock(&vcpu->kvm->lock);
1060         li = &vcpu->arch.local_int;
1061         spin_lock(&li->lock);
1062         if (inti->type == KVM_S390_PROGRAM_INT)
1063                 list_add(&inti->list, &li->list);
1064         else
1065                 list_add_tail(&inti->list, &li->list);
1066         atomic_set(&li->active, 1);
1067         if (inti->type == KVM_S390_SIGP_STOP)
1068                 li->action_bits |= ACTION_STOP_ON_STOP;
1069         atomic_set_mask(CPUSTAT_EXT_INT, li->cpuflags);
1070         spin_unlock(&li->lock);
1071         mutex_unlock(&vcpu->kvm->lock);
1072         kvm_s390_vcpu_wakeup(vcpu);
1073         return 0;
1074 }
1075
1076 void kvm_s390_clear_float_irqs(struct kvm *kvm)
1077 {
1078         struct kvm_s390_float_interrupt *fi;
1079         struct kvm_s390_interrupt_info  *n, *inti = NULL;
1080
1081         mutex_lock(&kvm->lock);
1082         fi = &kvm->arch.float_int;
1083         spin_lock(&fi->lock);
1084         list_for_each_entry_safe(inti, n, &fi->list, list) {
1085                 list_del(&inti->list);
1086                 kfree(inti);
1087         }
1088         fi->irq_count = 0;
1089         atomic_set(&fi->active, 0);
1090         spin_unlock(&fi->lock);
1091         mutex_unlock(&kvm->lock);
1092 }
1093
1094 static inline int copy_irq_to_user(struct kvm_s390_interrupt_info *inti,
1095                                    u8 *addr)
1096 {
1097         struct kvm_s390_irq __user *uptr = (struct kvm_s390_irq __user *) addr;
1098         struct kvm_s390_irq irq = {0};
1099
1100         irq.type = inti->type;
1101         switch (inti->type) {
1102         case KVM_S390_INT_PFAULT_INIT:
1103         case KVM_S390_INT_PFAULT_DONE:
1104         case KVM_S390_INT_VIRTIO:
1105         case KVM_S390_INT_SERVICE:
1106                 irq.u.ext = inti->ext;
1107                 break;
1108         case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1109                 irq.u.io = inti->io;
1110                 break;
1111         case KVM_S390_MCHK:
1112                 irq.u.mchk = inti->mchk;
1113                 break;
1114         default:
1115                 return -EINVAL;
1116         }
1117
1118         if (copy_to_user(uptr, &irq, sizeof(irq)))
1119                 return -EFAULT;
1120
1121         return 0;
1122 }
1123
1124 static int get_all_floating_irqs(struct kvm *kvm, __u8 *buf, __u64 len)
1125 {
1126         struct kvm_s390_interrupt_info *inti;
1127         struct kvm_s390_float_interrupt *fi;
1128         int ret = 0;
1129         int n = 0;
1130
1131         mutex_lock(&kvm->lock);
1132         fi = &kvm->arch.float_int;
1133         spin_lock(&fi->lock);
1134
1135         list_for_each_entry(inti, &fi->list, list) {
1136                 if (len < sizeof(struct kvm_s390_irq)) {
1137                         /* signal userspace to try again */
1138                         ret = -ENOMEM;
1139                         break;
1140                 }
1141                 ret = copy_irq_to_user(inti, buf);
1142                 if (ret)
1143                         break;
1144                 buf += sizeof(struct kvm_s390_irq);
1145                 len -= sizeof(struct kvm_s390_irq);
1146                 n++;
1147         }
1148
1149         spin_unlock(&fi->lock);
1150         mutex_unlock(&kvm->lock);
1151
1152         return ret < 0 ? ret : n;
1153 }
1154
1155 static int flic_get_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
1156 {
1157         int r;
1158
1159         switch (attr->group) {
1160         case KVM_DEV_FLIC_GET_ALL_IRQS:
1161                 r = get_all_floating_irqs(dev->kvm, (u8 *) attr->addr,
1162                                           attr->attr);
1163                 break;
1164         default:
1165                 r = -EINVAL;
1166         }
1167
1168         return r;
1169 }
1170
1171 static inline int copy_irq_from_user(struct kvm_s390_interrupt_info *inti,
1172                                      u64 addr)
1173 {
1174         struct kvm_s390_irq __user *uptr = (struct kvm_s390_irq __user *) addr;
1175         void *target = NULL;
1176         void __user *source;
1177         u64 size;
1178
1179         if (get_user(inti->type, (u64 __user *)addr))
1180                 return -EFAULT;
1181
1182         switch (inti->type) {
1183         case KVM_S390_INT_PFAULT_INIT:
1184         case KVM_S390_INT_PFAULT_DONE:
1185         case KVM_S390_INT_VIRTIO:
1186         case KVM_S390_INT_SERVICE:
1187                 target = (void *) &inti->ext;
1188                 source = &uptr->u.ext;
1189                 size = sizeof(inti->ext);
1190                 break;
1191         case KVM_S390_INT_IO_MIN...KVM_S390_INT_IO_MAX:
1192                 target = (void *) &inti->io;
1193                 source = &uptr->u.io;
1194                 size = sizeof(inti->io);
1195                 break;
1196         case KVM_S390_MCHK:
1197                 target = (void *) &inti->mchk;
1198                 source = &uptr->u.mchk;
1199                 size = sizeof(inti->mchk);
1200                 break;
1201         default:
1202                 return -EINVAL;
1203         }
1204
1205         if (copy_from_user(target, source, size))
1206                 return -EFAULT;
1207
1208         return 0;
1209 }
1210
1211 static int enqueue_floating_irq(struct kvm_device *dev,
1212                                 struct kvm_device_attr *attr)
1213 {
1214         struct kvm_s390_interrupt_info *inti = NULL;
1215         int r = 0;
1216         int len = attr->attr;
1217
1218         if (len % sizeof(struct kvm_s390_irq) != 0)
1219                 return -EINVAL;
1220         else if (len > KVM_S390_FLIC_MAX_BUFFER)
1221                 return -EINVAL;
1222
1223         while (len >= sizeof(struct kvm_s390_irq)) {
1224                 inti = kzalloc(sizeof(*inti), GFP_KERNEL);
1225                 if (!inti)
1226                         return -ENOMEM;
1227
1228                 r = copy_irq_from_user(inti, attr->addr);
1229                 if (r) {
1230                         kfree(inti);
1231                         return r;
1232                 }
1233                 r = __inject_vm(dev->kvm, inti);
1234                 if (r) {
1235                         kfree(inti);
1236                         return r;
1237                 }
1238                 len -= sizeof(struct kvm_s390_irq);
1239                 attr->addr += sizeof(struct kvm_s390_irq);
1240         }
1241
1242         return r;
1243 }
1244
1245 static struct s390_io_adapter *get_io_adapter(struct kvm *kvm, unsigned int id)
1246 {
1247         if (id >= MAX_S390_IO_ADAPTERS)
1248                 return NULL;
1249         return kvm->arch.adapters[id];
1250 }
1251
1252 static int register_io_adapter(struct kvm_device *dev,
1253                                struct kvm_device_attr *attr)
1254 {
1255         struct s390_io_adapter *adapter;
1256         struct kvm_s390_io_adapter adapter_info;
1257
1258         if (copy_from_user(&adapter_info,
1259                            (void __user *)attr->addr, sizeof(adapter_info)))
1260                 return -EFAULT;
1261
1262         if ((adapter_info.id >= MAX_S390_IO_ADAPTERS) ||
1263             (dev->kvm->arch.adapters[adapter_info.id] != NULL))
1264                 return -EINVAL;
1265
1266         adapter = kzalloc(sizeof(*adapter), GFP_KERNEL);
1267         if (!adapter)
1268                 return -ENOMEM;
1269
1270         INIT_LIST_HEAD(&adapter->maps);
1271         init_rwsem(&adapter->maps_lock);
1272         atomic_set(&adapter->nr_maps, 0);
1273         adapter->id = adapter_info.id;
1274         adapter->isc = adapter_info.isc;
1275         adapter->maskable = adapter_info.maskable;
1276         adapter->masked = false;
1277         adapter->swap = adapter_info.swap;
1278         dev->kvm->arch.adapters[adapter->id] = adapter;
1279
1280         return 0;
1281 }
1282
1283 int kvm_s390_mask_adapter(struct kvm *kvm, unsigned int id, bool masked)
1284 {
1285         int ret;
1286         struct s390_io_adapter *adapter = get_io_adapter(kvm, id);
1287
1288         if (!adapter || !adapter->maskable)
1289                 return -EINVAL;
1290         ret = adapter->masked;
1291         adapter->masked = masked;
1292         return ret;
1293 }
1294
1295 static int kvm_s390_adapter_map(struct kvm *kvm, unsigned int id, __u64 addr)
1296 {
1297         struct s390_io_adapter *adapter = get_io_adapter(kvm, id);
1298         struct s390_map_info *map;
1299         int ret;
1300
1301         if (!adapter || !addr)
1302                 return -EINVAL;
1303
1304         map = kzalloc(sizeof(*map), GFP_KERNEL);
1305         if (!map) {
1306                 ret = -ENOMEM;
1307                 goto out;
1308         }
1309         INIT_LIST_HEAD(&map->list);
1310         map->guest_addr = addr;
1311         map->addr = gmap_translate(addr, kvm->arch.gmap);
1312         if (map->addr == -EFAULT) {
1313                 ret = -EFAULT;
1314                 goto out;
1315         }
1316         ret = get_user_pages_fast(map->addr, 1, 1, &map->page);
1317         if (ret < 0)
1318                 goto out;
1319         BUG_ON(ret != 1);
1320         down_write(&adapter->maps_lock);
1321         if (atomic_inc_return(&adapter->nr_maps) < MAX_S390_ADAPTER_MAPS) {
1322                 list_add_tail(&map->list, &adapter->maps);
1323                 ret = 0;
1324         } else {
1325                 put_page(map->page);
1326                 ret = -EINVAL;
1327         }
1328         up_write(&adapter->maps_lock);
1329 out:
1330         if (ret)
1331                 kfree(map);
1332         return ret;
1333 }
1334
1335 static int kvm_s390_adapter_unmap(struct kvm *kvm, unsigned int id, __u64 addr)
1336 {
1337         struct s390_io_adapter *adapter = get_io_adapter(kvm, id);
1338         struct s390_map_info *map, *tmp;
1339         int found = 0;
1340
1341         if (!adapter || !addr)
1342                 return -EINVAL;
1343
1344         down_write(&adapter->maps_lock);
1345         list_for_each_entry_safe(map, tmp, &adapter->maps, list) {
1346                 if (map->guest_addr == addr) {
1347                         found = 1;
1348                         atomic_dec(&adapter->nr_maps);
1349                         list_del(&map->list);
1350                         put_page(map->page);
1351                         kfree(map);
1352                         break;
1353                 }
1354         }
1355         up_write(&adapter->maps_lock);
1356
1357         return found ? 0 : -EINVAL;
1358 }
1359
1360 void kvm_s390_destroy_adapters(struct kvm *kvm)
1361 {
1362         int i;
1363         struct s390_map_info *map, *tmp;
1364
1365         for (i = 0; i < MAX_S390_IO_ADAPTERS; i++) {
1366                 if (!kvm->arch.adapters[i])
1367                         continue;
1368                 list_for_each_entry_safe(map, tmp,
1369                                          &kvm->arch.adapters[i]->maps, list) {
1370                         list_del(&map->list);
1371                         put_page(map->page);
1372                         kfree(map);
1373                 }
1374                 kfree(kvm->arch.adapters[i]);
1375         }
1376 }
1377
1378 static int modify_io_adapter(struct kvm_device *dev,
1379                              struct kvm_device_attr *attr)
1380 {
1381         struct kvm_s390_io_adapter_req req;
1382         struct s390_io_adapter *adapter;
1383         int ret;
1384
1385         if (copy_from_user(&req, (void __user *)attr->addr, sizeof(req)))
1386                 return -EFAULT;
1387
1388         adapter = get_io_adapter(dev->kvm, req.id);
1389         if (!adapter)
1390                 return -EINVAL;
1391         switch (req.type) {
1392         case KVM_S390_IO_ADAPTER_MASK:
1393                 ret = kvm_s390_mask_adapter(dev->kvm, req.id, req.mask);
1394                 if (ret > 0)
1395                         ret = 0;
1396                 break;
1397         case KVM_S390_IO_ADAPTER_MAP:
1398                 ret = kvm_s390_adapter_map(dev->kvm, req.id, req.addr);
1399                 break;
1400         case KVM_S390_IO_ADAPTER_UNMAP:
1401                 ret = kvm_s390_adapter_unmap(dev->kvm, req.id, req.addr);
1402                 break;
1403         default:
1404                 ret = -EINVAL;
1405         }
1406
1407         return ret;
1408 }
1409
1410 static int flic_set_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
1411 {
1412         int r = 0;
1413         unsigned int i;
1414         struct kvm_vcpu *vcpu;
1415
1416         switch (attr->group) {
1417         case KVM_DEV_FLIC_ENQUEUE:
1418                 r = enqueue_floating_irq(dev, attr);
1419                 break;
1420         case KVM_DEV_FLIC_CLEAR_IRQS:
1421                 r = 0;
1422                 kvm_s390_clear_float_irqs(dev->kvm);
1423                 break;
1424         case KVM_DEV_FLIC_APF_ENABLE:
1425                 dev->kvm->arch.gmap->pfault_enabled = 1;
1426                 break;
1427         case KVM_DEV_FLIC_APF_DISABLE_WAIT:
1428                 dev->kvm->arch.gmap->pfault_enabled = 0;
1429                 /*
1430                  * Make sure no async faults are in transition when
1431                  * clearing the queues. So we don't need to worry
1432                  * about late coming workers.
1433                  */
1434                 synchronize_srcu(&dev->kvm->srcu);
1435                 kvm_for_each_vcpu(i, vcpu, dev->kvm)
1436                         kvm_clear_async_pf_completion_queue(vcpu);
1437                 break;
1438         case KVM_DEV_FLIC_ADAPTER_REGISTER:
1439                 r = register_io_adapter(dev, attr);
1440                 break;
1441         case KVM_DEV_FLIC_ADAPTER_MODIFY:
1442                 r = modify_io_adapter(dev, attr);
1443                 break;
1444         default:
1445                 r = -EINVAL;
1446         }
1447
1448         return r;
1449 }
1450
1451 static int flic_create(struct kvm_device *dev, u32 type)
1452 {
1453         if (!dev)
1454                 return -EINVAL;
1455         if (dev->kvm->arch.flic)
1456                 return -EINVAL;
1457         dev->kvm->arch.flic = dev;
1458         return 0;
1459 }
1460
1461 static void flic_destroy(struct kvm_device *dev)
1462 {
1463         dev->kvm->arch.flic = NULL;
1464         kfree(dev);
1465 }
1466
1467 /* s390 floating irq controller (flic) */
1468 struct kvm_device_ops kvm_flic_ops = {
1469         .name = "kvm-flic",
1470         .get_attr = flic_get_attr,
1471         .set_attr = flic_set_attr,
1472         .create = flic_create,
1473         .destroy = flic_destroy,
1474 };
1475
1476 static unsigned long get_ind_bit(__u64 addr, unsigned long bit_nr, bool swap)
1477 {
1478         unsigned long bit;
1479
1480         bit = bit_nr + (addr % PAGE_SIZE) * 8;
1481
1482         return swap ? (bit ^ (BITS_PER_LONG - 1)) : bit;
1483 }
1484
1485 static struct s390_map_info *get_map_info(struct s390_io_adapter *adapter,
1486                                           u64 addr)
1487 {
1488         struct s390_map_info *map;
1489
1490         if (!adapter)
1491                 return NULL;
1492
1493         list_for_each_entry(map, &adapter->maps, list) {
1494                 if (map->guest_addr == addr)
1495                         return map;
1496         }
1497         return NULL;
1498 }
1499
1500 static int adapter_indicators_set(struct kvm *kvm,
1501                                   struct s390_io_adapter *adapter,
1502                                   struct kvm_s390_adapter_int *adapter_int)
1503 {
1504         unsigned long bit;
1505         int summary_set, idx;
1506         struct s390_map_info *info;
1507         void *map;
1508
1509         info = get_map_info(adapter, adapter_int->ind_addr);
1510         if (!info)
1511                 return -1;
1512         map = page_address(info->page);
1513         bit = get_ind_bit(info->addr, adapter_int->ind_offset, adapter->swap);
1514         set_bit(bit, map);
1515         idx = srcu_read_lock(&kvm->srcu);
1516         mark_page_dirty(kvm, info->guest_addr >> PAGE_SHIFT);
1517         set_page_dirty_lock(info->page);
1518         info = get_map_info(adapter, adapter_int->summary_addr);
1519         if (!info) {
1520                 srcu_read_unlock(&kvm->srcu, idx);
1521                 return -1;
1522         }
1523         map = page_address(info->page);
1524         bit = get_ind_bit(info->addr, adapter_int->summary_offset,
1525                           adapter->swap);
1526         summary_set = test_and_set_bit(bit, map);
1527         mark_page_dirty(kvm, info->guest_addr >> PAGE_SHIFT);
1528         set_page_dirty_lock(info->page);
1529         srcu_read_unlock(&kvm->srcu, idx);
1530         return summary_set ? 0 : 1;
1531 }
1532
1533 /*
1534  * < 0 - not injected due to error
1535  * = 0 - coalesced, summary indicator already active
1536  * > 0 - injected interrupt
1537  */
1538 static int set_adapter_int(struct kvm_kernel_irq_routing_entry *e,
1539                            struct kvm *kvm, int irq_source_id, int level,
1540                            bool line_status)
1541 {
1542         int ret;
1543         struct s390_io_adapter *adapter;
1544
1545         /* We're only interested in the 0->1 transition. */
1546         if (!level)
1547                 return 0;
1548         adapter = get_io_adapter(kvm, e->adapter.adapter_id);
1549         if (!adapter)
1550                 return -1;
1551         down_read(&adapter->maps_lock);
1552         ret = adapter_indicators_set(kvm, adapter, &e->adapter);
1553         up_read(&adapter->maps_lock);
1554         if ((ret > 0) && !adapter->masked) {
1555                 struct kvm_s390_interrupt s390int = {
1556                         .type = KVM_S390_INT_IO(1, 0, 0, 0),
1557                         .parm = 0,
1558                         .parm64 = (adapter->isc << 27) | 0x80000000,
1559                 };
1560                 ret = kvm_s390_inject_vm(kvm, &s390int);
1561                 if (ret == 0)
1562                         ret = 1;
1563         }
1564         return ret;
1565 }
1566
1567 int kvm_set_routing_entry(struct kvm_irq_routing_table *rt,
1568                           struct kvm_kernel_irq_routing_entry *e,
1569                           const struct kvm_irq_routing_entry *ue)
1570 {
1571         int ret;
1572
1573         switch (ue->type) {
1574         case KVM_IRQ_ROUTING_S390_ADAPTER:
1575                 e->set = set_adapter_int;
1576                 e->adapter.summary_addr = ue->u.adapter.summary_addr;
1577                 e->adapter.ind_addr = ue->u.adapter.ind_addr;
1578                 e->adapter.summary_offset = ue->u.adapter.summary_offset;
1579                 e->adapter.ind_offset = ue->u.adapter.ind_offset;
1580                 e->adapter.adapter_id = ue->u.adapter.adapter_id;
1581                 ret = 0;
1582                 break;
1583         default:
1584                 ret = -EINVAL;
1585         }
1586
1587         return ret;
1588 }
1589
/*
 * MSI delivery stub: every request is rejected with -EINVAL and none of
 * the arguments are examined.
 */
int kvm_set_msi(struct kvm_kernel_irq_routing_entry *e,
                struct kvm *kvm,
                int irq_source_id,
                int level,
                bool line_status)
{
        return -EINVAL;
}