]> git.proxmox.com Git - mirror_ubuntu-hirsute-kernel.git/blame - arch/powerpc/kvm/book3s_xics.c
KVM: PPC: Book3S HV: Use XICS hypercalls when running as a nested hypervisor
[mirror_ubuntu-hirsute-kernel.git] / arch / powerpc / kvm / book3s_xics.c
CommitLineData
bc5ad3f3
BH
1/*
2 * Copyright 2012 Michael Ellerman, IBM Corporation.
3 * Copyright 2012 Benjamin Herrenschmidt, IBM Corporation.
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License, version 2, as
7 * published by the Free Software Foundation.
8 */
9
10#include <linux/kernel.h>
11#include <linux/kvm_host.h>
12#include <linux/err.h>
13#include <linux/gfp.h>
5975a2e0 14#include <linux/anon_inodes.h>
433c5c20 15#include <linux/spinlock.h>
bc5ad3f3 16
7c0f6ba6 17#include <linux/uaccess.h>
bc5ad3f3
BH
18#include <asm/kvm_book3s.h>
19#include <asm/kvm_ppc.h>
20#include <asm/hvcall.h>
21#include <asm/xics.h>
7644d581 22#include <asm/debugfs.h>
7bfa9ad5 23#include <asm/time.h>
bc5ad3f3 24
bc5ad3f3
BH
25#include <linux/seq_file.h>
26
27#include "book3s_xics.h"
28
29#if 1
30#define XICS_DBG(fmt...) do { } while (0)
31#else
32#define XICS_DBG(fmt...) trace_printk(fmt)
33#endif
34
e7d26f28
BH
35#define ENABLE_REALMODE true
36#define DEBUG_REALMODE false
37
bc5ad3f3
BH
38/*
39 * LOCKING
40 * =======
41 *
34cb7954 42 * Each ICS has a spin lock protecting the information about the IRQ
4e33d1f0 43 * sources and avoiding simultaneous deliveries of the same interrupt.
bc5ad3f3
BH
44 *
45 * ICP operations are done via a single compare & swap transaction
46 * (most ICP state fits in the union kvmppc_icp_state)
47 */
48
49/*
50 * TODO
51 * ====
52 *
53 * - To speed up resends, keep a bitmap of "resend" set bits in the
54 * ICS
55 *
56 * - Speed up server# -> ICP lookup (array ? hash table ?)
57 *
58 * - Make ICS lockless as well, or at least a per-interrupt lock or hashed
59 * locks array to improve scalability
bc5ad3f3
BH
60 */
61
62/* -- ICS routines -- */
63
64static void icp_deliver_irq(struct kvmppc_xics *xics, struct kvmppc_icp *icp,
21acd0e4 65 u32 new_irq, bool check_resend);
bc5ad3f3 66
25a2150b
PM
67/*
68 * Return value ideally indicates how the interrupt was handled, but no
69 * callers look at it (given that we don't implement KVM_IRQ_LINE_STATUS),
70 * so just return 0.
71 */
72static int ics_deliver_irq(struct kvmppc_xics *xics, u32 irq, u32 level)
bc5ad3f3
BH
73{
74 struct ics_irq_state *state;
75 struct kvmppc_ics *ics;
76 u16 src;
17d48610 77 u32 pq_old, pq_new;
bc5ad3f3
BH
78
79 XICS_DBG("ics deliver %#x (level: %d)\n", irq, level);
80
81 ics = kvmppc_xics_find_ics(xics, irq, &src);
82 if (!ics) {
83 XICS_DBG("ics_deliver_irq: IRQ 0x%06x not found !\n", irq);
84 return -EINVAL;
85 }
86 state = &ics->irq_state[src];
87 if (!state->exists)
88 return -EINVAL;
89
17d48610
LZ
90 if (level == KVM_INTERRUPT_SET_LEVEL || level == KVM_INTERRUPT_SET)
91 level = 1;
92 else if (level == KVM_INTERRUPT_UNSET)
93 level = 0;
bc5ad3f3 94 /*
17d48610
LZ
95 * Take other values the same as 1, consistent with original code.
96 * maybe WARN here?
bc5ad3f3 97 */
17d48610
LZ
98
99 if (!state->lsi && level == 0) /* noop for MSI */
bc5ad3f3 100 return 0;
17d48610
LZ
101
102 do {
103 pq_old = state->pq_state;
104 if (state->lsi) {
105 if (level) {
106 if (pq_old & PQ_PRESENTED)
107 /* Setting already set LSI ... */
108 return 0;
109
110 pq_new = PQ_PRESENTED;
111 } else
112 pq_new = 0;
113 } else
114 pq_new = ((pq_old << 1) & 3) | PQ_PRESENTED;
115 } while (cmpxchg(&state->pq_state, pq_old, pq_new) != pq_old);
116
117 /* Test P=1, Q=0, this is the only case where we present */
118 if (pq_new == PQ_PRESENTED)
21acd0e4 119 icp_deliver_irq(xics, NULL, irq, false);
bc5ad3f3 120
5d375199
PM
121 /* Record which CPU this arrived on for passed-through interrupts */
122 if (state->host_irq)
123 state->intr_cpu = raw_smp_processor_id();
124
25a2150b 125 return 0;
bc5ad3f3
BH
126}
127
128static void ics_check_resend(struct kvmppc_xics *xics, struct kvmppc_ics *ics,
129 struct kvmppc_icp *icp)
130{
131 int i;
132
bc5ad3f3
BH
133 for (i = 0; i < KVMPPC_XICS_IRQ_PER_ICS; i++) {
134 struct ics_irq_state *state = &ics->irq_state[i];
21acd0e4
LZ
135 if (state->resend) {
136 XICS_DBG("resend %#x prio %#x\n", state->number,
137 state->priority);
138 icp_deliver_irq(xics, icp, state->number, true);
139 }
bc5ad3f3 140 }
bc5ad3f3
BH
141}
142
d19bd862
PM
143static bool write_xive(struct kvmppc_xics *xics, struct kvmppc_ics *ics,
144 struct ics_irq_state *state,
145 u32 server, u32 priority, u32 saved_priority)
146{
147 bool deliver;
34cb7954 148 unsigned long flags;
d19bd862 149
34cb7954
SW
150 local_irq_save(flags);
151 arch_spin_lock(&ics->lock);
d19bd862
PM
152
153 state->server = server;
154 state->priority = priority;
155 state->saved_priority = saved_priority;
156 deliver = false;
157 if ((state->masked_pending || state->resend) && priority != MASKED) {
158 state->masked_pending = 0;
bf5a71d5 159 state->resend = 0;
d19bd862
PM
160 deliver = true;
161 }
162
34cb7954
SW
163 arch_spin_unlock(&ics->lock);
164 local_irq_restore(flags);
d19bd862
PM
165
166 return deliver;
167}
168
bc5ad3f3
BH
169int kvmppc_xics_set_xive(struct kvm *kvm, u32 irq, u32 server, u32 priority)
170{
171 struct kvmppc_xics *xics = kvm->arch.xics;
172 struct kvmppc_icp *icp;
173 struct kvmppc_ics *ics;
174 struct ics_irq_state *state;
175 u16 src;
bc5ad3f3
BH
176
177 if (!xics)
178 return -ENODEV;
179
180 ics = kvmppc_xics_find_ics(xics, irq, &src);
181 if (!ics)
182 return -EINVAL;
183 state = &ics->irq_state[src];
184
185 icp = kvmppc_xics_find_server(kvm, server);
186 if (!icp)
187 return -EINVAL;
188
bc5ad3f3
BH
189 XICS_DBG("set_xive %#x server %#x prio %#x MP:%d RS:%d\n",
190 irq, server, priority,
191 state->masked_pending, state->resend);
192
d19bd862 193 if (write_xive(xics, ics, state, server, priority, priority))
21acd0e4 194 icp_deliver_irq(xics, icp, irq, false);
bc5ad3f3
BH
195
196 return 0;
197}
198
199int kvmppc_xics_get_xive(struct kvm *kvm, u32 irq, u32 *server, u32 *priority)
200{
201 struct kvmppc_xics *xics = kvm->arch.xics;
202 struct kvmppc_ics *ics;
203 struct ics_irq_state *state;
204 u16 src;
34cb7954 205 unsigned long flags;
bc5ad3f3
BH
206
207 if (!xics)
208 return -ENODEV;
209
210 ics = kvmppc_xics_find_ics(xics, irq, &src);
211 if (!ics)
212 return -EINVAL;
213 state = &ics->irq_state[src];
214
34cb7954
SW
215 local_irq_save(flags);
216 arch_spin_lock(&ics->lock);
bc5ad3f3
BH
217 *server = state->server;
218 *priority = state->priority;
34cb7954
SW
219 arch_spin_unlock(&ics->lock);
220 local_irq_restore(flags);
bc5ad3f3
BH
221
222 return 0;
223}
224
d19bd862
PM
225int kvmppc_xics_int_on(struct kvm *kvm, u32 irq)
226{
227 struct kvmppc_xics *xics = kvm->arch.xics;
228 struct kvmppc_icp *icp;
229 struct kvmppc_ics *ics;
230 struct ics_irq_state *state;
231 u16 src;
232
233 if (!xics)
234 return -ENODEV;
235
236 ics = kvmppc_xics_find_ics(xics, irq, &src);
237 if (!ics)
238 return -EINVAL;
239 state = &ics->irq_state[src];
240
241 icp = kvmppc_xics_find_server(kvm, state->server);
242 if (!icp)
243 return -EINVAL;
244
245 if (write_xive(xics, ics, state, state->server, state->saved_priority,
246 state->saved_priority))
21acd0e4 247 icp_deliver_irq(xics, icp, irq, false);
d19bd862
PM
248
249 return 0;
250}
251
252int kvmppc_xics_int_off(struct kvm *kvm, u32 irq)
253{
254 struct kvmppc_xics *xics = kvm->arch.xics;
255 struct kvmppc_ics *ics;
256 struct ics_irq_state *state;
257 u16 src;
258
259 if (!xics)
260 return -ENODEV;
261
262 ics = kvmppc_xics_find_ics(xics, irq, &src);
263 if (!ics)
264 return -EINVAL;
265 state = &ics->irq_state[src];
266
267 write_xive(xics, ics, state, state->server, MASKED, state->priority);
268
269 return 0;
270}
271
bc5ad3f3
BH
272/* -- ICP routines, including hcalls -- */
273
274static inline bool icp_try_update(struct kvmppc_icp *icp,
275 union kvmppc_icp_state old,
276 union kvmppc_icp_state new,
277 bool change_self)
278{
279 bool success;
280
281 /* Calculate new output value */
282 new.out_ee = (new.xisr && (new.pending_pri < new.cppr));
283
284 /* Attempt atomic update */
285 success = cmpxchg64(&icp->state.raw, old.raw, new.raw) == old.raw;
286 if (!success)
287 goto bail;
288
ade3ac66 289 XICS_DBG("UPD [%04lx] - C:%02x M:%02x PP: %02x PI:%06x R:%d O:%d\n",
bc5ad3f3
BH
290 icp->server_num,
291 old.cppr, old.mfrr, old.pending_pri, old.xisr,
292 old.need_resend, old.out_ee);
293 XICS_DBG("UPD - C:%02x M:%02x PP: %02x PI:%06x R:%d O:%d\n",
294 new.cppr, new.mfrr, new.pending_pri, new.xisr,
295 new.need_resend, new.out_ee);
296 /*
297 * Check for output state update
298 *
299 * Note that this is racy since another processor could be updating
300 * the state already. This is why we never clear the interrupt output
301 * here, we only ever set it. The clear only happens prior to doing
302 * an update and only by the processor itself. Currently we do it
303 * in Accept (H_XIRR) and Up_Cppr (H_XPPR).
304 *
305 * We also do not try to figure out whether the EE state has changed,
e7d26f28
BH
306 * we unconditionally set it if the new state calls for it. The reason
307 * for that is that we opportunistically remove the pending interrupt
308 * flag when raising CPPR, so we need to set it back here if an
309 * interrupt is still pending.
bc5ad3f3
BH
310 */
311 if (new.out_ee) {
312 kvmppc_book3s_queue_irqprio(icp->vcpu,
d24ea8a7 313 BOOK3S_INTERRUPT_EXTERNAL);
bc5ad3f3 314 if (!change_self)
54695c30 315 kvmppc_fast_vcpu_kick(icp->vcpu);
bc5ad3f3
BH
316 }
317 bail:
318 return success;
319}
320
321static void icp_check_resend(struct kvmppc_xics *xics,
322 struct kvmppc_icp *icp)
323{
324 u32 icsid;
325
326 /* Order this load with the test for need_resend in the caller */
327 smp_rmb();
328 for_each_set_bit(icsid, icp->resend_map, xics->max_icsid + 1) {
329 struct kvmppc_ics *ics = xics->ics[icsid];
330
331 if (!test_and_clear_bit(icsid, icp->resend_map))
332 continue;
333 if (!ics)
334 continue;
335 ics_check_resend(xics, ics, icp);
336 }
337}
338
339static bool icp_try_to_deliver(struct kvmppc_icp *icp, u32 irq, u8 priority,
340 u32 *reject)
341{
342 union kvmppc_icp_state old_state, new_state;
343 bool success;
344
ade3ac66 345 XICS_DBG("try deliver %#x(P:%#x) to server %#lx\n", irq, priority,
bc5ad3f3
BH
346 icp->server_num);
347
348 do {
5ee07612 349 old_state = new_state = READ_ONCE(icp->state);
bc5ad3f3
BH
350
351 *reject = 0;
352
353 /* See if we can deliver */
354 success = new_state.cppr > priority &&
355 new_state.mfrr > priority &&
356 new_state.pending_pri > priority;
357
358 /*
359 * If we can, check for a rejection and perform the
360 * delivery
361 */
362 if (success) {
363 *reject = new_state.xisr;
364 new_state.xisr = irq;
365 new_state.pending_pri = priority;
366 } else {
367 /*
368 * If we failed to deliver we set need_resend
369 * so a subsequent CPPR state change causes us
370 * to try a new delivery.
371 */
372 new_state.need_resend = true;
373 }
374
375 } while (!icp_try_update(icp, old_state, new_state, false));
376
377 return success;
378}
379
380static void icp_deliver_irq(struct kvmppc_xics *xics, struct kvmppc_icp *icp,
21acd0e4 381 u32 new_irq, bool check_resend)
bc5ad3f3
BH
382{
383 struct ics_irq_state *state;
384 struct kvmppc_ics *ics;
385 u32 reject;
386 u16 src;
34cb7954 387 unsigned long flags;
bc5ad3f3
BH
388
389 /*
390 * This is used both for initial delivery of an interrupt and
391 * for subsequent rejection.
392 *
393 * Rejection can be racy vs. resends. We have evaluated the
394 * rejection in an atomic ICP transaction which is now complete,
395 * so potentially the ICP can already accept the interrupt again.
396 *
397 * So we need to retry the delivery. Essentially the reject path
398 * boils down to a failed delivery. Always.
399 *
400 * Now the interrupt could also have moved to a different target,
401 * thus we may need to re-do the ICP lookup as well
402 */
403
404 again:
405 /* Get the ICS state and lock it */
406 ics = kvmppc_xics_find_ics(xics, new_irq, &src);
407 if (!ics) {
408 XICS_DBG("icp_deliver_irq: IRQ 0x%06x not found !\n", new_irq);
409 return;
410 }
411 state = &ics->irq_state[src];
412
413 /* Get a lock on the ICS */
34cb7954
SW
414 local_irq_save(flags);
415 arch_spin_lock(&ics->lock);
bc5ad3f3
BH
416
417 /* Get our server */
418 if (!icp || state->server != icp->server_num) {
419 icp = kvmppc_xics_find_server(xics->kvm, state->server);
420 if (!icp) {
421 pr_warn("icp_deliver_irq: IRQ 0x%06x server 0x%x not found !\n",
422 new_irq, state->server);
423 goto out;
424 }
425 }
426
21acd0e4
LZ
427 if (check_resend)
428 if (!state->resend)
429 goto out;
430
bc5ad3f3
BH
431 /* Clear the resend bit of that interrupt */
432 state->resend = 0;
433
434 /*
435 * If masked, bail out
436 *
437 * Note: PAPR doesn't mention anything about masked pending
438 * when doing a resend, only when doing a delivery.
439 *
440 * However that would have the effect of losing a masked
441 * interrupt that was rejected and isn't consistent with
442 * the whole masked_pending business which is about not
443 * losing interrupts that occur while masked.
444 *
446957ba 445 * I don't differentiate normal deliveries and resends, this
bc5ad3f3
BH
446 * implementation will differ from PAPR and not lose such
447 * interrupts.
448 */
449 if (state->priority == MASKED) {
450 XICS_DBG("irq %#x masked pending\n", new_irq);
451 state->masked_pending = 1;
452 goto out;
453 }
454
455 /*
456 * Try the delivery, this will set the need_resend flag
457 * in the ICP as part of the atomic transaction if the
458 * delivery is not possible.
459 *
460 * Note that if successful, the new delivery might have itself
461 * rejected an interrupt that was "delivered" before we took the
34cb7954 462 * ics spin lock.
bc5ad3f3
BH
463 *
464 * In this case we do the whole sequence all over again for the
465 * new guy. We cannot assume that the rejected interrupt is less
466 * favored than the new one, and thus doesn't need to be delivered,
467 * because by the time we exit icp_try_to_deliver() the target
468 * processor may well have alrady consumed & completed it, and thus
469 * the rejected interrupt might actually be already acceptable.
470 */
471 if (icp_try_to_deliver(icp, new_irq, state->priority, &reject)) {
472 /*
473 * Delivery was successful, did we reject somebody else ?
474 */
475 if (reject && reject != XICS_IPI) {
34cb7954
SW
476 arch_spin_unlock(&ics->lock);
477 local_irq_restore(flags);
bc5ad3f3 478 new_irq = reject;
21acd0e4 479 check_resend = 0;
bc5ad3f3
BH
480 goto again;
481 }
482 } else {
483 /*
484 * We failed to deliver the interrupt we need to set the
485 * resend map bit and mark the ICS state as needing a resend
486 */
bc5ad3f3
BH
487 state->resend = 1;
488
21acd0e4
LZ
489 /*
490 * Make sure when checking resend, we don't miss the resend
491 * if resend_map bit is seen and cleared.
492 */
493 smp_wmb();
494 set_bit(ics->icsid, icp->resend_map);
495
bc5ad3f3
BH
496 /*
497 * If the need_resend flag got cleared in the ICP some time
498 * between icp_try_to_deliver() atomic update and now, then
499 * we know it might have missed the resend_map bit. So we
500 * retry
501 */
502 smp_mb();
503 if (!icp->state.need_resend) {
bf5a71d5 504 state->resend = 0;
34cb7954
SW
505 arch_spin_unlock(&ics->lock);
506 local_irq_restore(flags);
21acd0e4 507 check_resend = 0;
bc5ad3f3
BH
508 goto again;
509 }
510 }
511 out:
34cb7954
SW
512 arch_spin_unlock(&ics->lock);
513 local_irq_restore(flags);
bc5ad3f3
BH
514}
515
516static void icp_down_cppr(struct kvmppc_xics *xics, struct kvmppc_icp *icp,
517 u8 new_cppr)
518{
519 union kvmppc_icp_state old_state, new_state;
520 bool resend;
521
522 /*
523 * This handles several related states in one operation:
524 *
525 * ICP State: Down_CPPR
526 *
527 * Load CPPR with new value and if the XISR is 0
528 * then check for resends:
529 *
530 * ICP State: Resend
531 *
532 * If MFRR is more favored than CPPR, check for IPIs
533 * and notify ICS of a potential resend. This is done
534 * asynchronously (when used in real mode, we will have
535 * to exit here).
536 *
537 * We do not handle the complete Check_IPI as documented
538 * here. In the PAPR, this state will be used for both
539 * Set_MFRR and Down_CPPR. However, we know that we aren't
540 * changing the MFRR state here so we don't need to handle
541 * the case of an MFRR causing a reject of a pending irq,
542 * this will have been handled when the MFRR was set in the
543 * first place.
544 *
545 * Thus we don't have to handle rejects, only resends.
546 *
547 * When implementing real mode for HV KVM, resend will lead to
548 * a H_TOO_HARD return and the whole transaction will be handled
549 * in virtual mode.
550 */
551 do {
5ee07612 552 old_state = new_state = READ_ONCE(icp->state);
bc5ad3f3
BH
553
554 /* Down_CPPR */
555 new_state.cppr = new_cppr;
556
557 /*
558 * Cut down Resend / Check_IPI / IPI
559 *
560 * The logic is that we cannot have a pending interrupt
561 * trumped by an IPI at this point (see above), so we
562 * know that either the pending interrupt is already an
563 * IPI (in which case we don't care to override it) or
564 * it's either more favored than us or non existent
565 */
566 if (new_state.mfrr < new_cppr &&
567 new_state.mfrr <= new_state.pending_pri) {
568 WARN_ON(new_state.xisr != XICS_IPI &&
569 new_state.xisr != 0);
570 new_state.pending_pri = new_state.mfrr;
571 new_state.xisr = XICS_IPI;
572 }
573
574 /* Latch/clear resend bit */
575 resend = new_state.need_resend;
576 new_state.need_resend = 0;
577
578 } while (!icp_try_update(icp, old_state, new_state, true));
579
580 /*
581 * Now handle resend checks. Those are asynchronous to the ICP
582 * state update in HW (ie bus transactions) so we can handle them
583 * separately here too
584 */
585 if (resend)
586 icp_check_resend(xics, icp);
587}
588
e7d26f28 589static noinline unsigned long kvmppc_h_xirr(struct kvm_vcpu *vcpu)
bc5ad3f3
BH
590{
591 union kvmppc_icp_state old_state, new_state;
592 struct kvmppc_icp *icp = vcpu->arch.icp;
593 u32 xirr;
594
595 /* First, remove EE from the processor */
d24ea8a7 596 kvmppc_book3s_dequeue_irqprio(icp->vcpu, BOOK3S_INTERRUPT_EXTERNAL);
bc5ad3f3
BH
597
598 /*
599 * ICP State: Accept_Interrupt
600 *
601 * Return the pending interrupt (if any) along with the
602 * current CPPR, then clear the XISR & set CPPR to the
603 * pending priority
604 */
605 do {
5ee07612 606 old_state = new_state = READ_ONCE(icp->state);
bc5ad3f3
BH
607
608 xirr = old_state.xisr | (((u32)old_state.cppr) << 24);
609 if (!old_state.xisr)
610 break;
611 new_state.cppr = new_state.pending_pri;
612 new_state.pending_pri = 0xff;
613 new_state.xisr = 0;
614
615 } while (!icp_try_update(icp, old_state, new_state, true));
616
617 XICS_DBG("h_xirr vcpu %d xirr %#x\n", vcpu->vcpu_id, xirr);
618
619 return xirr;
620}
621
e7d26f28
BH
622static noinline int kvmppc_h_ipi(struct kvm_vcpu *vcpu, unsigned long server,
623 unsigned long mfrr)
bc5ad3f3
BH
624{
625 union kvmppc_icp_state old_state, new_state;
626 struct kvmppc_xics *xics = vcpu->kvm->arch.xics;
627 struct kvmppc_icp *icp;
628 u32 reject;
629 bool resend;
630 bool local;
631
632 XICS_DBG("h_ipi vcpu %d to server %lu mfrr %#lx\n",
633 vcpu->vcpu_id, server, mfrr);
634
635 icp = vcpu->arch.icp;
636 local = icp->server_num == server;
637 if (!local) {
638 icp = kvmppc_xics_find_server(vcpu->kvm, server);
639 if (!icp)
640 return H_PARAMETER;
641 }
642
643 /*
644 * ICP state: Set_MFRR
645 *
646 * If the CPPR is more favored than the new MFRR, then
647 * nothing needs to be rejected as there can be no XISR to
648 * reject. If the MFRR is being made less favored then
649 * there might be a previously-rejected interrupt needing
650 * to be resent.
651 *
5b88cda6
SW
652 * ICP state: Check_IPI
653 *
bc5ad3f3 654 * If the CPPR is less favored, then we might be replacing
5b88cda6 655 * an interrupt, and thus need to possibly reject it.
bc5ad3f3 656 *
5b88cda6
SW
657 * ICP State: IPI
658 *
659 * Besides rejecting any pending interrupts, we also
660 * update XISR and pending_pri to mark IPI as pending.
661 *
662 * PAPR does not describe this state, but if the MFRR is being
663 * made less favored than its earlier value, there might be
664 * a previously-rejected interrupt needing to be resent.
665 * Ideally, we would want to resend only if
666 * prio(pending_interrupt) < mfrr &&
667 * prio(pending_interrupt) < cppr
668 * where pending interrupt is the one that was rejected. But
669 * we don't have that state, so we simply trigger a resend
670 * whenever the MFRR is made less favored.
bc5ad3f3
BH
671 */
672 do {
5ee07612 673 old_state = new_state = READ_ONCE(icp->state);
bc5ad3f3
BH
674
675 /* Set_MFRR */
676 new_state.mfrr = mfrr;
677
678 /* Check_IPI */
679 reject = 0;
680 resend = false;
681 if (mfrr < new_state.cppr) {
682 /* Reject a pending interrupt if not an IPI */
5b88cda6 683 if (mfrr <= new_state.pending_pri) {
bc5ad3f3 684 reject = new_state.xisr;
5b88cda6
SW
685 new_state.pending_pri = mfrr;
686 new_state.xisr = XICS_IPI;
687 }
bc5ad3f3
BH
688 }
689
5b88cda6 690 if (mfrr > old_state.mfrr) {
bc5ad3f3
BH
691 resend = new_state.need_resend;
692 new_state.need_resend = 0;
693 }
694 } while (!icp_try_update(icp, old_state, new_state, local));
695
696 /* Handle reject */
697 if (reject && reject != XICS_IPI)
21acd0e4 698 icp_deliver_irq(xics, icp, reject, false);
bc5ad3f3
BH
699
700 /* Handle resend */
701 if (resend)
702 icp_check_resend(xics, icp);
703
704 return H_SUCCESS;
705}
706
8e44ddc3
PM
707static int kvmppc_h_ipoll(struct kvm_vcpu *vcpu, unsigned long server)
708{
709 union kvmppc_icp_state state;
710 struct kvmppc_icp *icp;
711
712 icp = vcpu->arch.icp;
713 if (icp->server_num != server) {
714 icp = kvmppc_xics_find_server(vcpu->kvm, server);
715 if (!icp)
716 return H_PARAMETER;
717 }
5ee07612 718 state = READ_ONCE(icp->state);
8e44ddc3
PM
719 kvmppc_set_gpr(vcpu, 4, ((u32)state.cppr << 24) | state.xisr);
720 kvmppc_set_gpr(vcpu, 5, state.mfrr);
721 return H_SUCCESS;
722}
723
e7d26f28 724static noinline void kvmppc_h_cppr(struct kvm_vcpu *vcpu, unsigned long cppr)
bc5ad3f3
BH
725{
726 union kvmppc_icp_state old_state, new_state;
727 struct kvmppc_xics *xics = vcpu->kvm->arch.xics;
728 struct kvmppc_icp *icp = vcpu->arch.icp;
729 u32 reject;
730
731 XICS_DBG("h_cppr vcpu %d cppr %#lx\n", vcpu->vcpu_id, cppr);
732
733 /*
734 * ICP State: Set_CPPR
735 *
736 * We can safely compare the new value with the current
737 * value outside of the transaction as the CPPR is only
738 * ever changed by the processor on itself
739 */
740 if (cppr > icp->state.cppr)
741 icp_down_cppr(xics, icp, cppr);
742 else if (cppr == icp->state.cppr)
743 return;
744
745 /*
746 * ICP State: Up_CPPR
747 *
748 * The processor is raising its priority, this can result
749 * in a rejection of a pending interrupt:
750 *
751 * ICP State: Reject_Current
752 *
753 * We can remove EE from the current processor, the update
754 * transaction will set it again if needed
755 */
d24ea8a7 756 kvmppc_book3s_dequeue_irqprio(icp->vcpu, BOOK3S_INTERRUPT_EXTERNAL);
bc5ad3f3
BH
757
758 do {
5ee07612 759 old_state = new_state = READ_ONCE(icp->state);
bc5ad3f3
BH
760
761 reject = 0;
762 new_state.cppr = cppr;
763
764 if (cppr <= new_state.pending_pri) {
765 reject = new_state.xisr;
766 new_state.xisr = 0;
767 new_state.pending_pri = 0xff;
768 }
769
770 } while (!icp_try_update(icp, old_state, new_state, true));
771
772 /*
773 * Check for rejects. They are handled by doing a new delivery
774 * attempt (see comments in icp_deliver_irq).
775 */
776 if (reject && reject != XICS_IPI)
21acd0e4 777 icp_deliver_irq(xics, icp, reject, false);
bc5ad3f3
BH
778}
779
17d48610 780static int ics_eoi(struct kvm_vcpu *vcpu, u32 irq)
bc5ad3f3
BH
781{
782 struct kvmppc_xics *xics = vcpu->kvm->arch.xics;
783 struct kvmppc_icp *icp = vcpu->arch.icp;
784 struct kvmppc_ics *ics;
785 struct ics_irq_state *state;
bc5ad3f3 786 u16 src;
17d48610
LZ
787 u32 pq_old, pq_new;
788
789 /*
790 * ICS EOI handling: For LSI, if P bit is still set, we need to
791 * resend it.
792 *
793 * For MSI, we move Q bit into P (and clear Q). If it is set,
794 * resend it.
795 */
796
797 ics = kvmppc_xics_find_ics(xics, irq, &src);
798 if (!ics) {
799 XICS_DBG("ios_eoi: IRQ 0x%06x not found !\n", irq);
800 return H_PARAMETER;
801 }
802 state = &ics->irq_state[src];
803
804 if (state->lsi)
805 pq_new = state->pq_state;
806 else
807 do {
808 pq_old = state->pq_state;
809 pq_new = pq_old >> 1;
810 } while (cmpxchg(&state->pq_state, pq_old, pq_new) != pq_old);
811
812 if (pq_new & PQ_PRESENTED)
21acd0e4 813 icp_deliver_irq(xics, icp, irq, false);
17d48610
LZ
814
815 kvm_notify_acked_irq(vcpu->kvm, 0, irq);
816
817 return H_SUCCESS;
818}
819
820static noinline int kvmppc_h_eoi(struct kvm_vcpu *vcpu, unsigned long xirr)
821{
822 struct kvmppc_xics *xics = vcpu->kvm->arch.xics;
823 struct kvmppc_icp *icp = vcpu->arch.icp;
824 u32 irq = xirr & 0x00ffffff;
bc5ad3f3
BH
825
826 XICS_DBG("h_eoi vcpu %d eoi %#lx\n", vcpu->vcpu_id, xirr);
827
828 /*
829 * ICP State: EOI
830 *
831 * Note: If EOI is incorrectly used by SW to lower the CPPR
832 * value (ie more favored), we do not check for rejection of
833 * a pending interrupt, this is a SW error and PAPR sepcifies
834 * that we don't have to deal with it.
835 *
836 * The sending of an EOI to the ICS is handled after the
837 * CPPR update
838 *
839 * ICP State: Down_CPPR which we handle
840 * in a separate function as it's shared with H_CPPR.
841 */
842 icp_down_cppr(xics, icp, xirr >> 24);
843
844 /* IPIs have no EOI */
845 if (irq == XICS_IPI)
846 return H_SUCCESS;
25a2150b 847
17d48610 848 return ics_eoi(vcpu, irq);
bc5ad3f3
BH
849}
850
f7af5209 851int kvmppc_xics_rm_complete(struct kvm_vcpu *vcpu, u32 hcall)
e7d26f28
BH
852{
853 struct kvmppc_xics *xics = vcpu->kvm->arch.xics;
854 struct kvmppc_icp *icp = vcpu->arch.icp;
855
856 XICS_DBG("XICS_RM: H_%x completing, act: %x state: %lx tgt: %p\n",
857 hcall, icp->rm_action, icp->rm_dbgstate.raw, icp->rm_dbgtgt);
858
878610fe
SW
859 if (icp->rm_action & XICS_RM_KICK_VCPU) {
860 icp->n_rm_kick_vcpu++;
e7d26f28 861 kvmppc_fast_vcpu_kick(icp->rm_kick_target);
878610fe
SW
862 }
863 if (icp->rm_action & XICS_RM_CHECK_RESEND) {
864 icp->n_rm_check_resend++;
5b88cda6 865 icp_check_resend(xics, icp->rm_resend_icp);
878610fe 866 }
878610fe
SW
867 if (icp->rm_action & XICS_RM_NOTIFY_EOI) {
868 icp->n_rm_notify_eoi++;
25a2150b 869 kvm_notify_acked_irq(vcpu->kvm, 0, icp->rm_eoied_irq);
878610fe 870 }
e7d26f28
BH
871
872 icp->rm_action = 0;
873
874 return H_SUCCESS;
875}
f7af5209 876EXPORT_SYMBOL_GPL(kvmppc_xics_rm_complete);
e7d26f28 877
bc5ad3f3
BH
878int kvmppc_xics_hcall(struct kvm_vcpu *vcpu, u32 req)
879{
e7d26f28 880 struct kvmppc_xics *xics = vcpu->kvm->arch.xics;
bc5ad3f3
BH
881 unsigned long res;
882 int rc = H_SUCCESS;
883
884 /* Check if we have an ICP */
e7d26f28 885 if (!xics || !vcpu->arch.icp)
bc5ad3f3
BH
886 return H_HARDWARE;
887
8e44ddc3
PM
888 /* These requests don't have real-mode implementations at present */
889 switch (req) {
890 case H_XIRR_X:
891 res = kvmppc_h_xirr(vcpu);
892 kvmppc_set_gpr(vcpu, 4, res);
893 kvmppc_set_gpr(vcpu, 5, get_tb());
894 return rc;
895 case H_IPOLL:
896 rc = kvmppc_h_ipoll(vcpu, kvmppc_get_gpr(vcpu, 4));
897 return rc;
898 }
899
e7d26f28 900 /* Check for real mode returning too hard */
a78b55d1 901 if (xics->real_mode && is_kvmppc_hv_enabled(vcpu->kvm))
e7d26f28
BH
902 return kvmppc_xics_rm_complete(vcpu, req);
903
bc5ad3f3
BH
904 switch (req) {
905 case H_XIRR:
e7d26f28 906 res = kvmppc_h_xirr(vcpu);
bc5ad3f3
BH
907 kvmppc_set_gpr(vcpu, 4, res);
908 break;
909 case H_CPPR:
e7d26f28 910 kvmppc_h_cppr(vcpu, kvmppc_get_gpr(vcpu, 4));
bc5ad3f3
BH
911 break;
912 case H_EOI:
e7d26f28 913 rc = kvmppc_h_eoi(vcpu, kvmppc_get_gpr(vcpu, 4));
bc5ad3f3
BH
914 break;
915 case H_IPI:
e7d26f28
BH
916 rc = kvmppc_h_ipi(vcpu, kvmppc_get_gpr(vcpu, 4),
917 kvmppc_get_gpr(vcpu, 5));
bc5ad3f3
BH
918 break;
919 }
920
921 return rc;
922}
2ba9f0d8 923EXPORT_SYMBOL_GPL(kvmppc_xics_hcall);
bc5ad3f3
BH
924
925
926/* -- Initialisation code etc. -- */
927
af893c7d
SW
928static void xics_debugfs_irqmap(struct seq_file *m,
929 struct kvmppc_passthru_irqmap *pimap)
930{
931 int i;
932
933 if (!pimap)
934 return;
935 seq_printf(m, "========\nPIRQ mappings: %d maps\n===========\n",
936 pimap->n_mapped);
937 for (i = 0; i < pimap->n_mapped; i++) {
938 seq_printf(m, "r_hwirq=%x, v_hwirq=%x\n",
939 pimap->mapped[i].r_hwirq, pimap->mapped[i].v_hwirq);
940 }
941}
942
bc5ad3f3
BH
943static int xics_debug_show(struct seq_file *m, void *private)
944{
945 struct kvmppc_xics *xics = m->private;
946 struct kvm *kvm = xics->kvm;
947 struct kvm_vcpu *vcpu;
948 int icsid, i;
34cb7954 949 unsigned long flags;
878610fe 950 unsigned long t_rm_kick_vcpu, t_rm_check_resend;
5efa6605 951 unsigned long t_rm_notify_eoi;
6e0365b7 952 unsigned long t_reject, t_check_resend;
bc5ad3f3
BH
953
954 if (!kvm)
955 return 0;
956
878610fe
SW
957 t_rm_kick_vcpu = 0;
958 t_rm_notify_eoi = 0;
959 t_rm_check_resend = 0;
6e0365b7
SW
960 t_check_resend = 0;
961 t_reject = 0;
878610fe 962
af893c7d
SW
963 xics_debugfs_irqmap(m, kvm->arch.pimap);
964
bc5ad3f3
BH
965 seq_printf(m, "=========\nICP state\n=========\n");
966
967 kvm_for_each_vcpu(i, vcpu, kvm) {
968 struct kvmppc_icp *icp = vcpu->arch.icp;
969 union kvmppc_icp_state state;
970
971 if (!icp)
972 continue;
973
5ee07612 974 state.raw = READ_ONCE(icp->state.raw);
bc5ad3f3
BH
975 seq_printf(m, "cpu server %#lx XIRR:%#x PPRI:%#x CPPR:%#x MFRR:%#x OUT:%d NR:%d\n",
976 icp->server_num, state.xisr,
977 state.pending_pri, state.cppr, state.mfrr,
978 state.out_ee, state.need_resend);
878610fe
SW
979 t_rm_kick_vcpu += icp->n_rm_kick_vcpu;
980 t_rm_notify_eoi += icp->n_rm_notify_eoi;
981 t_rm_check_resend += icp->n_rm_check_resend;
6e0365b7
SW
982 t_check_resend += icp->n_check_resend;
983 t_reject += icp->n_reject;
bc5ad3f3
BH
984 }
985
5efa6605 986 seq_printf(m, "ICP Guest->Host totals: kick_vcpu=%lu check_resend=%lu notify_eoi=%lu\n",
878610fe 987 t_rm_kick_vcpu, t_rm_check_resend,
5efa6605 988 t_rm_notify_eoi);
6e0365b7
SW
989 seq_printf(m, "ICP Real Mode totals: check_resend=%lu resend=%lu\n",
990 t_check_resend, t_reject);
bc5ad3f3
BH
991 for (icsid = 0; icsid <= KVMPPC_XICS_MAX_ICS_ID; icsid++) {
992 struct kvmppc_ics *ics = xics->ics[icsid];
993
994 if (!ics)
995 continue;
996
997 seq_printf(m, "=========\nICS state for ICS 0x%x\n=========\n",
998 icsid);
999
34cb7954
SW
1000 local_irq_save(flags);
1001 arch_spin_lock(&ics->lock);
bc5ad3f3
BH
1002
1003 for (i = 0; i < KVMPPC_XICS_IRQ_PER_ICS; i++) {
1004 struct ics_irq_state *irq = &ics->irq_state[i];
1005
17d48610 1006 seq_printf(m, "irq 0x%06x: server %#x prio %#x save prio %#x pq_state %d resend %d masked pending %d\n",
bc5ad3f3 1007 irq->number, irq->server, irq->priority,
17d48610 1008 irq->saved_priority, irq->pq_state,
bc5ad3f3
BH
1009 irq->resend, irq->masked_pending);
1010
1011 }
34cb7954
SW
1012 arch_spin_unlock(&ics->lock);
1013 local_irq_restore(flags);
bc5ad3f3
BH
1014 }
1015 return 0;
1016}
1017
1018static int xics_debug_open(struct inode *inode, struct file *file)
1019{
1020 return single_open(file, xics_debug_show, inode->i_private);
1021}
1022
1023static const struct file_operations xics_debug_fops = {
1024 .open = xics_debug_open,
1025 .read = seq_read,
1026 .llseek = seq_lseek,
1027 .release = single_release,
1028};
1029
1030static void xics_debugfs_init(struct kvmppc_xics *xics)
1031{
1032 char *name;
1033
1034 name = kasprintf(GFP_KERNEL, "kvm-xics-%p", xics);
1035 if (!name) {
1036 pr_err("%s: no memory for name\n", __func__);
1037 return;
1038 }
1039
57ad583f 1040 xics->dentry = debugfs_create_file(name, 0444, powerpc_debugfs_root,
bc5ad3f3
BH
1041 xics, &xics_debug_fops);
1042
1043 pr_debug("%s: created %s\n", __func__, name);
1044 kfree(name);
1045}
1046
5975a2e0
PM
1047static struct kvmppc_ics *kvmppc_xics_create_ics(struct kvm *kvm,
1048 struct kvmppc_xics *xics, int irq)
bc5ad3f3
BH
1049{
1050 struct kvmppc_ics *ics;
1051 int i, icsid;
1052
1053 icsid = irq >> KVMPPC_XICS_ICS_SHIFT;
1054
1055 mutex_lock(&kvm->lock);
1056
1057 /* ICS already exists - somebody else got here first */
1058 if (xics->ics[icsid])
1059 goto out;
1060
1061 /* Create the ICS */
1062 ics = kzalloc(sizeof(struct kvmppc_ics), GFP_KERNEL);
1063 if (!ics)
1064 goto out;
1065
bc5ad3f3
BH
1066 ics->icsid = icsid;
1067
1068 for (i = 0; i < KVMPPC_XICS_IRQ_PER_ICS; i++) {
1069 ics->irq_state[i].number = (icsid << KVMPPC_XICS_ICS_SHIFT) | i;
1070 ics->irq_state[i].priority = MASKED;
1071 ics->irq_state[i].saved_priority = MASKED;
1072 }
1073 smp_wmb();
1074 xics->ics[icsid] = ics;
1075
1076 if (icsid > xics->max_icsid)
1077 xics->max_icsid = icsid;
1078
1079 out:
1080 mutex_unlock(&kvm->lock);
1081 return xics->ics[icsid];
1082}
1083
936774cd 1084static int kvmppc_xics_create_icp(struct kvm_vcpu *vcpu, unsigned long server_num)
bc5ad3f3
BH
1085{
1086 struct kvmppc_icp *icp;
1087
1088 if (!vcpu->kvm->arch.xics)
1089 return -ENODEV;
1090
1091 if (kvmppc_xics_find_server(vcpu->kvm, server_num))
1092 return -EEXIST;
1093
1094 icp = kzalloc(sizeof(struct kvmppc_icp), GFP_KERNEL);
1095 if (!icp)
1096 return -ENOMEM;
1097
1098 icp->vcpu = vcpu;
1099 icp->server_num = server_num;
1100 icp->state.mfrr = MASKED;
1101 icp->state.pending_pri = MASKED;
1102 vcpu->arch.icp = icp;
1103
1104 XICS_DBG("created server for vcpu %d\n", vcpu->vcpu_id);
1105
1106 return 0;
1107}
1108
8b78645c
PM
1109u64 kvmppc_xics_get_icp(struct kvm_vcpu *vcpu)
1110{
1111 struct kvmppc_icp *icp = vcpu->arch.icp;
1112 union kvmppc_icp_state state;
1113
1114 if (!icp)
1115 return 0;
1116 state = icp->state;
1117 return ((u64)state.cppr << KVM_REG_PPC_ICP_CPPR_SHIFT) |
1118 ((u64)state.xisr << KVM_REG_PPC_ICP_XISR_SHIFT) |
1119 ((u64)state.mfrr << KVM_REG_PPC_ICP_MFRR_SHIFT) |
1120 ((u64)state.pending_pri << KVM_REG_PPC_ICP_PPRI_SHIFT);
1121}
1122
1123int kvmppc_xics_set_icp(struct kvm_vcpu *vcpu, u64 icpval)
1124{
1125 struct kvmppc_icp *icp = vcpu->arch.icp;
1126 struct kvmppc_xics *xics = vcpu->kvm->arch.xics;
1127 union kvmppc_icp_state old_state, new_state;
1128 struct kvmppc_ics *ics;
1129 u8 cppr, mfrr, pending_pri;
1130 u32 xisr;
1131 u16 src;
1132 bool resend;
1133
1134 if (!icp || !xics)
1135 return -ENOENT;
1136
1137 cppr = icpval >> KVM_REG_PPC_ICP_CPPR_SHIFT;
1138 xisr = (icpval >> KVM_REG_PPC_ICP_XISR_SHIFT) &
1139 KVM_REG_PPC_ICP_XISR_MASK;
1140 mfrr = icpval >> KVM_REG_PPC_ICP_MFRR_SHIFT;
1141 pending_pri = icpval >> KVM_REG_PPC_ICP_PPRI_SHIFT;
1142
1143 /* Require the new state to be internally consistent */
1144 if (xisr == 0) {
1145 if (pending_pri != 0xff)
1146 return -EINVAL;
1147 } else if (xisr == XICS_IPI) {
1148 if (pending_pri != mfrr || pending_pri >= cppr)
1149 return -EINVAL;
1150 } else {
1151 if (pending_pri >= mfrr || pending_pri >= cppr)
1152 return -EINVAL;
1153 ics = kvmppc_xics_find_ics(xics, xisr, &src);
1154 if (!ics)
1155 return -EINVAL;
1156 }
1157
1158 new_state.raw = 0;
1159 new_state.cppr = cppr;
1160 new_state.xisr = xisr;
1161 new_state.mfrr = mfrr;
1162 new_state.pending_pri = pending_pri;
1163
1164 /*
1165 * Deassert the CPU interrupt request.
1166 * icp_try_update will reassert it if necessary.
1167 */
d24ea8a7 1168 kvmppc_book3s_dequeue_irqprio(icp->vcpu, BOOK3S_INTERRUPT_EXTERNAL);
8b78645c
PM
1169
1170 /*
1171 * Note that if we displace an interrupt from old_state.xisr,
1172 * we don't mark it as rejected. We expect userspace to set
1173 * the state of the interrupt sources to be consistent with
1174 * the ICP states (either before or afterwards, which doesn't
1175 * matter). We do handle resends due to CPPR becoming less
1176 * favoured because that is necessary to end up with a
1177 * consistent state in the situation where userspace restores
1178 * the ICS states before the ICP states.
1179 */
1180 do {
5ee07612 1181 old_state = READ_ONCE(icp->state);
8b78645c
PM
1182
1183 if (new_state.mfrr <= old_state.mfrr) {
1184 resend = false;
1185 new_state.need_resend = old_state.need_resend;
1186 } else {
1187 resend = old_state.need_resend;
1188 new_state.need_resend = 0;
1189 }
1190 } while (!icp_try_update(icp, old_state, new_state, false));
1191
1192 if (resend)
1193 icp_check_resend(xics, icp);
1194
1195 return 0;
1196}
1197
5975a2e0
PM
1198static int xics_get_source(struct kvmppc_xics *xics, long irq, u64 addr)
1199{
1200 int ret;
1201 struct kvmppc_ics *ics;
1202 struct ics_irq_state *irqp;
1203 u64 __user *ubufp = (u64 __user *) addr;
1204 u16 idx;
1205 u64 val, prio;
34cb7954 1206 unsigned long flags;
5975a2e0
PM
1207
1208 ics = kvmppc_xics_find_ics(xics, irq, &idx);
1209 if (!ics)
1210 return -ENOENT;
bc5ad3f3 1211
5975a2e0 1212 irqp = &ics->irq_state[idx];
34cb7954
SW
1213 local_irq_save(flags);
1214 arch_spin_lock(&ics->lock);
5975a2e0
PM
1215 ret = -ENOENT;
1216 if (irqp->exists) {
1217 val = irqp->server;
1218 prio = irqp->priority;
1219 if (prio == MASKED) {
1220 val |= KVM_XICS_MASKED;
1221 prio = irqp->saved_priority;
1222 }
1223 val |= prio << KVM_XICS_PRIORITY_SHIFT;
b1a4286b
PM
1224 if (irqp->lsi) {
1225 val |= KVM_XICS_LEVEL_SENSITIVE;
17d48610 1226 if (irqp->pq_state & PQ_PRESENTED)
b1a4286b
PM
1227 val |= KVM_XICS_PENDING;
1228 } else if (irqp->masked_pending || irqp->resend)
5975a2e0 1229 val |= KVM_XICS_PENDING;
17d48610
LZ
1230
1231 if (irqp->pq_state & PQ_PRESENTED)
1232 val |= KVM_XICS_PRESENTED;
1233
1234 if (irqp->pq_state & PQ_QUEUED)
1235 val |= KVM_XICS_QUEUED;
1236
5975a2e0
PM
1237 ret = 0;
1238 }
34cb7954
SW
1239 arch_spin_unlock(&ics->lock);
1240 local_irq_restore(flags);
5975a2e0
PM
1241
1242 if (!ret && put_user(val, ubufp))
1243 ret = -EFAULT;
1244
1245 return ret;
1246}
1247
1248static int xics_set_source(struct kvmppc_xics *xics, long irq, u64 addr)
bc5ad3f3 1249{
5975a2e0
PM
1250 struct kvmppc_ics *ics;
1251 struct ics_irq_state *irqp;
1252 u64 __user *ubufp = (u64 __user *) addr;
1253 u16 idx;
1254 u64 val;
1255 u8 prio;
1256 u32 server;
34cb7954 1257 unsigned long flags;
5975a2e0
PM
1258
1259 if (irq < KVMPPC_XICS_FIRST_IRQ || irq >= KVMPPC_XICS_NR_IRQS)
1260 return -ENOENT;
1261
1262 ics = kvmppc_xics_find_ics(xics, irq, &idx);
1263 if (!ics) {
1264 ics = kvmppc_xics_create_ics(xics->kvm, xics, irq);
1265 if (!ics)
1266 return -ENOMEM;
1267 }
1268 irqp = &ics->irq_state[idx];
1269 if (get_user(val, ubufp))
1270 return -EFAULT;
1271
1272 server = val & KVM_XICS_DESTINATION_MASK;
1273 prio = val >> KVM_XICS_PRIORITY_SHIFT;
1274 if (prio != MASKED &&
1275 kvmppc_xics_find_server(xics->kvm, server) == NULL)
1276 return -EINVAL;
bc5ad3f3 1277
34cb7954
SW
1278 local_irq_save(flags);
1279 arch_spin_lock(&ics->lock);
5975a2e0
PM
1280 irqp->server = server;
1281 irqp->saved_priority = prio;
1282 if (val & KVM_XICS_MASKED)
1283 prio = MASKED;
1284 irqp->priority = prio;
1285 irqp->resend = 0;
1286 irqp->masked_pending = 0;
b1a4286b 1287 irqp->lsi = 0;
17d48610
LZ
1288 irqp->pq_state = 0;
1289 if (val & KVM_XICS_LEVEL_SENSITIVE)
b1a4286b 1290 irqp->lsi = 1;
17d48610
LZ
1291 /* If PENDING, set P in case P is not saved because of old code */
1292 if (val & KVM_XICS_PRESENTED || val & KVM_XICS_PENDING)
1293 irqp->pq_state |= PQ_PRESENTED;
1294 if (val & KVM_XICS_QUEUED)
1295 irqp->pq_state |= PQ_QUEUED;
5975a2e0 1296 irqp->exists = 1;
34cb7954
SW
1297 arch_spin_unlock(&ics->lock);
1298 local_irq_restore(flags);
bc5ad3f3 1299
5975a2e0 1300 if (val & KVM_XICS_PENDING)
21acd0e4 1301 icp_deliver_irq(xics, NULL, irqp->number, false);
bc5ad3f3 1302
5975a2e0
PM
1303 return 0;
1304}
1305
5af50993
BH
1306int kvmppc_xics_set_irq(struct kvm *kvm, int irq_source_id, u32 irq, int level,
1307 bool line_status)
5975a2e0
PM
1308{
1309 struct kvmppc_xics *xics = kvm->arch.xics;
1310
e48ba1cb
PM
1311 if (!xics)
1312 return -ENODEV;
25a2150b
PM
1313 return ics_deliver_irq(xics, irq, level);
1314}
1315
5975a2e0
PM
1316static int xics_set_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
1317{
1318 struct kvmppc_xics *xics = dev->private;
1319
1320 switch (attr->group) {
1321 case KVM_DEV_XICS_GRP_SOURCES:
1322 return xics_set_source(xics, attr->attr, attr->addr);
bc5ad3f3 1323 }
5975a2e0
PM
1324 return -ENXIO;
1325}
bc5ad3f3 1326
5975a2e0
PM
1327static int xics_get_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
1328{
1329 struct kvmppc_xics *xics = dev->private;
1330
1331 switch (attr->group) {
1332 case KVM_DEV_XICS_GRP_SOURCES:
1333 return xics_get_source(xics, attr->attr, attr->addr);
1334 }
1335 return -ENXIO;
bc5ad3f3
BH
1336}
1337
5975a2e0 1338static int xics_has_attr(struct kvm_device *dev, struct kvm_device_attr *attr)
bc5ad3f3 1339{
5975a2e0
PM
1340 switch (attr->group) {
1341 case KVM_DEV_XICS_GRP_SOURCES:
1342 if (attr->attr >= KVMPPC_XICS_FIRST_IRQ &&
1343 attr->attr < KVMPPC_XICS_NR_IRQS)
1344 return 0;
1345 break;
1346 }
1347 return -ENXIO;
1348}
1349
1350static void kvmppc_xics_free(struct kvm_device *dev)
1351{
1352 struct kvmppc_xics *xics = dev->private;
bc5ad3f3
BH
1353 int i;
1354 struct kvm *kvm = xics->kvm;
1355
1356 debugfs_remove(xics->dentry);
1357
1358 if (kvm)
1359 kvm->arch.xics = NULL;
1360
1361 for (i = 0; i <= xics->max_icsid; i++)
1362 kfree(xics->ics[i]);
1363 kfree(xics);
5975a2e0 1364 kfree(dev);
bc5ad3f3
BH
1365}
1366
5975a2e0 1367static int kvmppc_xics_create(struct kvm_device *dev, u32 type)
bc5ad3f3
BH
1368{
1369 struct kvmppc_xics *xics;
5975a2e0 1370 struct kvm *kvm = dev->kvm;
bc5ad3f3
BH
1371 int ret = 0;
1372
1373 xics = kzalloc(sizeof(*xics), GFP_KERNEL);
1374 if (!xics)
1375 return -ENOMEM;
1376
5975a2e0
PM
1377 dev->private = xics;
1378 xics->dev = dev;
bc5ad3f3
BH
1379 xics->kvm = kvm;
1380
1381 /* Already there ? */
bc5ad3f3
BH
1382 if (kvm->arch.xics)
1383 ret = -EEXIST;
1384 else
1385 kvm->arch.xics = xics;
bc5ad3f3 1386
458ff3c0
GN
1387 if (ret) {
1388 kfree(xics);
bc5ad3f3 1389 return ret;
458ff3c0 1390 }
bc5ad3f3 1391
3a167bea 1392#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
e7d26f28
BH
1393 if (cpu_has_feature(CPU_FTR_ARCH_206)) {
1394 /* Enable real mode support */
1395 xics->real_mode = ENABLE_REALMODE;
1396 xics->real_mode_dbg = DEBUG_REALMODE;
1397 }
3a167bea 1398#endif /* CONFIG_KVM_BOOK3S_HV_POSSIBLE */
e7d26f28 1399
bc5ad3f3
BH
1400 return 0;
1401}
1402
023e9fdd
CD
1403static void kvmppc_xics_init(struct kvm_device *dev)
1404{
1405 struct kvmppc_xics *xics = (struct kvmppc_xics *)dev->private;
1406
1407 xics_debugfs_init(xics);
1408}
1409
5975a2e0
PM
1410struct kvm_device_ops kvm_xics_ops = {
1411 .name = "kvm-xics",
1412 .create = kvmppc_xics_create,
023e9fdd 1413 .init = kvmppc_xics_init,
5975a2e0
PM
1414 .destroy = kvmppc_xics_free,
1415 .set_attr = xics_set_attr,
1416 .get_attr = xics_get_attr,
1417 .has_attr = xics_has_attr,
1418};
1419
1420int kvmppc_xics_connect_vcpu(struct kvm_device *dev, struct kvm_vcpu *vcpu,
1421 u32 xcpu)
1422{
1423 struct kvmppc_xics *xics = dev->private;
1424 int r = -EBUSY;
1425
1426 if (dev->ops != &kvm_xics_ops)
1427 return -EPERM;
1428 if (xics->kvm != vcpu->kvm)
1429 return -EPERM;
1430 if (vcpu->arch.irq_type)
1431 return -EBUSY;
1432
1433 r = kvmppc_xics_create_icp(vcpu, xcpu);
1434 if (!r)
1435 vcpu->arch.irq_type = KVMPPC_IRQ_XICS;
1436
1437 return r;
1438}
1439
bc5ad3f3
BH
1440void kvmppc_xics_free_icp(struct kvm_vcpu *vcpu)
1441{
1442 if (!vcpu->arch.icp)
1443 return;
1444 kfree(vcpu->arch.icp);
1445 vcpu->arch.icp = NULL;
1446 vcpu->arch.irq_type = KVMPPC_IRQ_DEFAULT;
1447}
25a2150b 1448
5d375199
PM
1449void kvmppc_xics_set_mapped(struct kvm *kvm, unsigned long irq,
1450 unsigned long host_irq)
1451{
1452 struct kvmppc_xics *xics = kvm->arch.xics;
1453 struct kvmppc_ics *ics;
1454 u16 idx;
1455
1456 ics = kvmppc_xics_find_ics(xics, irq, &idx);
1457 if (!ics)
1458 return;
1459
1460 ics->irq_state[idx].host_irq = host_irq;
1461 ics->irq_state[idx].intr_cpu = -1;
1462}
1463EXPORT_SYMBOL_GPL(kvmppc_xics_set_mapped);
1464
1465void kvmppc_xics_clr_mapped(struct kvm *kvm, unsigned long irq,
1466 unsigned long host_irq)
1467{
1468 struct kvmppc_xics *xics = kvm->arch.xics;
1469 struct kvmppc_ics *ics;
1470 u16 idx;
1471
1472 ics = kvmppc_xics_find_ics(xics, irq, &idx);
1473 if (!ics)
1474 return;
1475
1476 ics->irq_state[idx].host_irq = 0;
1477}
1478EXPORT_SYMBOL_GPL(kvmppc_xics_clr_mapped);