/*
 * Copyright (C) 2012 ARM Ltd.
 * Author: Marc Zyngier <marc.zyngier@arm.com>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */

#include <linux/cpu.h>
#include <linux/kvm.h>
#include <linux/kvm_host.h>
#include <linux/interrupt.h>
#include <linux/irq.h>
#include <linux/uaccess.h>

#include <clocksource/arm_arch_timer.h>
#include <asm/arch_timer.h>
#include <asm/kvm_hyp.h>

#include <kvm/arm_vgic.h>
#include <kvm/arm_arch_timer.h>

#include "trace.h"

static struct timecounter *timecounter;
static unsigned int host_vtimer_irq;
static u32 host_vtimer_irq_flags;

static DEFINE_STATIC_KEY_FALSE(has_gic_active_state);

static const struct kvm_irq_level default_ptimer_irq = {
        .irq    = 30,
        .level  = 1,
};

static const struct kvm_irq_level default_vtimer_irq = {
        .irq    = 27,
        .level  = 1,
};

static bool kvm_timer_irq_can_fire(struct arch_timer_context *timer_ctx);
static void kvm_timer_update_irq(struct kvm_vcpu *vcpu, bool new_level,
                                 struct arch_timer_context *timer_ctx);
static bool kvm_timer_should_fire(struct arch_timer_context *timer_ctx);

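/* Read the raw value of the host physical counter. */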
u64 kvm_phys_timer_read(void)
{
        return timecounter->cc->read(timecounter->cc);
}

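/*
 * True when the VM's interrupt controller is emulated in userspace rather
 * than by the in-kernel vgic.
 */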
static inline bool userspace_irqchip(struct kvm *kvm)
{
        return static_branch_unlikely(&userspace_irqchip_in_use) &&
               unlikely(!irqchip_in_kernel(kvm));
}

static void soft_timer_start(struct hrtimer *hrt, u64 ns)
{
        hrtimer_start(hrt, ktime_add_ns(ktime_get(), ns),
                      HRTIMER_MODE_ABS);
}

static void soft_timer_cancel(struct hrtimer *hrt)
{
        hrtimer_cancel(hrt);
}

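/* Host IRQ handler for the virtual timer PPI, run while a vcpu may be loaded. */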
static irqreturn_t kvm_arch_timer_handler(int irq, void *dev_id)
{
        struct kvm_vcpu *vcpu = *(struct kvm_vcpu **)dev_id;
        struct arch_timer_context *vtimer;

        /*
         * We may see a timer interrupt after vcpu_put() has been called which
         * sets the CPU's vcpu pointer to NULL, because even though the timer
         * has been disabled in vtimer_save_state(), the hardware interrupt
         * signal may not have been retired from the interrupt controller yet.
         */
        if (!vcpu)
                return IRQ_HANDLED;

        vtimer = vcpu_vtimer(vcpu);
        if (kvm_timer_should_fire(vtimer))
                kvm_timer_update_irq(vcpu, true, vtimer);

        if (userspace_irqchip(vcpu->kvm) &&
            !static_branch_unlikely(&has_gic_active_state))
                disable_percpu_irq(host_vtimer_irq);

        return IRQ_HANDLED;
}

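/*
 * Number of nanoseconds until the timer's compare value is reached, or 0 if
 * it has already expired.
 */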
static u64 kvm_timer_compute_delta(struct arch_timer_context *timer_ctx)
{
        u64 cval, now;

        cval = timer_ctx->cnt_cval;
        now = kvm_phys_timer_read() - timer_ctx->cntvoff;

        if (now < cval) {
                u64 ns;

                ns = cyclecounter_cyc2ns(timecounter->cc,
                                         cval - now,
                                         timecounter->mask,
                                         &timecounter->frac);
                return ns;
        }

        return 0;
}

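/* A timer can only fire when it is enabled and its interrupt is not masked. */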
static bool kvm_timer_irq_can_fire(struct arch_timer_context *timer_ctx)
{
        return !(timer_ctx->cnt_ctl & ARCH_TIMER_CTRL_IT_MASK) &&
                (timer_ctx->cnt_ctl & ARCH_TIMER_CTRL_ENABLE);
}

/*
 * Returns the earliest expiration time in ns among guest timers.
 * Note that it will return 0 if none of the timers can fire.
 */
static u64 kvm_timer_earliest_exp(struct kvm_vcpu *vcpu)
{
        u64 min_virt = ULLONG_MAX, min_phys = ULLONG_MAX;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        if (kvm_timer_irq_can_fire(vtimer))
                min_virt = kvm_timer_compute_delta(vtimer);

        if (kvm_timer_irq_can_fire(ptimer))
                min_phys = kvm_timer_compute_delta(ptimer);

        /* If none of the timers can fire, return 0 */
        if ((min_virt == ULLONG_MAX) && (min_phys == ULLONG_MAX))
                return 0;

        return min(min_virt, min_phys);
}

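/* Expiry handler for the background hrtimer armed while a vcpu is blocked. */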
static enum hrtimer_restart kvm_bg_timer_expire(struct hrtimer *hrt)
{
        struct arch_timer_cpu *timer;
        struct kvm_vcpu *vcpu;
        u64 ns;

        timer = container_of(hrt, struct arch_timer_cpu, bg_timer);
        vcpu = container_of(timer, struct kvm_vcpu, arch.timer_cpu);

        /*
         * Check that the timer has really expired from the guest's
         * PoV (NTP on the host may have forced it to expire
         * early). If we should have slept longer, restart it.
         */
        ns = kvm_timer_earliest_exp(vcpu);
        if (unlikely(ns)) {
                hrtimer_forward_now(hrt, ns_to_ktime(ns));
                return HRTIMER_RESTART;
        }

        kvm_vcpu_wake_up(vcpu);
        return HRTIMER_NORESTART;
}

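/* Expiry handler for the hrtimer emulating the guest's physical timer. */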
static enum hrtimer_restart kvm_phys_timer_expire(struct hrtimer *hrt)
{
        struct arch_timer_context *ptimer;
        struct arch_timer_cpu *timer;
        struct kvm_vcpu *vcpu;
        u64 ns;

        timer = container_of(hrt, struct arch_timer_cpu, phys_timer);
        vcpu = container_of(timer, struct kvm_vcpu, arch.timer_cpu);
        ptimer = vcpu_ptimer(vcpu);

        /*
         * Check that the timer has really expired from the guest's
         * PoV (NTP on the host may have forced it to expire
         * early). If not ready, schedule for a later time.
         */
        ns = kvm_timer_compute_delta(ptimer);
        if (unlikely(ns)) {
                hrtimer_forward_now(hrt, ns_to_ktime(ns));
                return HRTIMER_RESTART;
        }

        kvm_timer_update_irq(vcpu, true, ptimer);
        return HRTIMER_NORESTART;
}

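/* Returns true if the timer's output line should currently be asserted. */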
static bool kvm_timer_should_fire(struct arch_timer_context *timer_ctx)
{
        u64 cval, now;

        if (timer_ctx->loaded) {
                u32 cnt_ctl;

                /* Only the virtual timer can be loaded so far */
                cnt_ctl = read_sysreg_el0(cntv_ctl);
                return  (cnt_ctl & ARCH_TIMER_CTRL_ENABLE) &&
                        (cnt_ctl & ARCH_TIMER_CTRL_IT_STAT) &&
                       !(cnt_ctl & ARCH_TIMER_CTRL_IT_MASK);
        }

        if (!kvm_timer_irq_can_fire(timer_ctx))
                return false;

        cval = timer_ctx->cnt_cval;
        now = kvm_phys_timer_read() - timer_ctx->cntvoff;

        return cval <= now;
}

bool kvm_timer_is_pending(struct kvm_vcpu *vcpu)
{
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        if (kvm_timer_should_fire(vtimer))
                return true;

        return kvm_timer_should_fire(ptimer);
}

/*
 * Reflect the timer output level into the kvm_run structure
 */
void kvm_timer_update_run(struct kvm_vcpu *vcpu)
{
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);
        struct kvm_sync_regs *regs = &vcpu->run->s.regs;

        /* Populate the device bitmap with the timer states */
        regs->device_irq_level &= ~(KVM_ARM_DEV_EL1_VTIMER |
                                    KVM_ARM_DEV_EL1_PTIMER);
        if (kvm_timer_should_fire(vtimer))
                regs->device_irq_level |= KVM_ARM_DEV_EL1_VTIMER;
        if (kvm_timer_should_fire(ptimer))
                regs->device_irq_level |= KVM_ARM_DEV_EL1_PTIMER;
}

static void kvm_timer_update_irq(struct kvm_vcpu *vcpu, bool new_level,
                                 struct arch_timer_context *timer_ctx)
{
        int ret;

        timer_ctx->irq.level = new_level;
        trace_kvm_timer_update_irq(vcpu->vcpu_id, timer_ctx->irq.irq,
                                   timer_ctx->irq.level);

        if (!userspace_irqchip(vcpu->kvm)) {
                ret = kvm_vgic_inject_irq(vcpu->kvm, vcpu->vcpu_id,
                                          timer_ctx->irq.irq,
                                          timer_ctx->irq.level,
                                          timer_ctx);
                WARN_ON(ret);
        }
}

/* Schedule the soft timer used to emulate the physical timer. */
static void phys_timer_emulate(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        /*
         * If the timer can fire now, we don't need to have a soft timer
         * scheduled for the future. If the timer cannot fire at all,
         * then we also don't need a soft timer.
         */
        if (kvm_timer_should_fire(ptimer) || !kvm_timer_irq_can_fire(ptimer)) {
                soft_timer_cancel(&timer->phys_timer);
                return;
        }

        soft_timer_start(&timer->phys_timer, kvm_timer_compute_delta(ptimer));
}

/*
 * Check if there was a change in the timer state, so that we should either
 * raise or lower the line level to the GIC or schedule a background timer to
 * emulate the physical timer.
 */
static void kvm_timer_update_state(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);
        bool level;

        if (unlikely(!timer->enabled))
                return;

        /*
         * The vtimer virtual interrupt is a 'mapped' interrupt, meaning part
         * of its lifecycle is offloaded to the hardware, and we therefore may
         * not have lowered the irq.level value before having to signal a new
         * interrupt, but have to signal an interrupt every time the level is
         * asserted.
         */
        level = kvm_timer_should_fire(vtimer);
        kvm_timer_update_irq(vcpu, level, vtimer);

        phys_timer_emulate(vcpu);

        if (kvm_timer_should_fire(ptimer) != ptimer->irq.level)
                kvm_timer_update_irq(vcpu, !ptimer->irq.level, ptimer);
}

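/* Save the loaded virtual timer state from the CPU registers and disable it. */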
static void vtimer_save_state(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        unsigned long flags;

        local_irq_save(flags);

        if (!vtimer->loaded)
                goto out;

        if (timer->enabled) {
                vtimer->cnt_ctl = read_sysreg_el0(cntv_ctl);
                vtimer->cnt_cval = read_sysreg_el0(cntv_cval);
        }

        /* Disable the virtual timer */
        write_sysreg_el0(0, cntv_ctl);
        isb();

        vtimer->loaded = false;
out:
        local_irq_restore(flags);
}

/*
 * Schedule the background timer before calling kvm_vcpu_block, so that this
 * thread is removed from its waitqueue and made runnable when there's a timer
 * interrupt to handle.
 */
void kvm_timer_schedule(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        vtimer_save_state(vcpu);

        /*
         * No need to schedule a background timer if any guest timer has
         * already expired, because kvm_vcpu_block will return before putting
         * the thread to sleep.
         */
        if (kvm_timer_should_fire(vtimer) || kvm_timer_should_fire(ptimer))
                return;

        /*
         * If both timers are not capable of raising interrupts (disabled or
         * masked), then there's no more work for us to do.
         */
        if (!kvm_timer_irq_can_fire(vtimer) && !kvm_timer_irq_can_fire(ptimer))
                return;

        /*
         * The guest timers have not yet expired, schedule a background timer.
         * Set the earliest expiration time among the guest timers.
         */
        soft_timer_start(&timer->bg_timer, kvm_timer_earliest_exp(vcpu));
}

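/* Load the saved virtual timer state back into the CPU registers. */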
static void vtimer_restore_state(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        unsigned long flags;

        local_irq_save(flags);

        if (vtimer->loaded)
                goto out;

        if (timer->enabled) {
                write_sysreg_el0(vtimer->cnt_cval, cntv_cval);
                isb();
                write_sysreg_el0(vtimer->cnt_ctl, cntv_ctl);
        }

        vtimer->loaded = true;
out:
        local_irq_restore(flags);
}

void kvm_timer_unschedule(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;

        vtimer_restore_state(vcpu);

        soft_timer_cancel(&timer->bg_timer);
}

static void set_cntvoff(u64 cntvoff)
{
        u32 low = lower_32_bits(cntvoff);
        u32 high = upper_32_bits(cntvoff);

        /*
         * Since kvm_call_hyp doesn't fully support the ARM PCS especially on
         * 32-bit systems, but rather passes register by register shifted one
         * place (we put the function address in r0/x0), we cannot simply pass
         * a 64-bit value as an argument, but have to split the value in two
         * 32-bit halves.
         */
        kvm_call_hyp(__kvm_timer_set_cntvoff, low, high);
}

static inline void set_vtimer_irq_phys_active(struct kvm_vcpu *vcpu, bool active)
{
        int r;
        r = irq_set_irqchip_state(host_vtimer_irq, IRQCHIP_STATE_ACTIVE, active);
        WARN_ON(r);
}

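/*
 * Mirror the vtimer interrupt's state (active in the vgic, or the emulated
 * line level with a userspace irqchip) into the active state of the host
 * timer interrupt before entering the guest.
 */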
static void kvm_timer_vcpu_load_gic(struct kvm_vcpu *vcpu)
{
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        bool phys_active;

        if (irqchip_in_kernel(vcpu->kvm))
                phys_active = kvm_vgic_map_is_active(vcpu, vtimer->irq.irq);
        else
                phys_active = vtimer->irq.level;
        set_vtimer_irq_phys_active(vcpu, phys_active);
}

static void kvm_timer_vcpu_load_nogic(struct kvm_vcpu *vcpu)
{
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);

        /*
         * When using a userspace irqchip with the architected timers and a
         * host interrupt controller that doesn't support an active state, we
         * must still prevent continuously exiting from the guest, and
         * therefore mask the physical interrupt by disabling it on the host
         * interrupt controller when the virtual level is high, such that the
         * guest can make forward progress. Once we detect the output level
         * being de-asserted, we unmask the interrupt again so that we exit
         * from the guest when the timer fires.
         */
        if (vtimer->irq.level)
                disable_percpu_irq(host_vtimer_irq);
        else
                enable_percpu_irq(host_vtimer_irq, host_vtimer_irq_flags);
}

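/*
 * Called when the vcpu is loaded on a physical CPU: restore the virtual timer
 * hardware state and arm the emulation of the physical timer.
 */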
void kvm_timer_vcpu_load(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        if (unlikely(!timer->enabled))
                return;

        if (static_branch_likely(&has_gic_active_state))
                kvm_timer_vcpu_load_gic(vcpu);
        else
                kvm_timer_vcpu_load_nogic(vcpu);

        set_cntvoff(vtimer->cntvoff);

        vtimer_restore_state(vcpu);

        /* Set the background timer for the physical timer emulation. */
        phys_timer_emulate(vcpu);

        /* If the timer fired while we weren't running, inject it now */
        if (kvm_timer_should_fire(ptimer) != ptimer->irq.level)
                kvm_timer_update_irq(vcpu, !ptimer->irq.level, ptimer);
}

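/*
 * With a userspace irqchip, tell the caller whether the timer line levels
 * have changed since they were last reported in the kvm_run structure.
 */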
bool kvm_timer_should_notify_user(struct kvm_vcpu *vcpu)
{
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);
        struct kvm_sync_regs *sregs = &vcpu->run->s.regs;
        bool vlevel, plevel;

        if (likely(irqchip_in_kernel(vcpu->kvm)))
                return false;

        vlevel = sregs->device_irq_level & KVM_ARM_DEV_EL1_VTIMER;
        plevel = sregs->device_irq_level & KVM_ARM_DEV_EL1_PTIMER;

        return kvm_timer_should_fire(vtimer) != vlevel ||
               kvm_timer_should_fire(ptimer) != plevel;
}

void kvm_timer_vcpu_put(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;

        if (unlikely(!timer->enabled))
                return;

        vtimer_save_state(vcpu);

        /*
         * Cancel the physical timer emulation, because the only case where we
         * need it after a vcpu_put is in the context of a sleeping VCPU, and
         * in that case we already factor in the deadline for the physical
         * timer when scheduling the bg_timer.
         *
         * In any case, we re-schedule the hrtimer for the physical timer when
         * coming back to the VCPU thread in kvm_timer_vcpu_load().
         */
        soft_timer_cancel(&timer->phys_timer);

        /*
         * The kernel may decide to run userspace after calling vcpu_put, so
         * we reset cntvoff to 0 to ensure a consistent read between user
         * accesses to the virtual counter and kernel access to the physical
         * counter in the non-VHE case. For VHE, the virtual counter uses a
         * fixed virtual offset of zero, so there is no need to zero the
         * CNTVOFF_EL2 register.
         */
        if (!has_vhe())
                set_cntvoff(0);
}

/*
 * With a userspace irqchip we have to check if the guest de-asserted the
 * timer and if so, unmask the timer irq signal on the host interrupt
 * controller to ensure that we see future timer signals.
 */
static void unmask_vtimer_irq_user(struct kvm_vcpu *vcpu)
{
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);

        if (!kvm_timer_should_fire(vtimer)) {
                kvm_timer_update_irq(vcpu, false, vtimer);
                if (static_branch_likely(&has_gic_active_state))
                        set_vtimer_irq_phys_active(vcpu, false);
                else
                        enable_percpu_irq(host_vtimer_irq, host_vtimer_irq_flags);
        }
}

void kvm_timer_sync_hwstate(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;

        if (unlikely(!timer->enabled))
                return;

        if (unlikely(!irqchip_in_kernel(vcpu->kvm)))
                unmask_vtimer_irq_user(vcpu);
}

int kvm_timer_vcpu_reset(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        /*
         * The bits in CNTV_CTL are architecturally reset to UNKNOWN for ARMv8
         * and to 0 for ARMv7. We provide an implementation that always
         * resets the timer to be disabled and unmasked and is compliant with
         * the ARMv7 architecture.
         */
        vtimer->cnt_ctl = 0;
        ptimer->cnt_ctl = 0;
        kvm_timer_update_state(vcpu);

        if (timer->enabled && irqchip_in_kernel(vcpu->kvm))
                kvm_vgic_reset_mapped_irq(vcpu, vtimer->irq.irq);

        return 0;
}

/* Make the updates of cntvoff for all vtimer contexts atomic */
static void update_vtimer_cntvoff(struct kvm_vcpu *vcpu, u64 cntvoff)
{
        int i;
        struct kvm *kvm = vcpu->kvm;
        struct kvm_vcpu *tmp;

        mutex_lock(&kvm->lock);
        kvm_for_each_vcpu(i, tmp, kvm)
                vcpu_vtimer(tmp)->cntvoff = cntvoff;

        /*
         * When called from the vcpu create path, the VCPU being created is
         * not included in the loop above, so we just set it here as well.
         */
        vcpu_vtimer(vcpu)->cntvoff = cntvoff;
        mutex_unlock(&kvm->lock);
}

void kvm_timer_vcpu_init(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        /* Synchronize cntvoff across all vtimers of a VM. */
        update_vtimer_cntvoff(vcpu, kvm_phys_timer_read());
        vcpu_ptimer(vcpu)->cntvoff = 0;

        hrtimer_init(&timer->bg_timer, CLOCK_MONOTONIC, HRTIMER_MODE_ABS);
        timer->bg_timer.function = kvm_bg_timer_expire;

        hrtimer_init(&timer->phys_timer, CLOCK_MONOTONIC, HRTIMER_MODE_ABS);
        timer->phys_timer.function = kvm_phys_timer_expire;

        vtimer->irq.irq = default_vtimer_irq.irq;
        ptimer->irq.irq = default_ptimer_irq.irq;
}

static void kvm_timer_init_interrupt(void *info)
{
        enable_percpu_irq(host_vtimer_irq, host_vtimer_irq_flags);
}

int kvm_arm_timer_set_reg(struct kvm_vcpu *vcpu, u64 regid, u64 value)
{
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);

        switch (regid) {
        case KVM_REG_ARM_TIMER_CTL:
                vtimer->cnt_ctl = value & ~ARCH_TIMER_CTRL_IT_STAT;
                break;
        case KVM_REG_ARM_TIMER_CNT:
                update_vtimer_cntvoff(vcpu, kvm_phys_timer_read() - value);
                break;
        case KVM_REG_ARM_TIMER_CVAL:
                vtimer->cnt_cval = value;
                break;
        case KVM_REG_ARM_PTIMER_CTL:
                ptimer->cnt_ctl = value & ~ARCH_TIMER_CTRL_IT_STAT;
                break;
        case KVM_REG_ARM_PTIMER_CVAL:
                ptimer->cnt_cval = value;
                break;

        default:
                return -1;
        }

        kvm_timer_update_state(vcpu);
        return 0;
}

static u64 read_timer_ctl(struct arch_timer_context *timer)
{
        /*
         * Set ISTATUS bit if it's expired.
         * Note that according to ARMv8 ARM Issue A.k, ISTATUS bit is
         * UNKNOWN when ENABLE bit is 0, so we chose to set ISTATUS bit
         * regardless of ENABLE bit for our implementation convenience.
         */
        if (!kvm_timer_compute_delta(timer))
                return timer->cnt_ctl | ARCH_TIMER_CTRL_IT_STAT;
        else
                return timer->cnt_ctl;
}

u64 kvm_arm_timer_get_reg(struct kvm_vcpu *vcpu, u64 regid)
{
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);

        switch (regid) {
        case KVM_REG_ARM_TIMER_CTL:
                return read_timer_ctl(vtimer);
        case KVM_REG_ARM_TIMER_CNT:
                return kvm_phys_timer_read() - vtimer->cntvoff;
        case KVM_REG_ARM_TIMER_CVAL:
                return vtimer->cnt_cval;
        case KVM_REG_ARM_PTIMER_CTL:
                return read_timer_ctl(ptimer);
        case KVM_REG_ARM_PTIMER_CVAL:
                return ptimer->cnt_cval;
        case KVM_REG_ARM_PTIMER_CNT:
                return kvm_phys_timer_read();
        }
        return (u64)-1;
}

static int kvm_timer_starting_cpu(unsigned int cpu)
{
        kvm_timer_init_interrupt(NULL);
        return 0;
}

static int kvm_timer_dying_cpu(unsigned int cpu)
{
        disable_percpu_irq(host_vtimer_irq);
        return 0;
}

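/*
 * One-time host-side initialization: pick up the virtual timer IRQ from the
 * arch timer driver, request it as a per-CPU interrupt and register the CPU
 * hotplug callbacks that enable/disable it.
 */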
int kvm_timer_hyp_init(bool has_gic)
{
        struct arch_timer_kvm_info *info;
        int err;

        info = arch_timer_get_kvm_info();
        timecounter = &info->timecounter;

        if (!timecounter->cc) {
                kvm_err("kvm_arch_timer: uninitialized timecounter\n");
                return -ENODEV;
        }

        if (info->virtual_irq <= 0) {
                kvm_err("kvm_arch_timer: invalid virtual timer IRQ: %d\n",
                        info->virtual_irq);
                return -ENODEV;
        }
        host_vtimer_irq = info->virtual_irq;

        host_vtimer_irq_flags = irq_get_trigger_type(host_vtimer_irq);
        if (host_vtimer_irq_flags != IRQF_TRIGGER_HIGH &&
            host_vtimer_irq_flags != IRQF_TRIGGER_LOW) {
                kvm_err("Invalid trigger for IRQ%d, assuming level low\n",
                        host_vtimer_irq);
                host_vtimer_irq_flags = IRQF_TRIGGER_LOW;
        }

        err = request_percpu_irq(host_vtimer_irq, kvm_arch_timer_handler,
                                 "kvm guest timer", kvm_get_running_vcpus());
        if (err) {
                kvm_err("kvm_arch_timer: can't request interrupt %d (%d)\n",
                        host_vtimer_irq, err);
                return err;
        }

        if (has_gic) {
                err = irq_set_vcpu_affinity(host_vtimer_irq,
                                            kvm_get_running_vcpus());
                if (err) {
                        kvm_err("kvm_arch_timer: error setting vcpu affinity\n");
                        goto out_free_irq;
                }

                static_branch_enable(&has_gic_active_state);
        }

        kvm_debug("virtual timer IRQ%d\n", host_vtimer_irq);

        cpuhp_setup_state(CPUHP_AP_KVM_ARM_TIMER_STARTING,
                          "kvm/arm/timer:starting", kvm_timer_starting_cpu,
                          kvm_timer_dying_cpu);
        return 0;
out_free_irq:
        free_percpu_irq(host_vtimer_irq, kvm_get_running_vcpus());
        return err;
}

void kvm_timer_vcpu_terminate(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;

        soft_timer_cancel(&timer->bg_timer);
}

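/*
 * Claim ownership of the timer PPIs in the vgic and check that every vcpu in
 * the VM uses the same vtimer and ptimer interrupt numbers.
 */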
static bool timer_irqs_are_valid(struct kvm_vcpu *vcpu)
{
        int vtimer_irq, ptimer_irq;
        int i, ret;

        vtimer_irq = vcpu_vtimer(vcpu)->irq.irq;
        ret = kvm_vgic_set_owner(vcpu, vtimer_irq, vcpu_vtimer(vcpu));
        if (ret)
                return false;

        ptimer_irq = vcpu_ptimer(vcpu)->irq.irq;
        ret = kvm_vgic_set_owner(vcpu, ptimer_irq, vcpu_ptimer(vcpu));
        if (ret)
                return false;

        kvm_for_each_vcpu(i, vcpu, vcpu->kvm) {
                if (vcpu_vtimer(vcpu)->irq.irq != vtimer_irq ||
                    vcpu_ptimer(vcpu)->irq.irq != ptimer_irq)
                        return false;
        }

        return true;
}

bool kvm_arch_timer_get_input_level(int vintid)
{
        struct kvm_vcpu *vcpu = kvm_arm_get_running_vcpu();
        struct arch_timer_context *timer;

        if (vintid == vcpu_vtimer(vcpu)->irq.irq)
                timer = vcpu_vtimer(vcpu);
        else
                BUG(); /* We only map the vtimer so far */

        return kvm_timer_should_fire(timer);
}

int kvm_timer_enable(struct kvm_vcpu *vcpu)
{
        struct arch_timer_cpu *timer = &vcpu->arch.timer_cpu;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        int ret;

        if (timer->enabled)
                return 0;

        /* Without a VGIC we do not map virtual IRQs to physical IRQs */
        if (!irqchip_in_kernel(vcpu->kvm))
                goto no_vgic;

        if (!vgic_initialized(vcpu->kvm))
                return -ENODEV;

        if (!timer_irqs_are_valid(vcpu)) {
                kvm_debug("incorrectly configured timer irqs\n");
                return -EINVAL;
        }

        ret = kvm_vgic_map_phys_irq(vcpu, host_vtimer_irq, vtimer->irq.irq,
                                    kvm_arch_timer_get_input_level);
        if (ret)
                return ret;

no_vgic:
        timer->enabled = 1;
        return 0;
}

/*
 * On a VHE system, we only need to configure traps on physical timer and
 * counter accesses in EL0 and EL1 once, not for every world switch.
 * The host kernel runs at EL2 with HCR_EL2.TGE == 1,
 * and this makes those bits have no effect for the host kernel execution.
 */
void kvm_timer_init_vhe(void)
{
        /* When HCR_EL2.E2H == 1, EL1PCEN and EL1PCTEN are shifted by 10 */
        u32 cnthctl_shift = 10;
        u64 val;

        /*
         * Disallow physical timer access for the guest.
         * Physical counter access is allowed.
         */
        val = read_sysreg(cnthctl_el2);
        val &= ~(CNTHCTL_EL1PCEN << cnthctl_shift);
        val |= (CNTHCTL_EL1PCTEN << cnthctl_shift);
        write_sysreg(val, cnthctl_el2);
}

static void set_timer_irqs(struct kvm *kvm, int vtimer_irq, int ptimer_irq)
{
        struct kvm_vcpu *vcpu;
        int i;

        kvm_for_each_vcpu(i, vcpu, kvm) {
                vcpu_vtimer(vcpu)->irq.irq = vtimer_irq;
                vcpu_ptimer(vcpu)->irq.irq = ptimer_irq;
        }
}

int kvm_arm_timer_set_attr(struct kvm_vcpu *vcpu, struct kvm_device_attr *attr)
{
        int __user *uaddr = (int __user *)(long)attr->addr;
        struct arch_timer_context *vtimer = vcpu_vtimer(vcpu);
        struct arch_timer_context *ptimer = vcpu_ptimer(vcpu);
        int irq;

        if (!irqchip_in_kernel(vcpu->kvm))
                return -EINVAL;

        if (get_user(irq, uaddr))
                return -EFAULT;

        if (!(irq_is_ppi(irq)))
                return -EINVAL;

        if (vcpu->arch.timer_cpu.enabled)
                return -EBUSY;

        switch (attr->attr) {
        case KVM_ARM_VCPU_TIMER_IRQ_VTIMER:
                set_timer_irqs(vcpu->kvm, irq, ptimer->irq.irq);
                break;
        case KVM_ARM_VCPU_TIMER_IRQ_PTIMER:
                set_timer_irqs(vcpu->kvm, vtimer->irq.irq, irq);
                break;
        default:
                return -ENXIO;
        }

        return 0;
}

int kvm_arm_timer_get_attr(struct kvm_vcpu *vcpu, struct kvm_device_attr *attr)
{
        int __user *uaddr = (int __user *)(long)attr->addr;
        struct arch_timer_context *timer;
        int irq;

        switch (attr->attr) {
        case KVM_ARM_VCPU_TIMER_IRQ_VTIMER:
                timer = vcpu_vtimer(vcpu);
                break;
        case KVM_ARM_VCPU_TIMER_IRQ_PTIMER:
                timer = vcpu_ptimer(vcpu);
                break;
        default:
                return -ENXIO;
        }

        irq = timer->irq.irq;
        return put_user(irq, uaddr);
}

int kvm_arm_timer_has_attr(struct kvm_vcpu *vcpu, struct kvm_device_attr *attr)
{
        switch (attr->attr) {
        case KVM_ARM_VCPU_TIMER_IRQ_VTIMER:
        case KVM_ARM_VCPU_TIMER_IRQ_PTIMER:
                return 0;
        }

        return -ENXIO;
}