KVM: arm64: timers: Correctly handle TGE flip with CNTPOFF_EL2
authorMarc Zyngier <maz@kernel.org>
Tue, 22 Aug 2023 12:18:10 +0000 (13:18 +0100)
committerMarc Zyngier <maz@kernel.org>
Thu, 12 Oct 2023 15:55:21 +0000 (16:55 +0100)
Contrary to common belief, HCR_EL2.TGE has a direct and immediate
effect on the way the EL0 physical counter is offset. Flipping
TGE from 1 to 0 while at EL2 immediately changes the way the counter
compared to the CVAL limit.

This means that we cannot directly save/restore the guest's view of
CVAL, but that we instead must treat it as if CNTPOFF didn't exist.
Only in the world switch, once we figure out that we do have CNTPOFF,
can we must the offset back and forth depending on the polarity of
TGE.

Fixes: 2b4825a86940 ("KVM: arm64: timers: Use CNTPOFF_EL2 to offset the physical timer")
Reported-by: Ganapatrao Kulkarni <gankulkarni@os.amperecomputing.com>
Tested-by: Ganapatrao Kulkarni <gankulkarni@os.amperecomputing.com>
Signed-off-by: Marc Zyngier <maz@kernel.org>
arch/arm64/kvm/arch_timer.c
arch/arm64/kvm/hyp/vhe/switch.c
include/kvm/arm_arch_timer.h

index 6dcdae4d38cb5ab9a7aba4a2bcf83ec6b7262d48..a1e24228aaaa764f3f96a3780e60a3003694b22b 100644 (file)
@@ -55,11 +55,6 @@ static struct irq_ops arch_timer_irq_ops = {
        .get_input_level = kvm_arch_timer_get_input_level,
 };
 
-static bool has_cntpoff(void)
-{
-       return (has_vhe() && cpus_have_final_cap(ARM64_HAS_ECV_CNTPOFF));
-}
-
 static int nr_timers(struct kvm_vcpu *vcpu)
 {
        if (!vcpu_has_nv(vcpu))
@@ -180,7 +175,7 @@ u64 kvm_phys_timer_read(void)
        return timecounter->cc->read(timecounter->cc);
 }
 
-static void get_timer_map(struct kvm_vcpu *vcpu, struct timer_map *map)
+void get_timer_map(struct kvm_vcpu *vcpu, struct timer_map *map)
 {
        if (vcpu_has_nv(vcpu)) {
                if (is_hyp_ctxt(vcpu)) {
@@ -548,8 +543,7 @@ static void timer_save_state(struct arch_timer_context *ctx)
                timer_set_ctl(ctx, read_sysreg_el0(SYS_CNTP_CTL));
                cval = read_sysreg_el0(SYS_CNTP_CVAL);
 
-               if (!has_cntpoff())
-                       cval -= timer_get_offset(ctx);
+               cval -= timer_get_offset(ctx);
 
                timer_set_cval(ctx, cval);
 
@@ -636,8 +630,7 @@ static void timer_restore_state(struct arch_timer_context *ctx)
                cval = timer_get_cval(ctx);
                offset = timer_get_offset(ctx);
                set_cntpoff(offset);
-               if (!has_cntpoff())
-                       cval += offset;
+               cval += offset;
                write_sysreg_el0(cval, SYS_CNTP_CVAL);
                isb();
                write_sysreg_el0(timer_get_ctl(ctx), SYS_CNTP_CTL);
index 6537f58b1a8cc026f087f4f73affe42e8f38873b..448b17080d3617cbf5d2fceec7e7fa62866760d4 100644 (file)
@@ -39,6 +39,26 @@ static void __activate_traps(struct kvm_vcpu *vcpu)
 
        ___activate_traps(vcpu);
 
+       if (has_cntpoff()) {
+               struct timer_map map;
+
+               get_timer_map(vcpu, &map);
+
+               /*
+                * We're entrering the guest. Reload the correct
+                * values from memory now that TGE is clear.
+                */
+               if (map.direct_ptimer == vcpu_ptimer(vcpu))
+                       val = __vcpu_sys_reg(vcpu, CNTP_CVAL_EL0);
+               if (map.direct_ptimer == vcpu_hptimer(vcpu))
+                       val = __vcpu_sys_reg(vcpu, CNTHP_CVAL_EL2);
+
+               if (map.direct_ptimer) {
+                       write_sysreg_el0(val, SYS_CNTP_CVAL);
+                       isb();
+               }
+       }
+
        val = read_sysreg(cpacr_el1);
        val |= CPACR_ELx_TTA;
        val &= ~(CPACR_EL1_ZEN_EL0EN | CPACR_EL1_ZEN_EL1EN |
@@ -77,6 +97,30 @@ static void __deactivate_traps(struct kvm_vcpu *vcpu)
 
        write_sysreg(HCR_HOST_VHE_FLAGS, hcr_el2);
 
+       if (has_cntpoff()) {
+               struct timer_map map;
+               u64 val, offset;
+
+               get_timer_map(vcpu, &map);
+
+               /*
+                * We're exiting the guest. Save the latest CVAL value
+                * to memory and apply the offset now that TGE is set.
+                */
+               val = read_sysreg_el0(SYS_CNTP_CVAL);
+               if (map.direct_ptimer == vcpu_ptimer(vcpu))
+                       __vcpu_sys_reg(vcpu, CNTP_CVAL_EL0) = val;
+               if (map.direct_ptimer == vcpu_hptimer(vcpu))
+                       __vcpu_sys_reg(vcpu, CNTHP_CVAL_EL2) = val;
+
+               offset = read_sysreg_s(SYS_CNTPOFF_EL2);
+
+               if (map.direct_ptimer && offset) {
+                       write_sysreg_el0(val + offset, SYS_CNTP_CVAL);
+                       isb();
+               }
+       }
+
        /*
         * ARM errata 1165522 and 1530923 require the actual execution of the
         * above before we can switch to the EL2/EL0 translation regime used by
index bb3cb005873ec9828b1ece587755cb8a9fc9b5ed..e748bc957d83262233b3c8a655ed68b0ad8f34dd 100644 (file)
@@ -82,6 +82,8 @@ struct timer_map {
        struct arch_timer_context *emul_ptimer;
 };
 
+void get_timer_map(struct kvm_vcpu *vcpu, struct timer_map *map);
+
 struct arch_timer_cpu {
        struct arch_timer_context timers[NR_KVM_TIMERS];
 
@@ -145,4 +147,9 @@ u64 timer_get_cval(struct arch_timer_context *ctxt);
 void kvm_timer_cpu_up(void);
 void kvm_timer_cpu_down(void);
 
+static inline bool has_cntpoff(void)
+{
+       return (has_vhe() && cpus_have_final_cap(ARM64_HAS_ECV_CNTPOFF));
+}
+
 #endif