Save and restore newly untrapped registers that will be directly
accessed by the guest when the PMU is partitioned.

* PMEVCNTRn_EL0
* PMCCNTR_EL0
* PMICNTR_EL0
* PMUSERENR_EL0
* PMSELR_EL0
* PMCR_EL0
* PMCNTEN_EL0
* PMINTEN_EL1

If the PMU is not partitioned or MDCR_EL2.TPM is set, all PMU
registers are trapped, so return immediately.

Signed-off-by: Colton Lewis <coltonle...@google.com>
---
 arch/arm64/include/asm/kvm_host.h |   2 +
 arch/arm64/include/asm/kvm_pmu.h  |   2 +
 arch/arm64/kvm/arm.c              |   2 +
 arch/arm64/kvm/pmu-part.c         | 101 ++++++++++++++++++++++++++++++
 4 files changed, 107 insertions(+)

diff --git a/arch/arm64/include/asm/kvm_host.h b/arch/arm64/include/asm/kvm_host.h
index 2df76689381a..374771557d2c 100644
--- a/arch/arm64/include/asm/kvm_host.h
+++ b/arch/arm64/include/asm/kvm_host.h
@@ -453,9 +453,11 @@ enum vcpu_sysreg {
        PMEVCNTR0_EL0,  /* Event Counter Register (0-30) */
        PMEVCNTR30_EL0 = PMEVCNTR0_EL0 + 30,
        PMCCNTR_EL0,    /* Cycle Counter Register */
+       PMICNTR_EL0,    /* Instruction Counter Register */
        PMEVTYPER0_EL0, /* Event Type Register (0-30) */
        PMEVTYPER30_EL0 = PMEVTYPER0_EL0 + 30,
        PMCCFILTR_EL0,  /* Cycle Count Filter Register */
+       PMICFILTR_EL0,  /* Instruction Count Filter Register */
        PMCNTENSET_EL0, /* Count Enable Set Register */
        PMINTENSET_EL1, /* Interrupt Enable Set Register */
        PMOVSSET_EL0,   /* Overflow Flag Status Set Register */
diff --git a/arch/arm64/include/asm/kvm_pmu.h b/arch/arm64/include/asm/kvm_pmu.h
index 1b68f1a706d1..208893485027 100644
--- a/arch/arm64/include/asm/kvm_pmu.h
+++ b/arch/arm64/include/asm/kvm_pmu.h
@@ -96,6 +96,8 @@ void kvm_pmu_host_counters_disable(void);
 
 u8 kvm_pmu_guest_num_counters(struct kvm_vcpu *vcpu);
 u8 kvm_pmu_hpmn(struct kvm_vcpu *vcpu);
+void kvm_pmu_load(struct kvm_vcpu *vcpu);
+void kvm_pmu_put(struct kvm_vcpu *vcpu);
 
 #if !defined(__KVM_NVHE_HYPERVISOR__)
 bool kvm_vcpu_pmu_is_partitioned(struct kvm_vcpu *vcpu);
diff --git a/arch/arm64/kvm/arm.c b/arch/arm64/kvm/arm.c
index e452aba1a3b2..7c007ee44ecb 100644
--- a/arch/arm64/kvm/arm.c
+++ b/arch/arm64/kvm/arm.c
@@ -616,6 +616,7 @@ void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu)
                kvm_vcpu_load_vhe(vcpu);
        kvm_arch_vcpu_load_fp(vcpu);
        kvm_vcpu_pmu_restore_guest(vcpu);
+       kvm_pmu_load(vcpu);
        if (kvm_arm_is_pvtime_enabled(&vcpu->arch))
                kvm_make_request(KVM_REQ_RECORD_STEAL, vcpu);
 
@@ -658,6 +659,7 @@ void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu)
        kvm_timer_vcpu_put(vcpu);
        kvm_vgic_put(vcpu);
        kvm_vcpu_pmu_restore_host(vcpu);
+       kvm_pmu_put(vcpu);
        if (vcpu_has_nv(vcpu))
                kvm_vcpu_put_hw_mmu(vcpu);
        kvm_arm_vmid_clear_active();
diff --git a/arch/arm64/kvm/pmu-part.c b/arch/arm64/kvm/pmu-part.c
index 289f396bd887..19bd6e0da222 100644
--- a/arch/arm64/kvm/pmu-part.c
+++ b/arch/arm64/kvm/pmu-part.c
@@ -8,6 +8,7 @@
 #include <linux/perf/arm_pmu.h>
 #include <linux/perf/arm_pmuv3.h>
 
+#include <asm/kvm_emulate.h>
 #include <asm/kvm_pmu.h>
 #include <asm/arm_pmuv3.h>
 
@@ -175,3 +176,103 @@ u8 kvm_pmu_hpmn(struct kvm_vcpu *vcpu)
 
        return hpmn;
 }
+
+/**
+ * kvm_pmu_load() - Load untrapped PMU registers
+ * @vcpu: Pointer to struct kvm_vcpu
+ *
+ * Load all untrapped PMU registers from the VCPU into the PCPU. For
+ * bitmask registers, apply only the bits belonging to guest-reserved
+ * counters and leave host-reserved counters untouched.
+ */
+void kvm_pmu_load(struct kvm_vcpu *vcpu)
+{
+       struct arm_pmu *pmu = vcpu->kvm->arch.arm_pmu;
+       u64 mask = kvm_pmu_guest_counter_mask(pmu);
+       u8 i;
+       u64 val;
+
+       /*
+        * If the PMU is not partitioned or MDCR_EL2.TPM is set,
+        * every PMU access is trapped, so don't bother with the swap.
+        */
+       if (!kvm_pmu_is_partitioned(pmu) || (vcpu->arch.mdcr_el2 & MDCR_EL2_TPM))
+               return;
+
+       for (i = 0; i < pmu->hpmn_max; i++) {
+               val = __vcpu_sys_reg(vcpu, PMEVCNTR0_EL0 + i);
+               write_pmevcntrn(i, val);
+       }
+
+       val = __vcpu_sys_reg(vcpu, PMCCNTR_EL0);
+       write_pmccntr(val);
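+
+       /*
+        * The commit message also lists PMICNTR_EL0. A sketch of its
+        * restore, assuming the write_pmicntr() accessor from
+        * <asm/arm_pmuv3.h> and a kvm_has_feat() check on
+        * ID_AA64DFR1_EL1.PMICNTR for FEAT_PMUv3_ICNTR:
+        */
+       if (kvm_has_feat(vcpu->kvm, ID_AA64DFR1_EL1, PMICNTR, IMP)) {
+               val = __vcpu_sys_reg(vcpu, PMICNTR_EL0);
+               write_pmicntr(val);
+       }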
+
+       val = __vcpu_sys_reg(vcpu, PMUSERENR_EL0);
+       write_pmuserenr(val);
+
+       val = __vcpu_sys_reg(vcpu, PMSELR_EL0);
+       write_pmselr(val);
+
+       val = __vcpu_sys_reg(vcpu, PMCR_EL0);
+       write_pmcr(val);
+
+       /*
+        * Loading these registers is tricky because:
+        * 1. Only the bits for guest counters (indicated by mask) apply
+        * 2. Set and clear operations go through separate registers
+        */
+       val = __vcpu_sys_reg(vcpu, PMCNTENSET_EL0);
+       write_pmcntenset(val & mask);
+       write_pmcntenclr(~val & mask);
+
+       val = __vcpu_sys_reg(vcpu, PMINTENSET_EL1);
+       write_pmintenset(val & mask);
+       write_pmintenclr(~val & mask);
+}
+
+/**
+ * kvm_pmu_put() - Put untrapped PMU registers
+ * @vcpu: Pointer to struct kvm_vcpu
+ *
+ * Put all untrapped PMU registers from the PCPU into the VCPU. For
+ * bitmask registers, save only the bits belonging to guest-reserved
+ * counters and leave host-reserved counters untouched.
+ */
+void kvm_pmu_put(struct kvm_vcpu *vcpu)
+{
+       struct arm_pmu *pmu = vcpu->kvm->arch.arm_pmu;
+       u64 mask = kvm_pmu_guest_counter_mask(pmu);
+       u8 i;
+       u64 val;
+
+       /*
+        * If the PMU is not partitioned or MDCR_EL2.TPM is set,
+        * every PMU access is trapped, so don't bother with the swap.
+        */
+       if (!kvm_pmu_is_partitioned(pmu) || (vcpu->arch.mdcr_el2 & MDCR_EL2_TPM))
+               return;
+
+       for (i = 0; i < pmu->hpmn_max; i++) {
+               val = read_pmevcntrn(i);
+               __vcpu_assign_sys_reg(vcpu, PMEVCNTR0_EL0 + i, val);
+       }
+
+       val = read_pmccntr();
+       __vcpu_assign_sys_reg(vcpu, PMCCNTR_EL0, val);
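+
+       /*
+        * Likewise, a sketch for saving PMICNTR_EL0, under the same
+        * assumptions (read_pmicntr() accessor, ID_AA64DFR1_EL1.PMICNTR
+        * feature check):
+        */
+       if (kvm_has_feat(vcpu->kvm, ID_AA64DFR1_EL1, PMICNTR, IMP)) {
+               val = read_pmicntr();
+               __vcpu_assign_sys_reg(vcpu, PMICNTR_EL0, val);
+       }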
+
+       val = read_pmuserenr();
+       __vcpu_assign_sys_reg(vcpu, PMUSERENR_EL0, val);
+
+       val = read_pmselr();
+       __vcpu_assign_sys_reg(vcpu, PMSELR_EL0, val);
+
+       val = read_pmcr();
+       __vcpu_assign_sys_reg(vcpu, PMCR_EL0, val);
+
+       /* Mask these to save only the guest-relevant bits. */
+       val = read_pmcntenset();
+       __vcpu_assign_sys_reg(vcpu, PMCNTENSET_EL0, val & mask);
+
+       val = read_pmintenset();
+       __vcpu_assign_sys_reg(vcpu, PMINTENSET_EL1, val & mask);
+}
-- 
2.50.0.714.g196bf9f422-goog

