On 10/30/2011 06:53 PM, Gleb Natapov wrote:
> From: Avi Kivity <[email protected]>

This has changed significantly, so please update the authorship.  You
can say 'based on original patch by ...' to provide due credit.

> Use perf_events to emulate an architectural PMU, version 2.

> +
> +/* mapping between fixed pmc index and arch_events array */
> +int fixed_pmc_events[] = {1, 0, 2};
> +
> +static bool pmc_is_gp(struct kvm_pmc *pmc)
> +{
> +     return pmc->type == KVM_PMC_GP;
> +}
> +
> +static inline u64 pmc_bitmask(struct kvm_pmc *pmc)
> +{
> +     struct kvm_pmu *pmu = &pmc->vcpu->arch.pmu;
> +
> +     return pmc_is_gp(pmc) ? pmu->gp_counter_bitmask :
> +             pmu->fixed_counter_bitmask;
> +}

Nicer to just push the bitmask (or bitwidth) into the counter itself.

> +
> +static inline int pmc_to_global_idx(struct kvm_pmc *pmc)
> +{
> +     struct kvm_pmu *pmu = &pmc->vcpu->arch.pmu;
> +     struct kvm_pmc *counters;
> +     int shift;
> +
> +     if (pmc_is_gp(pmc)) {
> +             counters = pmu->gp_counters;
> +             shift = X86_PMC_IDX_GENERIC;
> +     } else {
> +             counters = pmu->fixed_counters;
> +             shift = X86_PMC_IDX_FIXED;
> +     }
> +
> +     return pmc - counters + shift;
> +}

Again, push the global index into struct kvm_pmc.

> +
> +static void kvm_perf_overflow(struct perf_event *perf_event,
> +                           struct perf_sample_data *data,
> +                           struct pt_regs *regs)
> +{
> +     struct kvm_pmc *pmc = perf_event->overflow_handler_context;
> +     struct kvm_pmu *pmu = &pmc->vcpu->arch.pmu;
> +     __set_bit(pmc_to_global_idx(pmc),
> +                     (unsigned long *)&pmu->global_status);
> +}
> +
> +static void kvm_perf_overflow_intr(struct perf_event *perf_event,
> +             struct perf_sample_data *data, struct pt_regs *regs)
> +{
> +     struct kvm_pmc *pmc = perf_event->overflow_handler_context;
> +     struct kvm_pmu *pmu = &pmc->vcpu->arch.pmu;
> +     if (!__test_and_set_bit(pmc_to_global_idx(pmc),
> +                             (unsigned long *)&pmu->reprogram_pmi)) {
> +             kvm_perf_overflow(perf_event, data, regs);
> +             kvm_make_request(KVM_REQ_PMU, pmc->vcpu);
> +     }
> +}

Is it safe to use the non-atomic __ versions (__set_bit(),
__test_and_set_bit()) here?

Do we need to follow kvm_make_request() with kvm_vcpu_kick()?  If there
is a skew between the overflow and the host PMI, the guest might have
executed a HLT.

> +
> +static void reprogram_fixed_counter(struct kvm_pmc *pmc, u8 en_pmi, int idx)
> +{
> +     unsigned en = en_pmi & 0x3;
> +     bool pmi = en_pmi & 0x8;
> +
> +     stop_counter(pmc);
> +
> +     if (!en || !pmc_enabled(pmc))
> +             return;
> +
> +     reprogram_counter(pmc, PERF_TYPE_HARDWARE,
> +                     arch_events[fixed_pmc_events[idx]].event_type,
> +                     !(en & 0x2), /* exclude user */
> +                     !(en & 0x1), /* exclude kernel */
> +                     pmi);

Are there no #defines for those constants?

> +}
> +
> +#define FIXED_EN_PMI(R, I) (((R) >> ((I) * 4)) & 0xf)

Make this a function rather than a macro.

> +     default:
> +             if ((pmc = get_gp_pmc(pmu, index, MSR_IA32_PERFCTR0)) ||
> +                             (pmc = get_fixed_pmc(pmu, index))) {
> +                     data = (s64)(s32)data;
> +                     pmc->counter += data - read_pmc(pmc);
> +                     return 0;
> +             } else if ((pmc = get_gp_pmc(pmu, index, MSR_P6_EVNTSEL0))) {
> +                     if (data == pmc->eventsel)
> +                             return 0;
> +                     if (!(data & 0xffffffff00200000ull)) {
> +                             reprogram_gp_counter(pmc, data);
> +                             return 0;
> +                     }
> +             }
> +     }
> +     return 1;
> +}
> +
> +
> +void kvm_pmu_cpuid_update(struct kvm_vcpu *vcpu)
> +{
> +     struct kvm_pmu *pmu = &vcpu->arch.pmu;
> +     struct kvm_cpuid_entry2 *entry;
> +     unsigned bitmap_len;
> +
> +     pmu->nr_arch_gp_counters = 0;
> +     pmu->nr_arch_fixed_counters = 0;
> +     pmu->fixed_counter_bitmask = 0;
> +     pmu->version = 0;
> +
> +     entry = kvm_find_cpuid_entry(vcpu, 0xa, 0);
> +     if (!entry)
> +             return;
> +
> +     pmu->version = entry->eax & 0xff;
> +     if (!pmu->version)
> +             return;
> +
> +     pmu->nr_arch_gp_counters = min((int)(entry->eax >> 8) & 0xff,
> +                     X86_PMC_MAX_GENERIC);
> +     pmu->gp_counter_bitmask = ((u64)1 << ((entry->eax >> 16) & 0xff)) - 1;
> +     bitmap_len = (entry->eax >> 24) & 0xff;
> +     pmu->available_event_types = ~entry->ebx & ((1ull << bitmap_len) - 1);
> +
> +     if (pmu->version > 1) {
> +             pmu->nr_arch_fixed_counters = min((int)(entry->edx) & 0x1f,
> +                             X86_PMC_MAX_FIXED);

Misplaced parentheses: the (int) cast applies to entry->edx before the
& 0x1f mask rather than to the masked value (though no effect on
generated code).

> +             pmu->fixed_counter_bitmask =
> +                     ((u64)1 << ((entry->edx >> 5) & 0xff)) - 1;

The user can cause this to be very small (even zero).  Can this cause an
NMI storm?

> +             pmu->global_ctrl_mask = ~(((1 << pmu->nr_arch_gp_counters) - 1)
> +                             | (((1ull << pmu->nr_arch_fixed_counters) - 1)
> +                                     << X86_PMC_IDX_FIXED));
> +     } else
> +             pmu->global_ctrl = (1 << pmu->nr_arch_gp_counters) - 1;
> +}

Nicer to just return early if version < 2; less indentation and easier
to prepare for version 3.

-- 
I have a truly marvellous patch that fixes the bug which this
signature is too narrow to contain.

--
To unsubscribe from this list: send the line "unsubscribe kvm" in
the body of a message to [email protected]
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Reply via email to