Add a common helper for *internal* PMC lookups, and delete the ops hook and Intel's implementation. Keep AMD's implementation, but rename it to amd_pmu_get_pmc() to make it somewhat more obvious that it's suited for both KVM-internal and guest-initiated lookups. Because KVM tracks all counters in a single bitmap, getting a counter when iterating over a bitmap, e.g. of all valid PMCs, requires a small amount of math, that while simple, isn't super obvious and doesn't use the same semantics as PMC lookups from RDPMC! Although AMD doesn't support fixed counters, the common PMU code still behaves as if there a split, the high half of which just happens to always be empty. Opportunstically add a comment to explain both what is going on, and why KVM uses a single bitmap, e.g. the boilerplate for iterating over separate bitmaps could be done via macros, so it's not (just) about deduplicating code. Link: https://lore.kernel.org/r/20231110022857.1273836-4-seanjc@google.com Signed-off-by: Sean Christopherson <seanjc@google.com>
244 lines
6.2 KiB
C
244 lines
6.2 KiB
C
// SPDX-License-Identifier: GPL-2.0-only
|
|
/*
|
|
* KVM PMU support for AMD
|
|
*
|
|
* Copyright 2015, Red Hat, Inc. and/or its affiliates.
|
|
*
|
|
* Author:
|
|
* Wei Huang <wei@redhat.com>
|
|
*
|
|
* Implementation is based on pmu_intel.c file
|
|
*/
|
|
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
|
|
|
|
#include <linux/types.h>
|
|
#include <linux/kvm_host.h>
|
|
#include <linux/perf_event.h>
|
|
#include "x86.h"
|
|
#include "cpuid.h"
|
|
#include "lapic.h"
|
|
#include "pmu.h"
|
|
#include "svm.h"
|
|
|
|
enum pmu_type {
|
|
PMU_TYPE_COUNTER = 0,
|
|
PMU_TYPE_EVNTSEL,
|
|
};
|
|
|
|
static struct kvm_pmc *amd_pmu_get_pmc(struct kvm_pmu *pmu, int pmc_idx)
|
|
{
|
|
unsigned int num_counters = pmu->nr_arch_gp_counters;
|
|
|
|
if (pmc_idx >= num_counters)
|
|
return NULL;
|
|
|
|
return &pmu->gp_counters[array_index_nospec(pmc_idx, num_counters)];
|
|
}
|
|
|
|
static inline struct kvm_pmc *get_gp_pmc_amd(struct kvm_pmu *pmu, u32 msr,
|
|
enum pmu_type type)
|
|
{
|
|
struct kvm_vcpu *vcpu = pmu_to_vcpu(pmu);
|
|
unsigned int idx;
|
|
|
|
if (!vcpu->kvm->arch.enable_pmu)
|
|
return NULL;
|
|
|
|
switch (msr) {
|
|
case MSR_F15H_PERF_CTL0 ... MSR_F15H_PERF_CTR5:
|
|
if (!guest_cpuid_has(vcpu, X86_FEATURE_PERFCTR_CORE))
|
|
return NULL;
|
|
/*
|
|
* Each PMU counter has a pair of CTL and CTR MSRs. CTLn
|
|
* MSRs (accessed via EVNTSEL) are even, CTRn MSRs are odd.
|
|
*/
|
|
idx = (unsigned int)((msr - MSR_F15H_PERF_CTL0) / 2);
|
|
if (!(msr & 0x1) != (type == PMU_TYPE_EVNTSEL))
|
|
return NULL;
|
|
break;
|
|
case MSR_K7_EVNTSEL0 ... MSR_K7_EVNTSEL3:
|
|
if (type != PMU_TYPE_EVNTSEL)
|
|
return NULL;
|
|
idx = msr - MSR_K7_EVNTSEL0;
|
|
break;
|
|
case MSR_K7_PERFCTR0 ... MSR_K7_PERFCTR3:
|
|
if (type != PMU_TYPE_COUNTER)
|
|
return NULL;
|
|
idx = msr - MSR_K7_PERFCTR0;
|
|
break;
|
|
default:
|
|
return NULL;
|
|
}
|
|
|
|
return amd_pmu_get_pmc(pmu, idx);
|
|
}
|
|
|
|
static int amd_check_rdpmc_early(struct kvm_vcpu *vcpu, unsigned int idx)
|
|
{
|
|
struct kvm_pmu *pmu = vcpu_to_pmu(vcpu);
|
|
|
|
if (idx >= pmu->nr_arch_gp_counters)
|
|
return -EINVAL;
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* idx is the ECX register of RDPMC instruction */
|
|
static struct kvm_pmc *amd_rdpmc_ecx_to_pmc(struct kvm_vcpu *vcpu,
|
|
unsigned int idx, u64 *mask)
|
|
{
|
|
return amd_pmu_get_pmc(vcpu_to_pmu(vcpu), idx);
|
|
}
|
|
|
|
static struct kvm_pmc *amd_msr_idx_to_pmc(struct kvm_vcpu *vcpu, u32 msr)
|
|
{
|
|
struct kvm_pmu *pmu = vcpu_to_pmu(vcpu);
|
|
struct kvm_pmc *pmc;
|
|
|
|
pmc = get_gp_pmc_amd(pmu, msr, PMU_TYPE_COUNTER);
|
|
pmc = pmc ? pmc : get_gp_pmc_amd(pmu, msr, PMU_TYPE_EVNTSEL);
|
|
|
|
return pmc;
|
|
}
|
|
|
|
static bool amd_is_valid_msr(struct kvm_vcpu *vcpu, u32 msr)
|
|
{
|
|
struct kvm_pmu *pmu = vcpu_to_pmu(vcpu);
|
|
|
|
switch (msr) {
|
|
case MSR_K7_EVNTSEL0 ... MSR_K7_PERFCTR3:
|
|
return pmu->version > 0;
|
|
case MSR_F15H_PERF_CTL0 ... MSR_F15H_PERF_CTR5:
|
|
return guest_cpuid_has(vcpu, X86_FEATURE_PERFCTR_CORE);
|
|
case MSR_AMD64_PERF_CNTR_GLOBAL_STATUS:
|
|
case MSR_AMD64_PERF_CNTR_GLOBAL_CTL:
|
|
case MSR_AMD64_PERF_CNTR_GLOBAL_STATUS_CLR:
|
|
return pmu->version > 1;
|
|
default:
|
|
if (msr > MSR_F15H_PERF_CTR5 &&
|
|
msr < MSR_F15H_PERF_CTL0 + 2 * pmu->nr_arch_gp_counters)
|
|
return pmu->version > 1;
|
|
break;
|
|
}
|
|
|
|
return amd_msr_idx_to_pmc(vcpu, msr);
|
|
}
|
|
|
|
static int amd_pmu_get_msr(struct kvm_vcpu *vcpu, struct msr_data *msr_info)
|
|
{
|
|
struct kvm_pmu *pmu = vcpu_to_pmu(vcpu);
|
|
struct kvm_pmc *pmc;
|
|
u32 msr = msr_info->index;
|
|
|
|
/* MSR_PERFCTRn */
|
|
pmc = get_gp_pmc_amd(pmu, msr, PMU_TYPE_COUNTER);
|
|
if (pmc) {
|
|
msr_info->data = pmc_read_counter(pmc);
|
|
return 0;
|
|
}
|
|
/* MSR_EVNTSELn */
|
|
pmc = get_gp_pmc_amd(pmu, msr, PMU_TYPE_EVNTSEL);
|
|
if (pmc) {
|
|
msr_info->data = pmc->eventsel;
|
|
return 0;
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
static int amd_pmu_set_msr(struct kvm_vcpu *vcpu, struct msr_data *msr_info)
|
|
{
|
|
struct kvm_pmu *pmu = vcpu_to_pmu(vcpu);
|
|
struct kvm_pmc *pmc;
|
|
u32 msr = msr_info->index;
|
|
u64 data = msr_info->data;
|
|
|
|
/* MSR_PERFCTRn */
|
|
pmc = get_gp_pmc_amd(pmu, msr, PMU_TYPE_COUNTER);
|
|
if (pmc) {
|
|
pmc_write_counter(pmc, data);
|
|
return 0;
|
|
}
|
|
/* MSR_EVNTSELn */
|
|
pmc = get_gp_pmc_amd(pmu, msr, PMU_TYPE_EVNTSEL);
|
|
if (pmc) {
|
|
data &= ~pmu->reserved_bits;
|
|
if (data != pmc->eventsel) {
|
|
pmc->eventsel = data;
|
|
kvm_pmu_request_counter_reprogram(pmc);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
static void amd_pmu_refresh(struct kvm_vcpu *vcpu)
|
|
{
|
|
struct kvm_pmu *pmu = vcpu_to_pmu(vcpu);
|
|
union cpuid_0x80000022_ebx ebx;
|
|
|
|
pmu->version = 1;
|
|
if (guest_cpuid_has(vcpu, X86_FEATURE_PERFMON_V2)) {
|
|
pmu->version = 2;
|
|
/*
|
|
* Note, PERFMON_V2 is also in 0x80000022.0x0, i.e. the guest
|
|
* CPUID entry is guaranteed to be non-NULL.
|
|
*/
|
|
BUILD_BUG_ON(x86_feature_cpuid(X86_FEATURE_PERFMON_V2).function != 0x80000022 ||
|
|
x86_feature_cpuid(X86_FEATURE_PERFMON_V2).index);
|
|
ebx.full = kvm_find_cpuid_entry_index(vcpu, 0x80000022, 0)->ebx;
|
|
pmu->nr_arch_gp_counters = ebx.split.num_core_pmc;
|
|
} else if (guest_cpuid_has(vcpu, X86_FEATURE_PERFCTR_CORE)) {
|
|
pmu->nr_arch_gp_counters = AMD64_NUM_COUNTERS_CORE;
|
|
} else {
|
|
pmu->nr_arch_gp_counters = AMD64_NUM_COUNTERS;
|
|
}
|
|
|
|
pmu->nr_arch_gp_counters = min_t(unsigned int, pmu->nr_arch_gp_counters,
|
|
kvm_pmu_cap.num_counters_gp);
|
|
|
|
if (pmu->version > 1) {
|
|
pmu->global_ctrl_mask = ~((1ull << pmu->nr_arch_gp_counters) - 1);
|
|
pmu->global_status_mask = pmu->global_ctrl_mask;
|
|
}
|
|
|
|
pmu->counter_bitmask[KVM_PMC_GP] = ((u64)1 << 48) - 1;
|
|
pmu->reserved_bits = 0xfffffff000280000ull;
|
|
pmu->raw_event_mask = AMD64_RAW_EVENT_MASK;
|
|
/* not applicable to AMD; but clean them to prevent any fall out */
|
|
pmu->counter_bitmask[KVM_PMC_FIXED] = 0;
|
|
pmu->nr_arch_fixed_counters = 0;
|
|
bitmap_set(pmu->all_valid_pmc_idx, 0, pmu->nr_arch_gp_counters);
|
|
}
|
|
|
|
static void amd_pmu_init(struct kvm_vcpu *vcpu)
|
|
{
|
|
struct kvm_pmu *pmu = vcpu_to_pmu(vcpu);
|
|
int i;
|
|
|
|
BUILD_BUG_ON(KVM_AMD_PMC_MAX_GENERIC > AMD64_NUM_COUNTERS_CORE);
|
|
BUILD_BUG_ON(KVM_AMD_PMC_MAX_GENERIC > INTEL_PMC_MAX_GENERIC);
|
|
|
|
for (i = 0; i < KVM_AMD_PMC_MAX_GENERIC ; i++) {
|
|
pmu->gp_counters[i].type = KVM_PMC_GP;
|
|
pmu->gp_counters[i].vcpu = vcpu;
|
|
pmu->gp_counters[i].idx = i;
|
|
pmu->gp_counters[i].current_config = 0;
|
|
}
|
|
}
|
|
|
|
struct kvm_pmu_ops amd_pmu_ops __initdata = {
|
|
.rdpmc_ecx_to_pmc = amd_rdpmc_ecx_to_pmc,
|
|
.msr_idx_to_pmc = amd_msr_idx_to_pmc,
|
|
.check_rdpmc_early = amd_check_rdpmc_early,
|
|
.is_valid_msr = amd_is_valid_msr,
|
|
.get_msr = amd_pmu_get_msr,
|
|
.set_msr = amd_pmu_set_msr,
|
|
.refresh = amd_pmu_refresh,
|
|
.init = amd_pmu_init,
|
|
.EVENTSEL_EVENT = AMD64_EVENTSEL_EVENT,
|
|
.MAX_NR_GP_COUNTERS = KVM_AMD_PMC_MAX_GENERIC,
|
|
.MIN_NR_GP_COUNTERS = AMD64_NUM_COUNTERS,
|
|
};
|