2023-08-30 17:31:07 +02:00
|
|
|
/* SPDX-License-Identifier: GPL-2.0 */
|
|
|
|
#ifndef __KVM_X86_PMU_H
|
|
|
|
#define __KVM_X86_PMU_H
|
|
|
|
|
|
|
|
#include <linux/nospec.h>
|
|
|
|
|
|
|
|
#define vcpu_to_pmu(vcpu) (&(vcpu)->arch.pmu)
|
|
|
|
#define pmu_to_vcpu(pmu) (container_of((pmu), struct kvm_vcpu, arch.pmu))
|
|
|
|
#define pmc_to_pmu(pmc) (&(pmc)->vcpu->arch.pmu)
|
|
|
|
|
|
|
|
#define MSR_IA32_MISC_ENABLE_PMU_RO_MASK (MSR_IA32_MISC_ENABLE_PEBS_UNAVAIL | \
|
|
|
|
MSR_IA32_MISC_ENABLE_BTS_UNAVAIL)
|
|
|
|
|
|
|
|
/* retrieve the 4 bits for EN and PMI out of IA32_FIXED_CTR_CTRL */
|
|
|
|
#define fixed_ctrl_field(ctrl_reg, idx) (((ctrl_reg) >> ((idx)*4)) & 0xf)
|
|
|
|
|
|
|
|
#define VMWARE_BACKDOOR_PMC_HOST_TSC 0x10000
|
|
|
|
#define VMWARE_BACKDOOR_PMC_REAL_TIME 0x10001
|
|
|
|
#define VMWARE_BACKDOOR_PMC_APPARENT_TIME 0x10002
|
|
|
|
|
|
|
|
struct kvm_pmu_ops {
|
|
|
|
bool (*hw_event_available)(struct kvm_pmc *pmc);
|
|
|
|
struct kvm_pmc *(*pmc_idx_to_pmc)(struct kvm_pmu *pmu, int pmc_idx);
|
|
|
|
struct kvm_pmc *(*rdpmc_ecx_to_pmc)(struct kvm_vcpu *vcpu,
|
|
|
|
unsigned int idx, u64 *mask);
|
|
|
|
struct kvm_pmc *(*msr_idx_to_pmc)(struct kvm_vcpu *vcpu, u32 msr);
|
|
|
|
bool (*is_valid_rdpmc_ecx)(struct kvm_vcpu *vcpu, unsigned int idx);
|
|
|
|
bool (*is_valid_msr)(struct kvm_vcpu *vcpu, u32 msr);
|
|
|
|
int (*get_msr)(struct kvm_vcpu *vcpu, struct msr_data *msr_info);
|
|
|
|
int (*set_msr)(struct kvm_vcpu *vcpu, struct msr_data *msr_info);
|
|
|
|
void (*refresh)(struct kvm_vcpu *vcpu);
|
|
|
|
void (*init)(struct kvm_vcpu *vcpu);
|
|
|
|
void (*reset)(struct kvm_vcpu *vcpu);
|
|
|
|
void (*deliver_pmi)(struct kvm_vcpu *vcpu);
|
|
|
|
void (*cleanup)(struct kvm_vcpu *vcpu);
|
|
|
|
|
|
|
|
const u64 EVENTSEL_EVENT;
|
|
|
|
const int MAX_NR_GP_COUNTERS;
|
2023-10-24 12:59:35 +02:00
|
|
|
const int MIN_NR_GP_COUNTERS;
|
2023-08-30 17:31:07 +02:00
|
|
|
};
|
|
|
|
|
|
|
|
void kvm_pmu_ops_update(const struct kvm_pmu_ops *pmu_ops);
|
|
|
|
|
2023-10-24 12:59:35 +02:00
|
|
|
static inline bool kvm_pmu_has_perf_global_ctrl(struct kvm_pmu *pmu)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* Architecturally, Intel's SDM states that IA32_PERF_GLOBAL_CTRL is
|
|
|
|
* supported if "CPUID.0AH: EAX[7:0] > 0", i.e. if the PMU version is
|
|
|
|
* greater than zero. However, KVM only exposes and emulates the MSR
|
|
|
|
* to/for the guest if the guest PMU supports at least "Architectural
|
|
|
|
* Performance Monitoring Version 2".
|
|
|
|
*
|
|
|
|
* AMD's version of PERF_GLOBAL_CTRL conveniently shows up with v2.
|
|
|
|
*/
|
|
|
|
return pmu->version > 1;
|
|
|
|
}
|
|
|
|
|
2023-08-30 17:31:07 +02:00
|
|
|
static inline u64 pmc_bitmask(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
struct kvm_pmu *pmu = pmc_to_pmu(pmc);
|
|
|
|
|
|
|
|
return pmu->counter_bitmask[pmc->type];
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u64 pmc_read_counter(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
u64 counter, enabled, running;
|
|
|
|
|
|
|
|
counter = pmc->counter;
|
|
|
|
if (pmc->perf_event && !pmc->is_paused)
|
|
|
|
counter += perf_event_read_value(pmc->perf_event,
|
|
|
|
&enabled, &running);
|
|
|
|
/* FIXME: Scaling needed? */
|
|
|
|
return counter & pmc_bitmask(pmc);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void pmc_release_perf_event(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
if (pmc->perf_event) {
|
|
|
|
perf_event_release_kernel(pmc->perf_event);
|
|
|
|
pmc->perf_event = NULL;
|
|
|
|
pmc->current_config = 0;
|
|
|
|
pmc_to_pmu(pmc)->event_count--;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void pmc_stop_counter(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
if (pmc->perf_event) {
|
|
|
|
pmc->counter = pmc_read_counter(pmc);
|
|
|
|
pmc_release_perf_event(pmc);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline bool pmc_is_gp(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
return pmc->type == KVM_PMC_GP;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline bool pmc_is_fixed(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
return pmc->type == KVM_PMC_FIXED;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline bool kvm_valid_perf_global_ctrl(struct kvm_pmu *pmu,
|
|
|
|
u64 data)
|
|
|
|
{
|
|
|
|
return !(pmu->global_ctrl_mask & data);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* returns general purpose PMC with the specified MSR. Note that it can be
|
|
|
|
* used for both PERFCTRn and EVNTSELn; that is why it accepts base as a
|
|
|
|
* parameter to tell them apart.
|
|
|
|
*/
|
|
|
|
static inline struct kvm_pmc *get_gp_pmc(struct kvm_pmu *pmu, u32 msr,
|
|
|
|
u32 base)
|
|
|
|
{
|
|
|
|
if (msr >= base && msr < base + pmu->nr_arch_gp_counters) {
|
|
|
|
u32 index = array_index_nospec(msr - base,
|
|
|
|
pmu->nr_arch_gp_counters);
|
|
|
|
|
|
|
|
return &pmu->gp_counters[index];
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* returns fixed PMC with the specified MSR */
|
|
|
|
static inline struct kvm_pmc *get_fixed_pmc(struct kvm_pmu *pmu, u32 msr)
|
|
|
|
{
|
|
|
|
int base = MSR_CORE_PERF_FIXED_CTR0;
|
|
|
|
|
|
|
|
if (msr >= base && msr < base + pmu->nr_arch_fixed_counters) {
|
|
|
|
u32 index = array_index_nospec(msr - base,
|
|
|
|
pmu->nr_arch_fixed_counters);
|
|
|
|
|
|
|
|
return &pmu->fixed_counters[index];
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline u64 get_sample_period(struct kvm_pmc *pmc, u64 counter_value)
|
|
|
|
{
|
|
|
|
u64 sample_period = (-counter_value) & pmc_bitmask(pmc);
|
|
|
|
|
|
|
|
if (!sample_period)
|
|
|
|
sample_period = pmc_bitmask(pmc) + 1;
|
|
|
|
return sample_period;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void pmc_update_sample_period(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
if (!pmc->perf_event || pmc->is_paused ||
|
|
|
|
!is_sampling_event(pmc->perf_event))
|
|
|
|
return;
|
|
|
|
|
|
|
|
perf_event_period(pmc->perf_event,
|
|
|
|
get_sample_period(pmc, pmc->counter));
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline bool pmc_speculative_in_use(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
struct kvm_pmu *pmu = pmc_to_pmu(pmc);
|
|
|
|
|
|
|
|
if (pmc_is_fixed(pmc))
|
|
|
|
return fixed_ctrl_field(pmu->fixed_ctr_ctrl,
|
|
|
|
pmc->idx - INTEL_PMC_IDX_FIXED) & 0x3;
|
|
|
|
|
|
|
|
return pmc->eventsel & ARCH_PERFMON_EVENTSEL_ENABLE;
|
|
|
|
}
|
|
|
|
|
|
|
|
extern struct x86_pmu_capability kvm_pmu_cap;
|
|
|
|
|
|
|
|
static inline void kvm_init_pmu_capability(const struct kvm_pmu_ops *pmu_ops)
|
|
|
|
{
|
|
|
|
bool is_intel = boot_cpu_data.x86_vendor == X86_VENDOR_INTEL;
|
2023-10-24 12:59:35 +02:00
|
|
|
int min_nr_gp_ctrs = pmu_ops->MIN_NR_GP_COUNTERS;
|
2023-08-30 17:31:07 +02:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Hybrid PMUs don't play nice with virtualization without careful
|
|
|
|
* configuration by userspace, and KVM's APIs for reporting supported
|
|
|
|
* vPMU features do not account for hybrid PMUs. Disable vPMU support
|
|
|
|
* for hybrid PMUs until KVM gains a way to let userspace opt-in.
|
|
|
|
*/
|
|
|
|
if (cpu_feature_enabled(X86_FEATURE_HYBRID_CPU))
|
|
|
|
enable_pmu = false;
|
|
|
|
|
|
|
|
if (enable_pmu) {
|
|
|
|
perf_get_x86_pmu_capability(&kvm_pmu_cap);
|
|
|
|
|
|
|
|
/*
|
2023-10-24 12:59:35 +02:00
|
|
|
* WARN if perf did NOT disable hardware PMU if the number of
|
|
|
|
* architecturally required GP counters aren't present, i.e. if
|
|
|
|
* there are a non-zero number of counters, but fewer than what
|
|
|
|
* is architecturally required.
|
2023-08-30 17:31:07 +02:00
|
|
|
*/
|
2023-10-24 12:59:35 +02:00
|
|
|
if (!kvm_pmu_cap.num_counters_gp ||
|
|
|
|
WARN_ON_ONCE(kvm_pmu_cap.num_counters_gp < min_nr_gp_ctrs))
|
|
|
|
enable_pmu = false;
|
|
|
|
else if (is_intel && !kvm_pmu_cap.version)
|
2023-08-30 17:31:07 +02:00
|
|
|
enable_pmu = false;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!enable_pmu) {
|
|
|
|
memset(&kvm_pmu_cap, 0, sizeof(kvm_pmu_cap));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
kvm_pmu_cap.version = min(kvm_pmu_cap.version, 2);
|
|
|
|
kvm_pmu_cap.num_counters_gp = min(kvm_pmu_cap.num_counters_gp,
|
|
|
|
pmu_ops->MAX_NR_GP_COUNTERS);
|
|
|
|
kvm_pmu_cap.num_counters_fixed = min(kvm_pmu_cap.num_counters_fixed,
|
|
|
|
KVM_PMC_MAX_FIXED);
|
|
|
|
}
|
|
|
|
|
2023-10-24 12:59:35 +02:00
|
|
|
static inline void kvm_pmu_request_counter_reprogram(struct kvm_pmc *pmc)
|
2023-08-30 17:31:07 +02:00
|
|
|
{
|
|
|
|
set_bit(pmc->idx, pmc_to_pmu(pmc)->reprogram_pmi);
|
|
|
|
kvm_make_request(KVM_REQ_PMU, pmc->vcpu);
|
|
|
|
}
|
|
|
|
|
2023-10-24 12:59:35 +02:00
|
|
|
static inline void reprogram_counters(struct kvm_pmu *pmu, u64 diff)
|
|
|
|
{
|
|
|
|
int bit;
|
|
|
|
|
|
|
|
if (!diff)
|
|
|
|
return;
|
|
|
|
|
|
|
|
for_each_set_bit(bit, (unsigned long *)&diff, X86_PMC_IDX_MAX)
|
|
|
|
set_bit(bit, pmu->reprogram_pmi);
|
|
|
|
kvm_make_request(KVM_REQ_PMU, pmu_to_vcpu(pmu));
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check if a PMC is enabled by comparing it against global_ctrl bits.
|
|
|
|
*
|
|
|
|
* If the vPMU doesn't have global_ctrl MSR, all vPMCs are enabled.
|
|
|
|
*/
|
|
|
|
static inline bool pmc_is_globally_enabled(struct kvm_pmc *pmc)
|
|
|
|
{
|
|
|
|
struct kvm_pmu *pmu = pmc_to_pmu(pmc);
|
|
|
|
|
|
|
|
if (!kvm_pmu_has_perf_global_ctrl(pmu))
|
|
|
|
return true;
|
|
|
|
|
|
|
|
return test_bit(pmc->idx, (unsigned long *)&pmu->global_ctrl);
|
|
|
|
}
|
|
|
|
|
2023-08-30 17:31:07 +02:00
|
|
|
void kvm_pmu_deliver_pmi(struct kvm_vcpu *vcpu);
|
|
|
|
void kvm_pmu_handle_event(struct kvm_vcpu *vcpu);
|
|
|
|
int kvm_pmu_rdpmc(struct kvm_vcpu *vcpu, unsigned pmc, u64 *data);
|
|
|
|
bool kvm_pmu_is_valid_rdpmc_ecx(struct kvm_vcpu *vcpu, unsigned int idx);
|
|
|
|
bool kvm_pmu_is_valid_msr(struct kvm_vcpu *vcpu, u32 msr);
|
|
|
|
int kvm_pmu_get_msr(struct kvm_vcpu *vcpu, struct msr_data *msr_info);
|
|
|
|
int kvm_pmu_set_msr(struct kvm_vcpu *vcpu, struct msr_data *msr_info);
|
|
|
|
void kvm_pmu_refresh(struct kvm_vcpu *vcpu);
|
|
|
|
void kvm_pmu_reset(struct kvm_vcpu *vcpu);
|
|
|
|
void kvm_pmu_init(struct kvm_vcpu *vcpu);
|
|
|
|
void kvm_pmu_cleanup(struct kvm_vcpu *vcpu);
|
|
|
|
void kvm_pmu_destroy(struct kvm_vcpu *vcpu);
|
|
|
|
int kvm_vm_ioctl_set_pmu_event_filter(struct kvm *kvm, void __user *argp);
|
|
|
|
void kvm_pmu_trigger_event(struct kvm_vcpu *vcpu, u64 perf_hw_id);
|
|
|
|
|
|
|
|
bool is_vmware_backdoor_pmc(u32 pmc_idx);
|
|
|
|
|
|
|
|
extern struct kvm_pmu_ops intel_pmu_ops;
|
|
|
|
extern struct kvm_pmu_ops amd_pmu_ops;
|
|
|
|
#endif /* __KVM_X86_PMU_H */
|