Re: [PATCH v4 4/6] kvm powerpc/book3s-apiv2: Introduce kvm-hv specific PMU

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



Athira Rajeev <atrajeev@xxxxxxxxxxxxx> writes:

>> On 24 Feb 2025, at 6:45 PM, Vaibhav Jain <vaibhav@xxxxxxxxxxxxx> wrote:
>> 
>> Introduce a new PMU named 'kvm-hv' inside a new module named 'kvm-hv-pmu'
>> to report Book3s kvm-hv specific performance counters. This will expose
>> KVM-HV specific performance attributes to user-space via kernel's PMU
>> infrastructure and would enableusers to monitor active kvm-hv based guests.
>> 
>> The patch creates necessary scaffolding to for the new PMU callbacks and
>> introduces the new kernel module name 'kvm-hv-pmu' which is built with
>> CONFIG_KVM_BOOK3S_HV_PMU. The patch doesn't introduce any perf-events yet,
>> which will be introduced in later patches
>> 
>> Signed-off-by: Vaibhav Jain <vaibhav@xxxxxxxxxxxxx>
>> 
>> ---
>> Changelog
>> 
>> v3->v4:
>> * Introduced a new kernel module named 'kmv-hv-pmu' to host the new PMU
>> instead of building the as part of KVM-HV module. [ Maddy ]
>> * Moved the code from arch/powerpc/kvm to arch/powerpc/perf [ Atheera ]
>> * Added a new config named KVM_BOOK3S_HV_PMU to arch/powerpc/kvm/Kconfig
>> 
>> v2->v3:
>> * Fixed a build warning reported by kernel build robot.
>> Link:
>> https://lore.kernel.org/oe-kbuild-all/202501171030.3x0gqW8G-lkp@xxxxxxxxx
>> 
>> v1->v2:
>> * Fixed an issue of kvm-hv not loading on baremetal kvm [Gautam]
>> ---
>> arch/powerpc/kvm/Kconfig       |  13 ++++
>> arch/powerpc/perf/Makefile     |   2 +
>> arch/powerpc/perf/kvm-hv-pmu.c | 138 +++++++++++++++++++++++++++++++++
>> 3 files changed, 153 insertions(+)
>> create mode 100644 arch/powerpc/perf/kvm-hv-pmu.c
>> 
>> diff --git a/arch/powerpc/kvm/Kconfig b/arch/powerpc/kvm/Kconfig
>> index dbfdc126bf14..5f0ce19e7e27 100644
>> --- a/arch/powerpc/kvm/Kconfig
>> +++ b/arch/powerpc/kvm/Kconfig
>> @@ -83,6 +83,7 @@ config KVM_BOOK3S_64_HV
>> depends on KVM_BOOK3S_64 && PPC_POWERNV
>> select KVM_BOOK3S_HV_POSSIBLE
>> select KVM_GENERIC_MMU_NOTIFIER
>> + select KVM_BOOK3S_HV_PMU
>> select CMA
>> help
>>  Support running unmodified book3s_64 guest kernels in
>> @@ -171,6 +172,18 @@ config KVM_BOOK3S_HV_NESTED_PMU_WORKAROUND
>>  those buggy L1s which saves the L2 state, at the cost of performance
>>  in all nested-capable guest entry/exit.
>> 
>> +config KVM_BOOK3S_HV_PMU
>> + tristate "Hypervisor Perf events for KVM Book3s-HV"
>> + depends on KVM_BOOK3S_64_HV && HV_PERF_CTRS
>> + help
>> +  Enable Book3s-HV Hypervisor Perf events PMU named 'kvm-hv'. These
>> +  Perf events give an overview of hypervisor performance overall
>> +  instead of a specific guests. Currently the PMU reports
>> +  L0-Hypervisor stats on a kvm-hv enabled PSeries LPAR like:
>> +  * Total/Used Guest-Heap
>> +  * Total/Used Guest Page-table Memory
>> +  * Total amount of Guest Page-table Memory reclaimed
>> +
>> config KVM_BOOKE_HV
>> bool
>> 
>> diff --git a/arch/powerpc/perf/Makefile b/arch/powerpc/perf/Makefile
>> index ac2cf58d62db..7f53fcb7495a 100644
>> --- a/arch/powerpc/perf/Makefile
>> +++ b/arch/powerpc/perf/Makefile
>> @@ -18,6 +18,8 @@ obj-$(CONFIG_HV_PERF_CTRS) += hv-24x7.o hv-gpci.o hv-common.o
>> 
>> obj-$(CONFIG_VPA_PMU) += vpa-pmu.o
>> 
>> +obj-$(CONFIG_KVM_BOOK3S_HV_PMU) += kvm-hv-pmu.o
>> +
>> obj-$(CONFIG_PPC_8xx) += 8xx-pmu.o
>> 
>> obj-$(CONFIG_PPC64) += $(obj64-y)
>> diff --git a/arch/powerpc/perf/kvm-hv-pmu.c b/arch/powerpc/perf/kvm-hv-pmu.c
>> new file mode 100644
>> index 000000000000..c154f54e09e2
>> --- /dev/null
>> +++ b/arch/powerpc/perf/kvm-hv-pmu.c
>> @@ -0,0 +1,138 @@
>> +// SPDX-License-Identifier: GPL-2.0
>> +/*
>> + * Description: PMUs specific to running nested KVM-HV guests
>> + * on Book3S processors (specifically POWER9 and later).
>> + */
>> +
>> +#define pr_fmt(fmt)  "kvmppc-pmu: " fmt
>> +
>> +#include "asm-generic/local64.h"
>> +#include <linux/kernel.h>
>> +#include <linux/errno.h>
>> +#include <linux/ratelimit.h>
>> +#include <linux/kvm_host.h>
>> +#include <linux/gfp_types.h>
>> +#include <linux/pgtable.h>
>> +#include <linux/perf_event.h>
>> +#include <linux/spinlock_types.h>
>> +#include <linux/spinlock.h>
>> +
>> +#include <asm/types.h>
>> +#include <asm/kvm_ppc.h>
>> +#include <asm/kvm_book3s.h>
>> +#include <asm/mmu.h>
>> +#include <asm/pgalloc.h>
>> +#include <asm/pte-walk.h>
>> +#include <asm/reg.h>
>> +#include <asm/plpar_wrappers.h>
>> +#include <asm/firmware.h>
>> +
>> +enum kvmppc_pmu_eventid {
>> + KVMPPC_EVENT_MAX,
>> +};
>> +
>> +static struct attribute *kvmppc_pmu_events_attr[] = {
>> + NULL,
>> +};
>> +
>> +static const struct attribute_group kvmppc_pmu_events_group = {
>> + .name = "events",
>> + .attrs = kvmppc_pmu_events_attr,
>> +};
>> +
>> +PMU_FORMAT_ATTR(event, "config:0");
>> +static struct attribute *kvmppc_pmu_format_attr[] = {
>> + &format_attr_event.attr,
>> + NULL,
>> +};
>> +
>> +static struct attribute_group kvmppc_pmu_format_group = {
>> + .name = "format",
>> + .attrs = kvmppc_pmu_format_attr,
>> +};
>> +
>> +static const struct attribute_group *kvmppc_pmu_attr_groups[] = {
>> + &kvmppc_pmu_events_group,
>> + &kvmppc_pmu_format_group,
>> + NULL,
>> +};
>> +
>> +static int kvmppc_pmu_event_init(struct perf_event *event)
>> +{
>> + unsigned int config = event->attr.config;
>> +
>> + pr_debug("%s: Event(%p) id=%llu cpu=%x on_cpu=%x config=%u",
>> + __func__, event, event->id, event->cpu,
>> + event->oncpu, config);
>> +
>> + if (event->attr.type != event->pmu->type)
>> + return -ENOENT;
>> +
>> + if (config >= KVMPPC_EVENT_MAX)
>> + return -EINVAL;
>> +
>> + local64_set(&event->hw.prev_count, 0);
>> + local64_set(&event->count, 0);
>> +
>> + return 0;
>> +}
>> +
>> +static void kvmppc_pmu_del(struct perf_event *event, int flags)
>> +{
>> +}
>> +
>> +static int kvmppc_pmu_add(struct perf_event *event, int flags)
>> +{
>> + return 0;
>> +}
>> +
>> +static void kvmppc_pmu_read(struct perf_event *event)
>> +{
>> +}
>> +
>> +/* L1 wide counters PMU */
>> +static struct pmu kvmppc_pmu = {
>> + .module = THIS_MODULE,
>> + .task_ctx_nr = perf_sw_context,
>> + .name = "kvm-hv",
>> + .event_init = kvmppc_pmu_event_init,
>> + .add = kvmppc_pmu_add,
>> + .del = kvmppc_pmu_del,
>> + .read = kvmppc_pmu_read,
>> + .attr_groups = kvmppc_pmu_attr_groups,
>> + .type = -1,
>> +};
>> +
>> +static int __init kvmppc_register_pmu(void)
>> +{
>> + int rc = -EOPNOTSUPP;
>> +
>> + /* only support events for nestedv2 right now */
>> + if (kvmhv_is_nestedv2()) {
>
> We don’t need PVR check here ? Description of module says this is
> supported for power9 and later.
The hcalls this module depends on, are only available to LPAR/KVM-Guest running with api-v2 support hence this is needed.

>> + /* Setup done now register the PMU */
>> + pr_info("Registering kvm-hv pmu");
>> +
>> + /* Register only if we arent already registered */
> Not sure why we need this… Have you seen any issue without this ? I don’t see any similar check in arch/powerpc/perf/vpa-pmu.c ,
>
This check is taken from the previous version of this patch which
prevented struct pmu initialization multiple times. However with
now a seperate module this check is probably not needed.

>> + rc = (kvmppc_pmu.type == -1) ?
>> +     perf_pmu_register(&kvmppc_pmu, kvmppc_pmu.name,
>> +       -1) : 0;
>> + }
>> +
>> + return rc;
>> +}
>> +
>> +static void __exit kvmppc_unregister_pmu(void)
>> +{
>> + if (kvmhv_is_nestedv2()) {
>> + if (kvmppc_pmu.type != -1)
>> + perf_pmu_unregister(&kvmppc_pmu);
>> +
>> + pr_info("kvmhv_pmu unregistered.\n");
>> + }
>> +}
>> +
>> +module_init(kvmppc_register_pmu);
>> +module_exit(kvmppc_unregister_pmu);
>> +MODULE_DESCRIPTION("KVM PPC Book3s-hv PMU");
>> +MODULE_AUTHOR("Vaibhav Jain <vaibhav@xxxxxxxxxxxxx>");
>> +MODULE_LICENSE("GPL");
>> -- 
>> 2.48.1
>> 
>> 
>> 
>

-- 
Cheers
~ Vaibhav





[Index of Archives]     [KVM ARM]     [KVM ia64]     [KVM ppc]     [Virtualization Tools]     [Spice Development]     [Libvirt]     [Libvirt Users]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite Questions]     [Linux Kernel]     [Linux SCSI]     [XFree86]

  Powered by Linux