lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <e704b8ef-7488-96f4-27a8-35af722d4a3f@gmail.com>
Date:   Mon, 6 Nov 2023 15:19:43 +0800
From:   JinrongLiang <ljr.kernel@...il.com>
To:     Jim Mattson <jmattson@...gle.com>,
        Sean Christopherson <seanjc@...gle.com>
Cc:     Paolo Bonzini <pbonzini@...hat.com>, kvm@...r.kernel.org,
        linux-kernel@...r.kernel.org,
        Kan Liang <kan.liang@...ux.intel.com>,
        Dapeng Mi <dapeng1.mi@...ux.intel.com>,
        Like Xu <likexu@...cent.com>,
        Aaron Lewis <aaronlewis@...gle.com>,
        Jinrong Liang <cloudliang@...cent.com>
Subject: Re: [PATCH v6 09/20] KVM: selftests: Add pmu.h and lib/pmu.c for
 common PMU assets

在 2023/11/4 21:20, Jim Mattson 写道:
> On Fri, Nov 3, 2023 at 5:02 PM Sean Christopherson <seanjc@...gle.com> wrote:
>>
>> From: Jinrong Liang <cloudliang@...cent.com>
>>
>> By defining the PMU performance events and masks relevant for x86 in
>> the new pmu.h and pmu.c, it becomes easier to reference them, minimizing
>> potential errors in code that handles these values.
>>
>> Clean up pmu_event_filter_test.c by including pmu.h and removing
>> unnecessary macros.
>>
>> Suggested-by: Sean Christopherson <seanjc@...gle.com>
>> Signed-off-by: Jinrong Liang <cloudliang@...cent.com>
>> [sean: drop PSEUDO_ARCH_REFERENCE_CYCLES]
>> Signed-off-by: Sean Christopherson <seanjc@...gle.com>
>> ---
>>   tools/testing/selftests/kvm/Makefile          |  1 +
>>   tools/testing/selftests/kvm/include/pmu.h     | 84 +++++++++++++++++++
>>   tools/testing/selftests/kvm/lib/pmu.c         | 28 +++++++
>>   .../kvm/x86_64/pmu_event_filter_test.c        | 32 ++-----
>>   4 files changed, 122 insertions(+), 23 deletions(-)
>>   create mode 100644 tools/testing/selftests/kvm/include/pmu.h
>>   create mode 100644 tools/testing/selftests/kvm/lib/pmu.c
>>
>> diff --git a/tools/testing/selftests/kvm/Makefile b/tools/testing/selftests/kvm/Makefile
>> index a5963ab9215b..44d8d022b023 100644
>> --- a/tools/testing/selftests/kvm/Makefile
>> +++ b/tools/testing/selftests/kvm/Makefile
>> @@ -32,6 +32,7 @@ LIBKVM += lib/guest_modes.c
>>   LIBKVM += lib/io.c
>>   LIBKVM += lib/kvm_util.c
>>   LIBKVM += lib/memstress.c
>> +LIBKVM += lib/pmu.c
>>   LIBKVM += lib/guest_sprintf.c
>>   LIBKVM += lib/rbtree.c
>>   LIBKVM += lib/sparsebit.c
>> diff --git a/tools/testing/selftests/kvm/include/pmu.h b/tools/testing/selftests/kvm/include/pmu.h
>> new file mode 100644
>> index 000000000000..987602c62b51
>> --- /dev/null
>> +++ b/tools/testing/selftests/kvm/include/pmu.h
>> @@ -0,0 +1,84 @@
>> +/* SPDX-License-Identifier: GPL-2.0-only */
>> +/*
>> + * Copyright (C) 2023, Tencent, Inc.
>> + */
>> +#ifndef SELFTEST_KVM_PMU_H
>> +#define SELFTEST_KVM_PMU_H
>> +
>> +#include <stdint.h>
>> +
>> +#define X86_PMC_IDX_MAX                                64
>> +#define INTEL_PMC_MAX_GENERIC                          32
> 
> I think this is actually 15. Note that IA32_PMC0 through IA32_PMC7
> have MSR indices from 0xc1 through 0xc8, and MSR 0xcf is
> IA32_CORE_CAPABILITIES. At the very least, we have to handle
> non-contiguous MSR indices if we ever go beyond IA32_PMC14.
> 
>> +#define KVM_PMU_EVENT_FILTER_MAX_EVENTS                300
>> +
>> +#define GP_COUNTER_NR_OFS_BIT                          8
>> +#define EVENT_LENGTH_OFS_BIT                           24
>> +
>> +#define PMU_VERSION_MASK                               GENMASK_ULL(7, 0)
>> +#define EVENT_LENGTH_MASK                              GENMASK_ULL(31, EVENT_LENGTH_OFS_BIT)
>> +#define GP_COUNTER_NR_MASK                             GENMASK_ULL(15, GP_COUNTER_NR_OFS_BIT)
>> +#define FIXED_COUNTER_NR_MASK                          GENMASK_ULL(4, 0)
>> +
>> +#define ARCH_PERFMON_EVENTSEL_EVENT                    GENMASK_ULL(7, 0)
>> +#define ARCH_PERFMON_EVENTSEL_UMASK                    GENMASK_ULL(15, 8)
>> +#define ARCH_PERFMON_EVENTSEL_USR                      BIT_ULL(16)
>> +#define ARCH_PERFMON_EVENTSEL_OS                       BIT_ULL(17)
>> +#define ARCH_PERFMON_EVENTSEL_EDGE                     BIT_ULL(18)
>> +#define ARCH_PERFMON_EVENTSEL_PIN_CONTROL              BIT_ULL(19)
>> +#define ARCH_PERFMON_EVENTSEL_INT                      BIT_ULL(20)
>> +#define ARCH_PERFMON_EVENTSEL_ANY                      BIT_ULL(21)
>> +#define ARCH_PERFMON_EVENTSEL_ENABLE                   BIT_ULL(22)
>> +#define ARCH_PERFMON_EVENTSEL_INV                      BIT_ULL(23)
>> +#define ARCH_PERFMON_EVENTSEL_CMASK                    GENMASK_ULL(31, 24)
>> +
>> +#define PMC_MAX_FIXED                                  16
>> +#define PMC_IDX_FIXED                                  32
>> +
>> +/* RDPMC offset for Fixed PMCs */
>> +#define PMC_FIXED_RDPMC_BASE                           BIT_ULL(30)
>> +#define PMC_FIXED_RDPMC_METRICS                        BIT_ULL(29)
>> +
>> +#define FIXED_BITS_MASK                                0xFULL
>> +#define FIXED_BITS_STRIDE                              4
>> +#define FIXED_0_KERNEL                                 BIT_ULL(0)
>> +#define FIXED_0_USER                                   BIT_ULL(1)
>> +#define FIXED_0_ANYTHREAD                              BIT_ULL(2)
>> +#define FIXED_0_ENABLE_PMI                             BIT_ULL(3)
>> +
>> +#define fixed_bits_by_idx(_idx, _bits)                 \
>> +       ((_bits) << ((_idx) * FIXED_BITS_STRIDE))
>> +
>> +#define AMD64_NR_COUNTERS                              4
>> +#define AMD64_NR_COUNTERS_CORE                         6
>> +
>> +#define PMU_CAP_FW_WRITES                              BIT_ULL(13)
>> +#define PMU_CAP_LBR_FMT                                0x3f
>> +
>> +enum intel_pmu_architectural_events {
>> +       /*
>> +        * The order of the architectural events matters as support for each
>> +        * event is enumerated via CPUID using the index of the event.
>> +        */
>> +       INTEL_ARCH_CPU_CYCLES,
>> +       INTEL_ARCH_INSTRUCTIONS_RETIRED,
>> +       INTEL_ARCH_REFERENCE_CYCLES,
>> +       INTEL_ARCH_LLC_REFERENCES,
>> +       INTEL_ARCH_LLC_MISSES,
>> +       INTEL_ARCH_BRANCHES_RETIRED,
>> +       INTEL_ARCH_BRANCHES_MISPREDICTED,
>> +       NR_INTEL_ARCH_EVENTS,
>> +};
>> +
>> +enum amd_pmu_k7_events {
>> +       AMD_ZEN_CORE_CYCLES,
>> +       AMD_ZEN_INSTRUCTIONS,
>> +       AMD_ZEN_BRANCHES,
>> +       AMD_ZEN_BRANCH_MISSES,
>> +       NR_AMD_ARCH_EVENTS,
>> +};
>> +
>> +extern const uint64_t intel_pmu_arch_events[];
>> +extern const uint64_t amd_pmu_arch_events[];
> 
> AMD doesn't define *any* architectural events. Perhaps
> amd_pmu_zen_events[], though who knows what Zen5 and  beyond will
> bring?
> 
>> +extern const int intel_pmu_fixed_pmc_events[];
>> +
>> +#endif /* SELFTEST_KVM_PMU_H */
>> diff --git a/tools/testing/selftests/kvm/lib/pmu.c b/tools/testing/selftests/kvm/lib/pmu.c
>> new file mode 100644
>> index 000000000000..27a6c35f98a1
>> --- /dev/null
>> +++ b/tools/testing/selftests/kvm/lib/pmu.c
>> @@ -0,0 +1,28 @@
>> +// SPDX-License-Identifier: GPL-2.0-only
>> +/*
>> + * Copyright (C) 2023, Tencent, Inc.
>> + */
>> +
>> +#include <stdint.h>
>> +
>> +#include "pmu.h"
>> +
>> +/* Definitions for Architectural Performance Events */
>> +#define ARCH_EVENT(select, umask) (((select) & 0xff) | ((umask) & 0xff) << 8)
> 
> There's nothing architectural about this. Perhaps RAW_EVENT() for
> consistency with perf?
> 
>> +
>> +const uint64_t intel_pmu_arch_events[] = {
>> +       [INTEL_ARCH_CPU_CYCLES]                 = ARCH_EVENT(0x3c, 0x0),
>> +       [INTEL_ARCH_INSTRUCTIONS_RETIRED]       = ARCH_EVENT(0xc0, 0x0),
>> +       [INTEL_ARCH_REFERENCE_CYCLES]           = ARCH_EVENT(0x3c, 0x1),
>> +       [INTEL_ARCH_LLC_REFERENCES]             = ARCH_EVENT(0x2e, 0x4f),
>> +       [INTEL_ARCH_LLC_MISSES]                 = ARCH_EVENT(0x2e, 0x41),
>> +       [INTEL_ARCH_BRANCHES_RETIRED]           = ARCH_EVENT(0xc4, 0x0),
>> +       [INTEL_ARCH_BRANCHES_MISPREDICTED]      = ARCH_EVENT(0xc5, 0x0),
> 
> [INTEL_ARCH_TOPDOWN_SLOTS] = ARCH_EVENT(0xa4, 1),
> 
>> +};
>> +
>> +const uint64_t amd_pmu_arch_events[] = {
>> +       [AMD_ZEN_CORE_CYCLES]                   = ARCH_EVENT(0x76, 0x00),
>> +       [AMD_ZEN_INSTRUCTIONS]                  = ARCH_EVENT(0xc0, 0x00),
>> +       [AMD_ZEN_BRANCHES]                      = ARCH_EVENT(0xc2, 0x00),
>> +       [AMD_ZEN_BRANCH_MISSES]                 = ARCH_EVENT(0xc3, 0x00),
>> +};
>> diff --git a/tools/testing/selftests/kvm/x86_64/pmu_event_filter_test.c b/tools/testing/selftests/kvm/x86_64/pmu_event_filter_test.c
>> index 283cc55597a4..b6e4f57a8651 100644
>> --- a/tools/testing/selftests/kvm/x86_64/pmu_event_filter_test.c
>> +++ b/tools/testing/selftests/kvm/x86_64/pmu_event_filter_test.c
>> @@ -11,31 +11,18 @@
>>    */
>>
>>   #define _GNU_SOURCE /* for program_invocation_short_name */
>> -#include "test_util.h"
>> +
>>   #include "kvm_util.h"
>> +#include "pmu.h"
>>   #include "processor.h"
>> -
>> -/*
>> - * In lieu of copying perf_event.h into tools...
>> - */
>> -#define ARCH_PERFMON_EVENTSEL_OS                       (1ULL << 17)
>> -#define ARCH_PERFMON_EVENTSEL_ENABLE                   (1ULL << 22)
>> -
>> -/* End of stuff taken from perf_event.h. */
>> -
>> -/* Oddly, this isn't in perf_event.h. */
>> -#define ARCH_PERFMON_BRANCHES_RETIRED          5
>> +#include "test_util.h"
>>
>>   #define NUM_BRANCHES 42
>> -#define INTEL_PMC_IDX_FIXED            32
>> -
>> -/* Matches KVM_PMU_EVENT_FILTER_MAX_EVENTS in pmu.c */
>> -#define MAX_FILTER_EVENTS              300
>>   #define MAX_TEST_EVENTS                10
>>
>>   #define PMU_EVENT_FILTER_INVALID_ACTION                (KVM_PMU_EVENT_DENY + 1)
>>   #define PMU_EVENT_FILTER_INVALID_FLAGS                 (KVM_PMU_EVENT_FLAGS_VALID_MASK << 1)
>> -#define PMU_EVENT_FILTER_INVALID_NEVENTS               (MAX_FILTER_EVENTS + 1)
>> +#define PMU_EVENT_FILTER_INVALID_NEVENTS               (KVM_PMU_EVENT_FILTER_MAX_EVENTS + 1)
>>
>>   /*
>>    * This is how the event selector and unit mask are stored in an AMD
>> @@ -63,7 +50,6 @@
>>
>>   #define AMD_ZEN_BR_RETIRED EVENT(0xc2, 0)
> 
> Now AMD_ZEN_BRANCHES, above?

Yes, I forgot to replace INTEL_BR_RETIRED, AMD_ZEN_BR_RETIRED and 
INST_RETIRED in pmu_event_filter_test.c and remove their macro definitions.

Thanks,

Jinrong

> 
>>
>> -
>>   /*
>>    * "Retired instructions", from Processor Programming Reference
>>    * (PPR) for AMD Family 17h Model 01h, Revision B1 Processors,
>> @@ -84,7 +70,7 @@ struct __kvm_pmu_event_filter {
>>          __u32 fixed_counter_bitmap;
>>          __u32 flags;
>>          __u32 pad[4];
>> -       __u64 events[MAX_FILTER_EVENTS];
>> +       __u64 events[KVM_PMU_EVENT_FILTER_MAX_EVENTS];
>>   };
>>
>>   /*
>> @@ -729,14 +715,14 @@ static void add_dummy_events(uint64_t *events, int nevents)
>>
>>   static void test_masked_events(struct kvm_vcpu *vcpu)
>>   {
>> -       int nevents = MAX_FILTER_EVENTS - MAX_TEST_EVENTS;
>> -       uint64_t events[MAX_FILTER_EVENTS];
>> +       int nevents = KVM_PMU_EVENT_FILTER_MAX_EVENTS - MAX_TEST_EVENTS;
>> +       uint64_t events[KVM_PMU_EVENT_FILTER_MAX_EVENTS];
>>
>>          /* Run the test cases against a sparse PMU event filter. */
>>          run_masked_events_tests(vcpu, events, 0);
>>
>>          /* Run the test cases against a dense PMU event filter. */
>> -       add_dummy_events(events, MAX_FILTER_EVENTS);
>> +       add_dummy_events(events, KVM_PMU_EVENT_FILTER_MAX_EVENTS);
>>          run_masked_events_tests(vcpu, events, nevents);
>>   }
>>
>> @@ -818,7 +804,7 @@ static void intel_run_fixed_counter_guest_code(uint8_t fixed_ctr_idx)
>>                  /* Only OS_EN bit is enabled for fixed counter[idx]. */
>>                  wrmsr(MSR_CORE_PERF_FIXED_CTR_CTRL, BIT_ULL(4 * fixed_ctr_idx));
>>                  wrmsr(MSR_CORE_PERF_GLOBAL_CTRL,
>> -                     BIT_ULL(INTEL_PMC_IDX_FIXED + fixed_ctr_idx));
>> +                     BIT_ULL(PMC_IDX_FIXED + fixed_ctr_idx));
>>                  __asm__ __volatile__("loop ." : "+c"((int){NUM_BRANCHES}));
>>                  wrmsr(MSR_CORE_PERF_GLOBAL_CTRL, 0);
>>
>> --
>> 2.42.0.869.gea05f2083d-goog
>>

Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ