[<prev] [next>] [<thread-prev] [day] [month] [year] [list]
Message-ID: <223a817b-66dd-4182-838f-a186b059fe41@os.amperecomputing.com>
Date: Fri, 28 Feb 2025 18:45:38 -0800
From: Yang Shi <yang@...amperecomputing.com>
To: Mikołaj Lenczewski <miko.lenczewski@....com>,
ryan.roberts@....com, suzuki.poulose@....com, catalin.marinas@....com,
will@...nel.org, joro@...tes.org, jean-philippe@...aro.org,
mark.rutland@....com, joey.gouly@....com, oliver.upton@...ux.dev,
james.morse@....com, broonie@...nel.org, maz@...nel.org, david@...hat.com,
akpm@...ux-foundation.org, jgg@...pe.ca, nicolinc@...dia.com,
mshavit@...gle.com, jsnitsel@...hat.com, smostafa@...gle.com,
linux-arm-kernel@...ts.infradead.org, linux-kernel@...r.kernel.org,
iommu@...ts.linux.dev
Subject: Re: [PATCH v2 1/4] arm64: Add BBM Level 2 cpu feature
On 2/28/25 5:29 PM, Yang Shi wrote:
>
>
>
> On 2/28/25 10:24 AM, Mikołaj Lenczewski wrote:
>> The Break-Before-Make cpu feature supports multiple levels (levels 0-2),
>> and this commit adds a dedicated BBML2 cpufeature to test against
>> support for.
>>
>> This is a system feature as we might have a big.LITTLE architecture
>> where some cores support BBML2 and some don't, but we want all cores to
>> be available and BBM to default to level 0 (as opposed to having cores
>> without BBML2 not coming online).
>>
>> To support BBML2 in as wide a range of contexts as we can, we want not
>> only the architectural guarantees that BBML2 makes, but additionally
>> want BBML2 to not create TLB conflict aborts. Not causing aborts avoids
>> us having to prove that no recursive faults can be induced in any path
>> that uses BBML2, allowing its use for arbitrary kernel mappings.
>> Support detection of such CPUs.
>>
>> Signed-off-by: Mikołaj Lenczewski <miko.lenczewski@....com>
>> ---
>> arch/arm64/Kconfig | 11 +++++
>> arch/arm64/include/asm/cpucaps.h | 2 +
>> arch/arm64/include/asm/cpufeature.h | 5 +++
>> arch/arm64/kernel/cpufeature.c | 69 +++++++++++++++++++++++++++++
>> arch/arm64/tools/cpucaps | 1 +
>> 5 files changed, 88 insertions(+)
>>
>> diff --git a/arch/arm64/Kconfig b/arch/arm64/Kconfig
>> index 940343beb3d4..baae6d458996 100644
>> --- a/arch/arm64/Kconfig
>> +++ b/arch/arm64/Kconfig
>> @@ -2057,6 +2057,17 @@ config ARM64_TLB_RANGE
>> The feature introduces new assembly instructions, and they were
>> support when binutils >= 2.30.
>> +config ARM64_ENABLE_BBML2_NOABORT
>> + bool "Enable support for Break-Before-Make Level 2 detection and
>> usage"
>> + default y
>> + help
>> + FEAT_BBM provides detection of support levels for
>> break-before-make
>> + sequences. If BBM level 2 is supported, some TLB maintenance
>> requirements
>> + can be relaxed to improve performance. We additonally require the
>> + property that the implementation cannot ever raise TLB
>> Conflict Aborts.
>> + Selecting N causes the kernel to fallback to BBM level 0
>> behaviour
>> + even if the system supports BBM level 2.
>> +
>> endmenu # "ARMv8.4 architectural features"
>> menu "ARMv8.5 architectural features"
>> diff --git a/arch/arm64/include/asm/cpucaps.h
>> b/arch/arm64/include/asm/cpucaps.h
>> index 0b5ca6e0eb09..2d6db33d4e45 100644
>> --- a/arch/arm64/include/asm/cpucaps.h
>> +++ b/arch/arm64/include/asm/cpucaps.h
>> @@ -23,6 +23,8 @@ cpucap_is_possible(const unsigned int cap)
>> return IS_ENABLED(CONFIG_ARM64_PAN);
>> case ARM64_HAS_EPAN:
>> return IS_ENABLED(CONFIG_ARM64_EPAN);
>> + case ARM64_HAS_BBML2_NOABORT:
>> + return IS_ENABLED(CONFIG_ARM64_BBML2_NOABORT);
>> case ARM64_SVE:
>> return IS_ENABLED(CONFIG_ARM64_SVE);
>> case ARM64_SME:
>> diff --git a/arch/arm64/include/asm/cpufeature.h
>> b/arch/arm64/include/asm/cpufeature.h
>> index e0e4478f5fb5..108ef3fbbc00 100644
>> --- a/arch/arm64/include/asm/cpufeature.h
>> +++ b/arch/arm64/include/asm/cpufeature.h
>> @@ -866,6 +866,11 @@ static __always_inline bool
>> system_supports_mpam_hcr(void)
>> return alternative_has_cap_unlikely(ARM64_MPAM_HCR);
>> }
>> +static inline bool system_supports_bbml2_noabort(void)
>> +{
>> + return alternative_has_cap_unlikely(ARM64_HAS_BBML2_NOABORT);
>> +}
>
> Hi Miko,
>
> I added AmpereOne mdir on top of this patch. I can see BBML2 feature
> is detected via dmesg. But system_supports_bbml2_noabort() returns
> false. The warning in the below debug patch is triggered:
>
> diff --git a/arch/arm64/kernel/cpufeature.c
> b/arch/arm64/kernel/cpufeature.c
> index faa9094d97dd..a70829ae2bd0 100644
> --- a/arch/arm64/kernel/cpufeature.c
> +++ b/arch/arm64/kernel/cpufeature.c
> @@ -3814,6 +3814,9 @@ void __init setup_system_features(void)
> {
> setup_system_capabilities();
>
> + if (!system_supports_bbml2_noabort())
> + WARN_ON_ONCE(1);
> +
> kpti_install_ng_mappings();
>
> sve_setup();
>
> I thought it may be too early. But it seems other system features work
> well, for example, MPAM. I didn't figure out why. It is weird.
I just figured out the problem It is because the wrong kconfig name is
used in cpucaps.h. The code is:
+ case ARM64_HAS_BBML2_NOABORT:
+ return IS_ENABLED(CONFIG_ARM64_BBML2_NOABORT);
But the kconfig name actually is:
+config ARM64_ENABLE_BBML2_NOABORT
IMHO, the "ENABLE" in kconfig name sounds unnecessary.
Thanks,
Yang
>
> Thanks,
> Yang
>
>
>> +
>> int do_emulate_mrs(struct pt_regs *regs, u32 sys_reg, u32 rt);
>> bool try_emulate_mrs(struct pt_regs *regs, u32 isn);
>> diff --git a/arch/arm64/kernel/cpufeature.c
>> b/arch/arm64/kernel/cpufeature.c
>> index d561cf3b8ac7..63f6d356dc77 100644
>> --- a/arch/arm64/kernel/cpufeature.c
>> +++ b/arch/arm64/kernel/cpufeature.c
>> @@ -2176,6 +2176,68 @@ static bool hvhe_possible(const struct
>> arm64_cpu_capabilities *entry,
>> return
>> arm64_test_sw_feature_override(ARM64_SW_FEATURE_OVERRIDE_HVHE);
>> }
>> +static bool cpu_has_bbml2_noabort(unsigned int cpu_midr)
>> +{
>> + /* We want to allow usage of bbml2 in as wide a range of kernel
>> contexts
>> + * as possible. This list is therefore an allow-list of known-good
>> + * implementations that both support bbml2 and additionally,
>> fulfill the
>> + * extra constraint of never generating TLB conflict aborts when
>> using
>> + * the relaxed bbml2 semantics (such aborts make use of bbml2 in
>> certain
>> + * kernel contexts difficult to prove safe against recursive
>> aborts).
>> + *
>> + * Note that implementations can only be considered "known-good"
>> if their
>> + * implementors attest to the fact that the implementation never
>> raises
>> + * TLBI conflict aborts for bbml2 mapping granularity changes.
>> + */
>> + static const struct midr_range supports_bbml2_noabort_list[] = {
>> + MIDR_REV_RANGE(MIDR_CORTEX_X4, 0, 3, 0xf),
>> + MIDR_REV_RANGE(MIDR_NEOVERSE_V3, 0, 2, 0xf),
>> + {}
>> + };
>> +
>> + return is_midr_in_range_list(cpu_midr,
>> supports_bbml2_noabort_list);
>> +}
>> +
>> +static inline unsigned int __cpu_read_midr(int cpu)
>> +{
>> + WARN_ON_ONCE(!cpu_online(cpu));
>> +
>> + return per_cpu(cpu_data, cpu).reg_midr;
>> +}
>> +
>> +static bool has_bbml2_noabort(const struct arm64_cpu_capabilities
>> *caps, int scope)
>> +{
>> + if (!IS_ENABLED(CONFIG_ARM64_ENABLE_BBML2_NOABORT))
>> + return false;
>> +
>> + if (scope & SCOPE_SYSTEM) {
>> + int cpu;
>> +
>> + /* We are a boot CPU, and must verify that all enumerated boot
>> + * CPUs have MIDR values within our allowlist. Otherwise, we do
>> + * not allow the BBML2 feature to avoid potential faults when
>> + * the insufficient CPUs access memory regions using BBML2
>> + * semantics.
>> + */
>> + for_each_online_cpu(cpu) {
>> + if (!cpu_has_bbml2_noabort(__cpu_read_midr(cpu)))
>> + return false;
>> + }
>> +
>> + return true;
>> + } else if (scope & SCOPE_LOCAL_CPU) {
>> + /* We are a hot-plugged CPU, so only need to check our MIDR.
>> + * If we have the correct MIDR, but the kernel booted on an
>> + * insufficient CPU, we will not use BBML2 (this is safe). If
>> + * we have an incorrect MIDR, but the kernel booted on a
>> + * sufficient CPU, we will not bring up this CPU.
>> + */
>> + return cpu_has_bbml2_noabort(read_cpuid_id());
>> + }
>> +
>> + return false;
>> +}
>> +
>> #ifdef CONFIG_ARM64_PAN
>> static void cpu_enable_pan(const struct arm64_cpu_capabilities
>> *__unused)
>> {
>> @@ -2926,6 +2988,13 @@ static const struct arm64_cpu_capabilities
>> arm64_features[] = {
>> .matches = has_cpuid_feature,
>> ARM64_CPUID_FIELDS(ID_AA64MMFR2_EL1, EVT, IMP)
>> },
>> + {
>> + .desc = "BBM Level 2 without conflict abort",
>> + .capability = ARM64_HAS_BBML2_NOABORT,
>> + .type = ARM64_CPUCAP_SYSTEM_FEATURE,
>> + .matches = has_bbml2_noabort,
>> + ARM64_CPUID_FIELDS(ID_AA64MMFR2_EL1, BBM, 2)
>> + },
>> {
>> .desc = "52-bit Virtual Addressing for KVM (LPA2)",
>> .capability = ARM64_HAS_LPA2,
>> diff --git a/arch/arm64/tools/cpucaps b/arch/arm64/tools/cpucaps
>> index 1e65f2fb45bd..b03a375e5507 100644
>> --- a/arch/arm64/tools/cpucaps
>> +++ b/arch/arm64/tools/cpucaps
>> @@ -14,6 +14,7 @@ HAS_ADDRESS_AUTH_ARCH_QARMA5
>> HAS_ADDRESS_AUTH_IMP_DEF
>> HAS_AMU_EXTN
>> HAS_ARMv8_4_TTL
>> +HAS_BBML2_NOABORT
>> HAS_CACHE_DIC
>> HAS_CACHE_IDC
>> HAS_CNP
>
Powered by blists - more mailing lists