[<prev] [next>] [<thread-prev] [day] [month] [year] [list]
Message-ID: <5a62c225-243e-49c6-b1ea-c30fef2313b9@gmail.com>
Date: Sat, 29 Mar 2025 01:10:15 +0530
From: Sahil Siddiq <icegambit91@...il.com>
To: Stafford Horne <shorne@...il.com>
Cc: jonas@...thpole.se, stefan.kristiansson@...nalahti.fi,
sahilcdq@...ton.me, linux-openrisc@...r.kernel.org,
linux-kernel@...r.kernel.org
Subject: Re: [PATCH v3 2/3] openrisc: Introduce new utility functions to flush
and invalidate caches
Hi,
Thank you for the review.
On 3/26/25 10:41 PM, Stafford Horne wrote:
> On Mon, Mar 24, 2025 at 01:25:43AM +0530, Sahil Siddiq wrote:
>> According to the OpenRISC architecture manual, the dcache and icache may
>> not be present. When these caches are present, the invalidate and flush
>> registers may be absent. The current implementation does not perform
>> checks to verify their presence before utilizing cache registers, or
>> invalidating and flushing cache blocks.
>>
>> Introduce new functions to detect the presence of cache components and
>> related special-purpose registers.
>>
>> There are a few places where a range of addresses have to be flushed or
>> invalidated and the implementation is duplicated. Introduce new utility
>> functions and macros that generalize this implementation and reduce
>> duplication.
>>
>> Signed-off-by: Sahil Siddiq <sahilcdq@...ton.me>
>> ---
>> Changes from v2 -> v3:
>> - arch/openrisc/include/asm/cacheflush.h: Declare new functions and macros.
>> - arch/openrisc/include/asm/cpuinfo.h: Implement new functions.
>> (cpu_cache_is_present):
>> 1. The implementation of this function was strewn all over the place in
>> the previous versions.
>> 2. Fix condition. The condition in the previous version was incorrect.
>> (cb_inv_flush_is_implemented): New function.
>> - arch/openrisc/kernel/dma.c: Use new functions.
>> - arch/openrisc/mm/cache.c:
>> (cache_loop): Extend function.
>> (local_*_page_*): Use new cache_loop interface.
>> (local_*_range_*): Implement new functions.
>> - arch/openrisc/mm/init.c: Use new functions.
>>
>> arch/openrisc/include/asm/cacheflush.h | 17 +++++++++
>> arch/openrisc/include/asm/cpuinfo.h | 42 +++++++++++++++++++++
>> arch/openrisc/kernel/dma.c | 18 ++-------
>> arch/openrisc/mm/cache.c | 52 ++++++++++++++++++++++----
>> arch/openrisc/mm/init.c | 5 ++-
>> 5 files changed, 110 insertions(+), 24 deletions(-)
>>
>> diff --git a/arch/openrisc/include/asm/cacheflush.h b/arch/openrisc/include/asm/cacheflush.h
>> index 984c331ff5f4..0e60af486ec1 100644
>> --- a/arch/openrisc/include/asm/cacheflush.h
>> +++ b/arch/openrisc/include/asm/cacheflush.h
>> @@ -23,6 +23,9 @@
>> */
>> extern void local_dcache_page_flush(struct page *page);
>> extern void local_icache_page_inv(struct page *page);
>> +extern void local_dcache_range_flush(unsigned long start, unsigned long end);
>> +extern void local_dcache_range_inv(unsigned long start, unsigned long end);
>> +extern void local_icache_range_inv(unsigned long start, unsigned long end);
>>
>> /*
>> * Data cache flushing always happen on the local cpu. Instruction cache
>> @@ -38,6 +41,20 @@ extern void local_icache_page_inv(struct page *page);
>> extern void smp_icache_page_inv(struct page *page);
>> #endif /* CONFIG_SMP */
>>
>> +/*
>> + * Even if the actual block size is larger than L1_CACHE_BYTES, paddr
>> + * can be incremented by L1_CACHE_BYTES. When paddr is written to the
>> + * invalidate register, the entire cache line encompassing this address
>> + * is invalidated. Each subsequent reference to the same cache line will
>> + * not affect the invalidation process.
>> + */
>> +#define local_dcache_block_flush(addr) \
>> + local_dcache_range_flush(addr, addr + L1_CACHE_BYTES)
>> +#define local_dcache_block_inv(addr) \
>> + local_dcache_range_inv(addr, addr + L1_CACHE_BYTES)
>> +#define local_icache_block_inv(addr) \
>> + local_icache_range_inv(addr, addr + L1_CACHE_BYTES)
>> +
>> /*
>> * Synchronizes caches. Whenever a cpu writes executable code to memory, this
>> * should be called to make sure the processor sees the newly written code.
>> diff --git a/arch/openrisc/include/asm/cpuinfo.h b/arch/openrisc/include/asm/cpuinfo.h
>> index 82f5d4c06314..7839c41152af 100644
>> --- a/arch/openrisc/include/asm/cpuinfo.h
>> +++ b/arch/openrisc/include/asm/cpuinfo.h
>> @@ -15,6 +15,9 @@
>> #ifndef __ASM_OPENRISC_CPUINFO_H
>> #define __ASM_OPENRISC_CPUINFO_H
>>
>> +#include <asm/spr.h>
>> +#include <asm/spr_defs.h>
>> +
>> struct cache_desc {
>> u32 size;
>> u32 sets;
>> @@ -34,4 +37,43 @@ struct cpuinfo_or1k {
>> extern struct cpuinfo_or1k cpuinfo_or1k[NR_CPUS];
>> extern void setup_cpuinfo(void);
>>
>> +/*
>> + * Check if the cache component exists.
>> + */
>> +static inline bool cpu_cache_is_present(const unsigned int cache_type)
>> +{
>> + unsigned long upr = mfspr(SPR_UPR);
>> +
>> + return !!(upr & (SPR_UPR_UP | cache_type));
>> +}
>> +
>> +/*
>> + * Check if the cache block flush/invalidate register is implemented for the
>> + * cache component.
>> + */
>> +static inline bool cb_inv_flush_is_implemented(const unsigned int reg,
>> + const unsigned int cache_type)
>> +{
>> + unsigned long cfgr;
>> +
>> + if (cache_type == SPR_UPR_DCP) {
>> + cfgr = mfspr(SPR_DCCFGR);
>> + if (reg == SPR_DCBFR)
>> + return !!(cfgr & SPR_DCCFGR_CBFRI);
>> +
>> + if (reg == SPR_DCBIR)
>> + return !!(cfgr & SPR_DCCFGR_CBIRI);
>> + }
>> +
>> + /*
>> + * The cache block flush register is not implemented for the instruction cache.
>> + */
>> + if (cache_type == SPR_UPR_ICP) {
>> + cfgr = mfspr(SPR_ICCFGR);
>> + return !!(cfgr & SPR_ICCFGR_CBIRI);
>> + }
>> +
>> + return false;
>> +}
>
> Could these 2 functions move to cache.c?
Sure, I'll do that.
>> #endif /* __ASM_OPENRISC_CPUINFO_H */
>> diff --git a/arch/openrisc/kernel/dma.c b/arch/openrisc/kernel/dma.c
>> index b3edbb33b621..3a7b5baaa450 100644
>> --- a/arch/openrisc/kernel/dma.c
>> +++ b/arch/openrisc/kernel/dma.c
>> @@ -17,6 +17,7 @@
>> #include <linux/pagewalk.h>
>>
>> #include <asm/cpuinfo.h>
>> +#include <asm/cacheflush.h>
>> #include <asm/spr_defs.h>
>> #include <asm/tlbflush.h>
>>
>> @@ -24,9 +25,6 @@ static int
>> page_set_nocache(pte_t *pte, unsigned long addr,
>> unsigned long next, struct mm_walk *walk)
>> {
>> - unsigned long cl;
>> - struct cpuinfo_or1k *cpuinfo = &cpuinfo_or1k[smp_processor_id()];
>> -
>> pte_val(*pte) |= _PAGE_CI;
>>
>> /*
>> @@ -36,8 +34,7 @@ page_set_nocache(pte_t *pte, unsigned long addr,
>> flush_tlb_kernel_range(addr, addr + PAGE_SIZE);
>>
>> /* Flush page out of dcache */
>> - for (cl = __pa(addr); cl < __pa(next); cl += cpuinfo->dcache_block_size)
>> - mtspr(SPR_DCBFR, cl);
>> + local_dcache_range_flush(__pa(addr), __pa(next));
>>
>> return 0;
>> }
>> @@ -98,21 +95,14 @@ void arch_dma_clear_uncached(void *cpu_addr, size_t size)
>> void arch_sync_dma_for_device(phys_addr_t addr, size_t size,
>> enum dma_data_direction dir)
>> {
>> - unsigned long cl;
>> - struct cpuinfo_or1k *cpuinfo = &cpuinfo_or1k[smp_processor_id()];
>> -
>> switch (dir) {
>> case DMA_TO_DEVICE:
>> /* Flush the dcache for the requested range */
>> - for (cl = addr; cl < addr + size;
>> - cl += cpuinfo->dcache_block_size)
>> - mtspr(SPR_DCBFR, cl);
>> + local_dcache_range_flush(addr, addr + size);
>> break;
>> case DMA_FROM_DEVICE:
>> /* Invalidate the dcache for the requested range */
>> - for (cl = addr; cl < addr + size;
>> - cl += cpuinfo->dcache_block_size)
>> - mtspr(SPR_DCBIR, cl);
>> + local_dcache_range_inv(addr, addr + size);
>> break;
>> default:
>> /*
>> diff --git a/arch/openrisc/mm/cache.c b/arch/openrisc/mm/cache.c
>> index eb43b73f3855..aca64c5a20b3 100644
>> --- a/arch/openrisc/mm/cache.c
>> +++ b/arch/openrisc/mm/cache.c
>> @@ -14,31 +14,67 @@
>> #include <asm/spr_defs.h>
>> #include <asm/cache.h>
>> #include <asm/cacheflush.h>
>> +#include <asm/cpuinfo.h>
>> #include <asm/tlbflush.h>
>>
>> -static __always_inline void cache_loop(struct page *page, const unsigned int reg)
>> +static __always_inline void cache_loop(struct page *page, unsigned long *start,
>> + unsigned long *end, const unsigned int reg,
>> + const unsigned int cache_type)
>> {
>> - unsigned long paddr = page_to_pfn(page) << PAGE_SHIFT;
>> - unsigned long line = paddr & ~(L1_CACHE_BYTES - 1);
>> + unsigned long paddr, next;
>>
>> - while (line < paddr + PAGE_SIZE) {
>> - mtspr(reg, line);
>> - line += L1_CACHE_BYTES;
>> + if (!cpu_cache_is_present(cache_type))
>> + return;
>> +
>> + if (!cb_inv_flush_is_implemented(reg, cache_type))
>> + return;
>
> This check may be a bit overkill, but OK.
I thought I would implement this because I was not sure of what would happen
when attempting to read from these registers in a processor that didn't have
them.
>> + if (page) {
>> + paddr = page_to_pfn(page) << PAGE_SHIFT;
>> + next = paddr + PAGE_SIZE;
>> + paddr &= ~(L1_CACHE_BYTES - 1);
>> + } else if (start && end) {
>> + paddr = *start;
>> + next = *end;
>
> Overloading the one function with page and start/end seems a bit messy.
>
> It may be nicer to have 2 functions:
>
> cache_loop_page(page, reg, cache_type) {
> unsigned long paddr = page_to_pfn(page) << PAGE_SHIFT;
> unsiogned long end = paddr + PAGE_SIZE;
> paddr &= ~(L1_CACHE_BYTES - 1);
> cache_loop(paddr, end, reg, cache_type);
> }
>
> cache_loop(start, end, reg, cache_type)
>
>> + } else {
>> + printk(KERN_ERR "Missing start and/or end address.\n");
>> + return;
>
> Then this could be removed.
I agree. This is cleaner. I'll make the relevant changes.
Thanks,
Sahil
Powered by blists - more mailing lists