Message ID | 20230227175741.71216-18-willy@infradead.org (mailing list archive) |
---|---|
State | Superseded |
Headers | show |
Series | None | expand |
On 2023-02-27 12:57 p.m., Matthew Wilcox (Oracle) wrote: > Add set_ptes(), update_mmu_cache_range(), flush_dcache_folio() > and flush_icache_pages(). Change the PG_arch_1 (aka PG_dcache_dirty) flag > from being per-page to per-folio. > > Signed-off-by: Matthew Wilcox (Oracle) <willy@infradead.org> > Cc: "James E.J. Bottomley" <James.Bottomley@HansenPartnership.com> > Cc: Helge Deller <deller@gmx.de> > Cc: linux-parisc@vger.kernel.org > --- > arch/parisc/include/asm/cacheflush.h | 14 ++-- > arch/parisc/include/asm/pgtable.h | 28 +++++--- > arch/parisc/kernel/cache.c | 101 +++++++++++++++++++-------- > 3 files changed, 99 insertions(+), 44 deletions(-) > > diff --git a/arch/parisc/include/asm/cacheflush.h b/arch/parisc/include/asm/cacheflush.h > index ff07c509e04b..0bf8b69d086b 100644 > --- a/arch/parisc/include/asm/cacheflush.h > +++ b/arch/parisc/include/asm/cacheflush.h > @@ -46,16 +46,20 @@ void invalidate_kernel_vmap_range(void *vaddr, int size); > #define flush_cache_vmap(start, end) flush_cache_all() > #define flush_cache_vunmap(start, end) flush_cache_all() > > +void flush_dcache_folio(struct folio *folio); > +#define flush_dcache_folio flush_dcache_folio > #define ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE 1 > -void flush_dcache_page(struct page *page); > +static inline void flush_dcache_page(struct page *page) > +{ > + flush_dcache_folio(page_folio(page)); > +} > > #define flush_dcache_mmap_lock(mapping) xa_lock_irq(&mapping->i_pages) > #define flush_dcache_mmap_unlock(mapping) xa_unlock_irq(&mapping->i_pages) > > -#define flush_icache_page(vma,page) do { \ > - flush_kernel_dcache_page_addr(page_address(page)); \ > - flush_kernel_icache_page(page_address(page)); \ > -} while (0) > +void flush_icache_pages(struct vm_area_struct *vma, struct page *page, > + unsigned int nr); > +#define flush_icache_page(vma, page) flush_icache_pages(vma, page, 1) > > #define flush_icache_range(s,e) do { \ > flush_kernel_dcache_range_asm(s,e); \ > diff --git a/arch/parisc/include/asm/pgtable.h b/arch/parisc/include/asm/pgtable.h > index e2950f5db7c9..78ee9816f423 100644 > --- a/arch/parisc/include/asm/pgtable.h > +++ b/arch/parisc/include/asm/pgtable.h > @@ -73,14 +73,7 @@ extern void __update_cache(pte_t pte); > mb(); \ > } while(0) > > -#define set_pte_at(mm, addr, pteptr, pteval) \ > - do { \ > - if (pte_present(pteval) && \ > - pte_user(pteval)) \ > - __update_cache(pteval); \ > - *(pteptr) = (pteval); \ > - purge_tlb_entries(mm, addr); \ > - } while (0) > +#define set_pte_at(mm, addr, ptep, pte) set_ptes(mm, addr, ptep, pte, 1) > > #endif /* !__ASSEMBLY__ */ > > @@ -391,11 +384,28 @@ static inline unsigned long pmd_page_vaddr(pmd_t pmd) > > extern void paging_init (void); > > +static inline void set_ptes(struct mm_struct *mm, unsigned long addr, > + pte_t *ptep, pte_t pte, unsigned int nr) > +{ > + if (pte_present(pte) && pte_user(pte)) > + __update_cache(pte); > + for (;;) { > + *ptep = pte; > + purge_tlb_entries(mm, addr); > + if (--nr == 0) > + break; > + ptep++; > + pte_val(pte) += 1 << PFN_PTE_SHIFT; > + addr += PAGE_SIZE; > + } > +} > + > /* Used for deferring calls to flush_dcache_page() */ > > #define PG_dcache_dirty PG_arch_1 > > -#define update_mmu_cache(vms,addr,ptep) __update_cache(*ptep) > +#define update_mmu_cache_range(vma, addr, ptep, nr) __update_cache(*ptep) > +#define update_mmu_cache(vma, addr, ptep) __update_cache(*ptep) > > /* > * Encode/decode swap entries and swap PTEs. Swap PTEs are all PTEs that > diff --git a/arch/parisc/kernel/cache.c b/arch/parisc/kernel/cache.c > index 984d3a1b3828..16057812103b 100644 > --- a/arch/parisc/kernel/cache.c > +++ b/arch/parisc/kernel/cache.c > @@ -92,11 +92,11 @@ static inline void flush_data_cache(void) > /* Kernel virtual address of pfn. */ > #define pfn_va(pfn) __va(PFN_PHYS(pfn)) > > -void > -__update_cache(pte_t pte) > +void __update_cache(pte_t pte) > { > unsigned long pfn = pte_pfn(pte); > - struct page *page; > + struct folio *folio; > + unsigned int nr; > > /* We don't have pte special. As a result, we can be called with > an invalid pfn and we don't need to flush the kernel dcache page. > @@ -104,13 +104,17 @@ __update_cache(pte_t pte) > if (!pfn_valid(pfn)) > return; > > - page = pfn_to_page(pfn); > - if (page_mapping_file(page) && > - test_bit(PG_dcache_dirty, &page->flags)) { > - flush_kernel_dcache_page_addr(pfn_va(pfn)); > - clear_bit(PG_dcache_dirty, &page->flags); > + folio = page_folio(pfn_to_page(pfn)); > + pfn = folio_pfn(folio); > + nr = folio_nr_pages(folio); > + if (folio_flush_mapping(folio) && Shouldn't this call be to folio_mapping()? > + test_bit(PG_dcache_dirty, &folio->flags)) { > + while (nr--) > + flush_kernel_dcache_page_addr(pfn_va(pfn + nr)); > + clear_bit(PG_dcache_dirty, &folio->flags); > } else if (parisc_requires_coherency()) > - flush_kernel_dcache_page_addr(pfn_va(pfn)); > + while (nr--) > + flush_kernel_dcache_page_addr(pfn_va(pfn + nr)); > } > > void > @@ -365,6 +369,20 @@ static void flush_user_cache_page(struct vm_area_struct *vma, unsigned long vmad > preempt_enable(); > } > > +void flush_icache_pages(struct vm_area_struct *vma, struct page *page, > + unsigned int nr) > +{ > + void *kaddr = page_address(page); > + > + for (;;) { > + flush_kernel_dcache_page_addr(kaddr); > + flush_kernel_icache_page(kaddr); > + if (--nr == 0) > + break; > + page += PAGE_SIZE; > + } > +} > + > static inline pte_t *get_ptep(struct mm_struct *mm, unsigned long addr) > { > pte_t *ptep = NULL; > @@ -393,26 +411,30 @@ static inline bool pte_needs_flush(pte_t pte) > == (_PAGE_PRESENT | _PAGE_ACCESSED); > } > > -void flush_dcache_page(struct page *page) > +void flush_dcache_folio(struct folio *folio) > { > - struct address_space *mapping = page_mapping_file(page); > - struct vm_area_struct *mpnt; > - unsigned long offset; > + struct address_space *mapping = folio_flush_mapping(folio); Likewise. > + struct vm_area_struct *vma; > unsigned long addr, old_addr = 0; > + void *kaddr; > unsigned long count = 0; > + unsigned long i, nr; > pgoff_t pgoff; > > if (mapping && !mapping_mapped(mapping)) { > - set_bit(PG_dcache_dirty, &page->flags); > + set_bit(PG_dcache_dirty, &folio->flags); > return; > } > > - flush_kernel_dcache_page_addr(page_address(page)); > + nr = folio_nr_pages(folio); > + kaddr = folio_address(folio); > + for (i = 0; i < nr; i++) > + flush_kernel_dcache_page_addr(kaddr + i * PAGE_SIZE); > > if (!mapping) > return; > > - pgoff = page->index; > + pgoff = folio->index; > > /* > * We have carefully arranged in arch_get_unmapped_area() that > @@ -422,15 +444,29 @@ void flush_dcache_page(struct page *page) > * on machines that support equivalent aliasing > */ > flush_dcache_mmap_lock(mapping); > - vma_interval_tree_foreach(mpnt, &mapping->i_mmap, pgoff, pgoff) { > - offset = (pgoff - mpnt->vm_pgoff) << PAGE_SHIFT; > - addr = mpnt->vm_start + offset; > - if (parisc_requires_coherency()) { > - pte_t *ptep; > + vma_interval_tree_foreach(vma, &mapping->i_mmap, pgoff, pgoff + nr - 1) { > + unsigned long offset = pgoff - vma->vm_pgoff; > + unsigned long pfn = folio_pfn(folio); > + > + addr = vma->vm_start; > + nr = folio_nr_pages(folio); > + if (offset > -nr) { > + pfn -= offset; > + nr += offset; > + } else { > + addr += offset * PAGE_SIZE; > + } > + if (addr + nr * PAGE_SIZE > vma->vm_end) > + nr = (vma->vm_end - addr) / PAGE_SIZE; > > - ptep = get_ptep(mpnt->vm_mm, addr); > - if (ptep && pte_needs_flush(*ptep)) > - flush_user_cache_page(mpnt, addr); > + if (parisc_requires_coherency()) { > + for (i = 0; i < nr; i++) { > + pte_t *ptep = get_ptep(vma->vm_mm, > + addr + i * PAGE_SIZE); > + if (ptep && pte_needs_flush(*ptep)) > + flush_user_cache_page(vma, > + addr + i * PAGE_SIZE); > + } > } else { > /* > * The TLB is the engine of coherence on parisc: > @@ -443,27 +479,32 @@ void flush_dcache_page(struct page *page) > * in (until the user or kernel specifically > * accesses it, of course) > */ > - flush_tlb_page(mpnt, addr); > + for (i = 0; i < nr; i++) > + flush_tlb_page(vma, addr + i * PAGE_SIZE); > if (old_addr == 0 || (old_addr & (SHM_COLOUR - 1)) > != (addr & (SHM_COLOUR - 1))) { > - __flush_cache_page(mpnt, addr, page_to_phys(page)); > + for (i = 0; i < nr; i++) > + __flush_cache_page(vma, > + addr + i * PAGE_SIZE, > + (pfn + i) * PAGE_SIZE); > /* > * Software is allowed to have any number > * of private mappings to a page. > */ > - if (!(mpnt->vm_flags & VM_SHARED)) > + if (!(vma->vm_flags & VM_SHARED)) > continue; > if (old_addr) > pr_err("INEQUIVALENT ALIASES 0x%lx and 0x%lx in file %pD\n", > - old_addr, addr, mpnt->vm_file); > - old_addr = addr; > + old_addr, addr, vma->vm_file); > + if (nr == folio_nr_pages(folio)) > + old_addr = addr; > } > } > WARN_ON(++count == 4096); > } > flush_dcache_mmap_unlock(mapping); > } > -EXPORT_SYMBOL(flush_dcache_page); > +EXPORT_SYMBOL(flush_dcache_folio); > > /* Defined in arch/parisc/kernel/pacache.S */ > EXPORT_SYMBOL(flush_kernel_dcache_range_asm);
On Mon, Feb 27, 2023 at 05:49:18PM -0500, John David Anglin wrote: > > @@ -104,13 +104,17 @@ __update_cache(pte_t pte) > > if (!pfn_valid(pfn)) > > return; > > - page = pfn_to_page(pfn); > > - if (page_mapping_file(page) && > > - test_bit(PG_dcache_dirty, &page->flags)) { > > - flush_kernel_dcache_page_addr(pfn_va(pfn)); > > - clear_bit(PG_dcache_dirty, &page->flags); > > + folio = page_folio(pfn_to_page(pfn)); > > + pfn = folio_pfn(folio); > > + nr = folio_nr_pages(folio); > > + if (folio_flush_mapping(folio) && > Shouldn't this call be to folio_mapping()? For pages in the swap cache, folio_mapping() will return the swap cache mapping, which isn't what we want. folio_file_mapping() will return the swap file mapping, which is also not what we want. folio_flush_mapping() returns NULL, which is what we want.
diff --git a/arch/parisc/include/asm/cacheflush.h b/arch/parisc/include/asm/cacheflush.h index ff07c509e04b..0bf8b69d086b 100644 --- a/arch/parisc/include/asm/cacheflush.h +++ b/arch/parisc/include/asm/cacheflush.h @@ -46,16 +46,20 @@ void invalidate_kernel_vmap_range(void *vaddr, int size); #define flush_cache_vmap(start, end) flush_cache_all() #define flush_cache_vunmap(start, end) flush_cache_all() +void flush_dcache_folio(struct folio *folio); +#define flush_dcache_folio flush_dcache_folio #define ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE 1 -void flush_dcache_page(struct page *page); +static inline void flush_dcache_page(struct page *page) +{ + flush_dcache_folio(page_folio(page)); +} #define flush_dcache_mmap_lock(mapping) xa_lock_irq(&mapping->i_pages) #define flush_dcache_mmap_unlock(mapping) xa_unlock_irq(&mapping->i_pages) -#define flush_icache_page(vma,page) do { \ - flush_kernel_dcache_page_addr(page_address(page)); \ - flush_kernel_icache_page(page_address(page)); \ -} while (0) +void flush_icache_pages(struct vm_area_struct *vma, struct page *page, + unsigned int nr); +#define flush_icache_page(vma, page) flush_icache_pages(vma, page, 1) #define flush_icache_range(s,e) do { \ flush_kernel_dcache_range_asm(s,e); \ diff --git a/arch/parisc/include/asm/pgtable.h b/arch/parisc/include/asm/pgtable.h index e2950f5db7c9..78ee9816f423 100644 --- a/arch/parisc/include/asm/pgtable.h +++ b/arch/parisc/include/asm/pgtable.h @@ -73,14 +73,7 @@ extern void __update_cache(pte_t pte); mb(); \ } while(0) -#define set_pte_at(mm, addr, pteptr, pteval) \ - do { \ - if (pte_present(pteval) && \ - pte_user(pteval)) \ - __update_cache(pteval); \ - *(pteptr) = (pteval); \ - purge_tlb_entries(mm, addr); \ - } while (0) +#define set_pte_at(mm, addr, ptep, pte) set_ptes(mm, addr, ptep, pte, 1) #endif /* !__ASSEMBLY__ */ @@ -391,11 +384,28 @@ static inline unsigned long pmd_page_vaddr(pmd_t pmd) extern void paging_init (void); +static inline void set_ptes(struct mm_struct *mm, unsigned long addr, + pte_t *ptep, pte_t pte, unsigned int nr) +{ + if (pte_present(pte) && pte_user(pte)) + __update_cache(pte); + for (;;) { + *ptep = pte; + purge_tlb_entries(mm, addr); + if (--nr == 0) + break; + ptep++; + pte_val(pte) += 1 << PFN_PTE_SHIFT; + addr += PAGE_SIZE; + } +} + /* Used for deferring calls to flush_dcache_page() */ #define PG_dcache_dirty PG_arch_1 -#define update_mmu_cache(vms,addr,ptep) __update_cache(*ptep) +#define update_mmu_cache_range(vma, addr, ptep, nr) __update_cache(*ptep) +#define update_mmu_cache(vma, addr, ptep) __update_cache(*ptep) /* * Encode/decode swap entries and swap PTEs. Swap PTEs are all PTEs that diff --git a/arch/parisc/kernel/cache.c b/arch/parisc/kernel/cache.c index 984d3a1b3828..16057812103b 100644 --- a/arch/parisc/kernel/cache.c +++ b/arch/parisc/kernel/cache.c @@ -92,11 +92,11 @@ static inline void flush_data_cache(void) /* Kernel virtual address of pfn. */ #define pfn_va(pfn) __va(PFN_PHYS(pfn)) -void -__update_cache(pte_t pte) +void __update_cache(pte_t pte) { unsigned long pfn = pte_pfn(pte); - struct page *page; + struct folio *folio; + unsigned int nr; /* We don't have pte special. As a result, we can be called with an invalid pfn and we don't need to flush the kernel dcache page. @@ -104,13 +104,17 @@ __update_cache(pte_t pte) if (!pfn_valid(pfn)) return; - page = pfn_to_page(pfn); - if (page_mapping_file(page) && - test_bit(PG_dcache_dirty, &page->flags)) { - flush_kernel_dcache_page_addr(pfn_va(pfn)); - clear_bit(PG_dcache_dirty, &page->flags); + folio = page_folio(pfn_to_page(pfn)); + pfn = folio_pfn(folio); + nr = folio_nr_pages(folio); + if (folio_flush_mapping(folio) && + test_bit(PG_dcache_dirty, &folio->flags)) { + while (nr--) + flush_kernel_dcache_page_addr(pfn_va(pfn + nr)); + clear_bit(PG_dcache_dirty, &folio->flags); } else if (parisc_requires_coherency()) - flush_kernel_dcache_page_addr(pfn_va(pfn)); + while (nr--) + flush_kernel_dcache_page_addr(pfn_va(pfn + nr)); } void @@ -365,6 +369,20 @@ static void flush_user_cache_page(struct vm_area_struct *vma, unsigned long vmad preempt_enable(); } +void flush_icache_pages(struct vm_area_struct *vma, struct page *page, + unsigned int nr) +{ + void *kaddr = page_address(page); + + for (;;) { + flush_kernel_dcache_page_addr(kaddr); + flush_kernel_icache_page(kaddr); + if (--nr == 0) + break; + page += PAGE_SIZE; + } +} + static inline pte_t *get_ptep(struct mm_struct *mm, unsigned long addr) { pte_t *ptep = NULL; @@ -393,26 +411,30 @@ static inline bool pte_needs_flush(pte_t pte) == (_PAGE_PRESENT | _PAGE_ACCESSED); } -void flush_dcache_page(struct page *page) +void flush_dcache_folio(struct folio *folio) { - struct address_space *mapping = page_mapping_file(page); - struct vm_area_struct *mpnt; - unsigned long offset; + struct address_space *mapping = folio_flush_mapping(folio); + struct vm_area_struct *vma; unsigned long addr, old_addr = 0; + void *kaddr; unsigned long count = 0; + unsigned long i, nr; pgoff_t pgoff; if (mapping && !mapping_mapped(mapping)) { - set_bit(PG_dcache_dirty, &page->flags); + set_bit(PG_dcache_dirty, &folio->flags); return; } - flush_kernel_dcache_page_addr(page_address(page)); + nr = folio_nr_pages(folio); + kaddr = folio_address(folio); + for (i = 0; i < nr; i++) + flush_kernel_dcache_page_addr(kaddr + i * PAGE_SIZE); if (!mapping) return; - pgoff = page->index; + pgoff = folio->index; /* * We have carefully arranged in arch_get_unmapped_area() that @@ -422,15 +444,29 @@ void flush_dcache_page(struct page *page) * on machines that support equivalent aliasing */ flush_dcache_mmap_lock(mapping); - vma_interval_tree_foreach(mpnt, &mapping->i_mmap, pgoff, pgoff) { - offset = (pgoff - mpnt->vm_pgoff) << PAGE_SHIFT; - addr = mpnt->vm_start + offset; - if (parisc_requires_coherency()) { - pte_t *ptep; + vma_interval_tree_foreach(vma, &mapping->i_mmap, pgoff, pgoff + nr - 1) { + unsigned long offset = pgoff - vma->vm_pgoff; + unsigned long pfn = folio_pfn(folio); + + addr = vma->vm_start; + nr = folio_nr_pages(folio); + if (offset > -nr) { + pfn -= offset; + nr += offset; + } else { + addr += offset * PAGE_SIZE; + } + if (addr + nr * PAGE_SIZE > vma->vm_end) + nr = (vma->vm_end - addr) / PAGE_SIZE; - ptep = get_ptep(mpnt->vm_mm, addr); - if (ptep && pte_needs_flush(*ptep)) - flush_user_cache_page(mpnt, addr); + if (parisc_requires_coherency()) { + for (i = 0; i < nr; i++) { + pte_t *ptep = get_ptep(vma->vm_mm, + addr + i * PAGE_SIZE); + if (ptep && pte_needs_flush(*ptep)) + flush_user_cache_page(vma, + addr + i * PAGE_SIZE); + } } else { /* * The TLB is the engine of coherence on parisc: @@ -443,27 +479,32 @@ void flush_dcache_page(struct page *page) * in (until the user or kernel specifically * accesses it, of course) */ - flush_tlb_page(mpnt, addr); + for (i = 0; i < nr; i++) + flush_tlb_page(vma, addr + i * PAGE_SIZE); if (old_addr == 0 || (old_addr & (SHM_COLOUR - 1)) != (addr & (SHM_COLOUR - 1))) { - __flush_cache_page(mpnt, addr, page_to_phys(page)); + for (i = 0; i < nr; i++) + __flush_cache_page(vma, + addr + i * PAGE_SIZE, + (pfn + i) * PAGE_SIZE); /* * Software is allowed to have any number * of private mappings to a page. */ - if (!(mpnt->vm_flags & VM_SHARED)) + if (!(vma->vm_flags & VM_SHARED)) continue; if (old_addr) pr_err("INEQUIVALENT ALIASES 0x%lx and 0x%lx in file %pD\n", - old_addr, addr, mpnt->vm_file); - old_addr = addr; + old_addr, addr, vma->vm_file); + if (nr == folio_nr_pages(folio)) + old_addr = addr; } } WARN_ON(++count == 4096); } flush_dcache_mmap_unlock(mapping); } -EXPORT_SYMBOL(flush_dcache_page); +EXPORT_SYMBOL(flush_dcache_folio); /* Defined in arch/parisc/kernel/pacache.S */ EXPORT_SYMBOL(flush_kernel_dcache_range_asm);
Add set_ptes(), update_mmu_cache_range(), flush_dcache_folio() and flush_icache_pages(). Change the PG_arch_1 (aka PG_dcache_dirty) flag from being per-page to per-folio. Signed-off-by: Matthew Wilcox (Oracle) <willy@infradead.org> Cc: "James E.J. Bottomley" <James.Bottomley@HansenPartnership.com> Cc: Helge Deller <deller@gmx.de> Cc: linux-parisc@vger.kernel.org --- arch/parisc/include/asm/cacheflush.h | 14 ++-- arch/parisc/include/asm/pgtable.h | 28 +++++--- arch/parisc/kernel/cache.c | 101 +++++++++++++++++++-------- 3 files changed, 99 insertions(+), 44 deletions(-)