Message ID | 570D00F9.4070406@ti.com (mailing list archive) |
---|---|
State | New, archived |
Headers | show |
On Tue, Apr 12, 2016 at 05:06:49PM +0300, Tero Kristo wrote: > On 04/12/2016 04:25 PM, Mark Rutland wrote: > >On Tue, Apr 12, 2016 at 11:14:39AM +0300, Tero Kristo wrote: > >>Some obvious holes in this implementation: > >> > >>1) during execution of arch/arm/kernel/head.S, the tweaked MMU shareability > >> settings are not in place. However, I am not too sure how much that > >> matters, as I am not sure what is mapped at this point. Kernel image > >> mapping should not matter at least, as we typically should not be doing > >> any DMA transfers from the kernel image. > > > >Strictly speaking, changing the shareability can result in a loss of > >coherency, even if all accesses are made by the same CPU. See > >"Mismatched memory attributes" in section A3.5.7 of the ARMv7-AR > >Reference Manual (ARM DDI 0406C.c). > > Basically we are not attempting to change shareability in-the-fly, > but instead configure a different shareability value that is going > to be used always. I understood that this was a one-time transition; the problem still applies, per the architecture. Your implementation _may_ provide stronger guarantees than architecturally required. Caches lines allocated as a result of accesses with one set of attributes are not necessarily coherent with accesses with differing attributes (even if only differing in terms of shareability). Until the cache maintenance mandated by the ARM ARM is performed, you may encounter a number of issues. Thus changing attributes once during the boot process is potentially problematic. > >It's not just DMA that matters. I believe we may have page tables as > >part of the kernel image, for instance, and those need to be accessed > >with consistent attributes by the MMU when doing page table walks. > > > >You can avoid issues so long as you have appropriate cache maintenance, > >but that's both expensive (all memory previously mapped must be > >Clean+Invalidated by VA) and painful (as you can't reliably use any of > >said memory until after the maintenance). > > The hack we have internally just maps all the DMA pages as outer > shareable. I'm not sure precisely what you mean by "DMA pages" here. Surely this applies to any mappings created using the usual page table accessors? > I think maybe adding the original hack might help understanding the > issue, so added inline in the end as reference. We just attempt to > change the shareability value from 3 (the current) to 2. I understand that you only wish to change the shareability. What I am describing are the caveats that come with doing do, which are not necessarily intuitive, but are laid out in the ARM ARM. Thanks, Mark.
diff --git a/arch/arm/include/asm/pgtable-3level-hwdef.h b/arch/arm/include/asm/pgtable-3level-hwdef.h index f8f1cff..62adf21 100644 --- a/arch/arm/include/asm/pgtable-3level-hwdef.h +++ b/arch/arm/include/asm/pgtable-3level-hwdef.h @@ -44,7 +44,11 @@ #define PMD_SECT_CACHEABLE (_AT(pmdval_t, 1) << 3) #define PMD_SECT_USER (_AT(pmdval_t, 1) << 6) /* AP[1] */ #define PMD_SECT_AP2 (_AT(pmdval_t, 1) << 7) /* read only */ +#ifdef CONFIG_KEYSTONE2_DMA_COHERENT +#define PMD_SECT_S (_AT(pmdval_t, 2) << 8) +#else #define PMD_SECT_S (_AT(pmdval_t, 3) << 8) +#endif #define PMD_SECT_AF (_AT(pmdval_t, 1) << 10) #define PMD_SECT_nG (_AT(pmdval_t, 1) << 11) #define PMD_SECT_PXN (_AT(pmdval_t, 1) << 53) @@ -73,7 +77,12 @@ #define PTE_BUFFERABLE (_AT(pteval_t, 1) << 2) /* AttrIndx[0] */ #define PTE_CACHEABLE (_AT(pteval_t, 1) << 3) /* AttrIndx[1] */ #define PTE_AP2 (_AT(pteval_t, 1) << 7) /* AP[2] */ +#ifdef CONFIG_KEYSTONE2_DMA_COHERENT +/* SH[1:0], outer shareable */ +#define PTE_EXT_SHARED (_AT(pteval_t, 2) << 8) +#else #define PTE_EXT_SHARED (_AT(pteval_t, 3) << 8) /* SH[1:0], inner shareable */ +#endif #define PTE_EXT_AF (_AT(pteval_t, 1) << 10) /* Access Flag */ #define PTE_EXT_NG (_AT(pteval_t, 1) << 11) /* nG */ #define PTE_EXT_PXN (_AT(pteval_t, 1) << 53) /* PXN */ diff --git a/arch/arm/include/asm/pgtable-3level.h b/arch/arm/include/asm/pgtable-3level.h index a745a2a..b4090b1 100644 --- a/arch/arm/include/asm/pgtable-3level.h +++ b/arch/arm/include/asm/pgtable-3level.h @@ -78,7 +78,12 @@ #define L_PTE_VALID (_AT(pteval_t, 1) << 0) /* Valid */ #define L_PTE_PRESENT (_AT(pteval_t, 3) << 0) /* Present */ #define L_PTE_USER (_AT(pteval_t, 1) << 6) /* AP[1] */ +#ifdef CONFIG_KEYSTONE2_DMA_COHERENT +/* SH[1:0], outer shareable */ +#define L_PTE_SHARED (_AT(pteval_t, 2) << 8) +#else #define L_PTE_SHARED (_AT(pteval_t, 3) << 8) /* SH[1:0], inner shareable */ +#endif #define L_PTE_YOUNG (_AT(pteval_t, 1) << 10) /* AF */ #define L_PTE_XN (_AT(pteval_t, 1) << 54) /* XN */ #define L_PTE_DIRTY (_AT(pteval_t, 1) << 55) diff --git a/arch/arm/mach-keystone/Kconfig b/arch/arm/mach-keystone/Kconfig index ea955f6db..558385e 100644 --- a/arch/arm/mach-keystone/Kconfig +++ b/arch/arm/mach-keystone/Kconfig @@ -11,6 +11,10 @@ config ARCH_KEYSTONE select ZONE_DMA if ARM_LPAE select MIGHT_HAVE_PCI select PCI_DOMAINS if PCI + select KEYSTONE2_DMA_COHERENT help Support for boards based on the Texas Instruments Keystone family of SoCs. + +config KEYSTONE2_DMA_COHERENT + bool