diff options
author | Youngjin Kim <nkim@nvidia.com> | 2010-12-09 15:20:10 +0900 |
---|---|---|
committer | Niket Sirsi <nsirsi@nvidia.com> | 2010-12-13 19:34:15 -0800 |
commit | a16216bd61a6200bef7f1bb3852c749eac6c4688 (patch) | |
tree | 1ef6511a2bb6eb930bdd0fceacf802ffed705dbf | |
parent | 5cea6270cdac231fe9efbbd898bf8883418d65dd (diff) |
Revert "video: tegra: nvmap: Clean whole L1 instead of VA cleaning"
This reverts commit 6469f378a596f0572035cd27a17851ea86b763c9.
Bug 758628
Bug 748669
Original commit attmpted to have a smarter cache cleaning code.
But that work didn't work out well and just resulted in display
corruption.
Reviewed-on: http://git-master/r/11817
(cherry picked from commit 60207394cc16689f06ccbac993eefd2928565031)
Change-Id: I92bd95154f372eb0a081a4c3919b87d576ea4cb5
Reviewed-on: http://git-master/r/12449
Reviewed-by: Youngjin Kim <nkim@nvidia.com>
Tested-by: Youngjin Kim <nkim@nvidia.com>
Reviewed-by: Markus Holtmanns <mholtmanns@nvidia.com>
Tested-by: Markus Holtmanns <mholtmanns@nvidia.com>
Reviewed-by: Niket Sirsi <nsirsi@nvidia.com>
Tested-by: Niket Sirsi <nsirsi@nvidia.com>
Reviewed-by: Yu-Huan Hsu <yhsu@nvidia.com>
-rw-r--r-- | arch/arm/mm/cache-v7.S | 53 | ||||
-rw-r--r-- | drivers/video/tegra/nvmap.c | 26 |
2 files changed, 24 insertions, 55 deletions
diff --git a/arch/arm/mm/cache-v7.S b/arch/arm/mm/cache-v7.S index 24494f0ef917..884ac48a2010 100644 --- a/arch/arm/mm/cache-v7.S +++ b/arch/arm/mm/cache-v7.S @@ -18,28 +18,27 @@ #include "proc-macros.S" /* - * v7_op_dcache_all op + * v7_flush_dcache_all() * - * op=c14, Flush the whole D-cache. - * op=c10 Clean the whould D-cache. + * Flush the whole D-cache. * * Corrupted registers: r0-r7, r9-r11 (r6 only in Thumb mode) * * - mm - mm_struct describing address space */ -.macro v7_op_dcache_all op @ op=c10 clean, op=c14 flush +ENTRY(v7_flush_dcache_all) dmb @ ensure ordering with previous memory accesses mrc p15, 1, r0, c0, c0, 1 @ read clidr ands r3, r0, #0x7000000 @ extract loc from clidr mov r3, r3, lsr #23 @ left align loc bit field - beq 1005f @ if loc is 0, then no need to clean + beq finished @ if loc is 0, then no need to clean mov r10, #0 @ start clean at cache level 0 -1001: +loop1: add r2, r10, r10, lsr #1 @ work out 3x current cache level mov r1, r0, lsr r2 @ extract cache type bits from clidr and r1, r1, #7 @ mask of the bits for current cache only cmp r1, #2 @ see what cache we have at this level - blt 1004f @ skip if no cache, or just i-cache + blt skip @ skip if no cache, or just i-cache mcr p15, 2, r10, c0, c0, 0 @ select current cache level in cssr isb @ isb to sych the new cssr&csidr mrc p15, 1, r1, c0, c0, 0 @ read the new csidr @@ -50,40 +49,32 @@ clz r5, r4 @ find bit position of way size increment ldr r7, =0x7fff ands r7, r7, r1, lsr #13 @ extract max number of the index size -1002: +loop2: mov r9, r4 @ create working copy of max way size -1003: +loop3: ARM( orr r11, r10, r9, lsl r5 ) @ factor way and cache number into r11 THUMB( lsl r6, r9, r5 ) THUMB( orr r11, r10, r6 ) @ factor way and cache number into r11 ARM( orr r11, r11, r7, lsl r2 ) @ factor index number into r11 THUMB( lsl r6, r7, r2 ) THUMB( orr r11, r11, r6 ) @ factor index number into r11 - mcr p15, 0, r11, c7, \op, 2 @ op=c10/c14, clean/clean & invalidate by set/way + mcr p15, 0, r11, c7, c14, 2 @ clean & invalidate by set/way subs r9, r9, #1 @ decrement the way - bge 1003b + bge loop3 subs r7, r7, #1 @ decrement the index - bge 1002b -1004: + bge loop2 +skip: add r10, r10, #2 @ increment cache number cmp r3, r10 - bgt 1001b -1005: + bgt loop1 +finished: mov r10, #0 @ swith back to cache level 0 mcr p15, 2, r10, c0, c0, 0 @ select current cache level in cssr dsb isb mov pc, lr -.endm - -ENTRY(v7_flush_dcache_all) - v7_op_dcache_all c14 ENDPROC(v7_flush_dcache_all) -ENTRY(v7_clean_dcache_all) - v7_op_dcache_all c10 -ENDPROC(v7_clean_dcache_all) - /* * v7_flush_cache_all() * @@ -111,22 +102,6 @@ ENTRY(v7_flush_kern_cache_all) ENDPROC(v7_flush_kern_cache_all) /* - * v7_clean_kern_cache_all() - */ -ENTRY(v7_clean_kern_cache_all) - ARM( stmfd sp!, {r4-r5, r7, r9-r11, lr} ) - THUMB( stmfd sp!, {r4-r7, r9-r11, lr} ) - bl v7_clean_dcache_all - mov r0, #0 -#ifdef CONFIG_SMP - mcr p15, 0, r0, c7, c1, 0 @ invalidate I-cache inner shareable -#endif - ARM( ldmfd sp!, {r4-r5, r7, r9-r11, lr} ) - THUMB( ldmfd sp!, {r4-r7, r9-r11, lr} ) - mov pc, lr -ENDPROC(v7_clean_kern_cache_all) - -/* * v7_flush_cache_all() * * Flush all TLB entries in a particular address space diff --git a/drivers/video/tegra/nvmap.c b/drivers/video/tegra/nvmap.c index ce0da9904afe..f260e1cb9573 100644 --- a/drivers/video/tegra/nvmap.c +++ b/drivers/video/tegra/nvmap.c @@ -149,9 +149,6 @@ static struct rb_root nvmap_handles = RB_ROOT; static struct tegra_iovmm_client *nvmap_vm_client = NULL; -extern void v7_flush_kern_cache_all(void); -extern void v7_clean_kern_cache_all(void); - /* default heap order policy */ static unsigned int _nvmap_heap_policy (unsigned int heaps, int numpages) { @@ -2834,16 +2831,6 @@ static int _nvmap_do_cache_maint(struct nvmap_handle *h, outer_maint = NULL; } - if (end - start > PAGE_SIZE * 3) { - if (op == NVMEM_CACHE_OP_WB) { - v7_clean_kern_cache_all(); - inner_maint = NULL; - } else if (op == NVMEM_CACHE_OP_WB_INV) { - v7_flush_kern_cache_all(); - inner_maint = NULL; - } - } - prot = _nvmap_flag_to_pgprot(h->flags, pgprot_kernel); if (h->alloc && !h->heap_pgalloc) { @@ -2852,7 +2839,7 @@ static int _nvmap_do_cache_maint(struct nvmap_handle *h, spin_unlock(&h->carveout.co_heap->lock); } - while (start < end && (inner_maint || outer_maint)) { + while (start < end) { struct page *page = NULL; unsigned long phys; void *src; @@ -2881,7 +2868,7 @@ static int _nvmap_do_cache_maint(struct nvmap_handle *h, src = addr + (phys & ~PAGE_MASK); count = min_t(size_t, end-start, PAGE_SIZE-(phys&~PAGE_MASK)); - if (inner_maint) inner_maint(src, src+count); + inner_maint(src, src+count); if (outer_maint) outer_maint(phys, phys+count); start += count; if (page) put_page(page); @@ -3026,12 +3013,19 @@ static ssize_t _nvmap_do_rw_handle(struct nvmap_handle *h, int is_read, } while (count--) { - size_t ret = _nvmap_do_one_rw_handle(h, is_read, + size_t ret; + if (is_read) + _nvmap_do_cache_maint(h, h_offs, h_offs + elem_size, + NVMEM_CACHE_OP_INV, false); + ret = _nvmap_do_one_rw_handle(h, is_read, is_user, h_offs, sys_addr, elem_size, &addr); if (ret < 0) { if (!bytes_copied) bytes_copied = ret; break; } + if (!is_read) + _nvmap_do_cache_maint(h, h_offs, h_offs + ret, + NVMEM_CACHE_OP_WB, false); bytes_copied += ret; if (ret < elem_size) break; sys_addr += sys_stride; |