]>
Commit | Line | Data |
---|---|---|
1da177e4 LT |
1 | /* |
2 | * arch/sh/mm/cache-sh4.c | |
3 | * | |
4 | * Copyright (C) 1999, 2000, 2002 Niibe Yutaka | |
deaef20e | 5 | * Copyright (C) 2001 - 2009 Paul Mundt |
1da177e4 | 6 | * Copyright (C) 2003 Richard Curnow |
09b5a10c | 7 | * Copyright (c) 2007 STMicroelectronics (R&D) Ltd. |
1da177e4 LT |
8 | * |
9 | * This file is subject to the terms and conditions of the GNU General Public | |
10 | * License. See the file "COPYING" in the main directory of this archive | |
11 | * for more details. | |
12 | */ | |
1da177e4 | 13 | #include <linux/init.h> |
1da177e4 | 14 | #include <linux/mm.h> |
52e27782 PM |
15 | #include <linux/io.h> |
16 | #include <linux/mutex.h> | |
2277ab4a | 17 | #include <linux/fs.h> |
deaef20e PM |
18 | #include <linux/highmem.h> |
19 | #include <asm/pgtable.h> | |
1da177e4 | 20 | #include <asm/mmu_context.h> |
f03c4866 | 21 | #include <asm/cache_insns.h> |
1da177e4 LT |
22 | #include <asm/cacheflush.h> |
23 | ||
28ccf7f9 PM |
24 | /* |
25 | * The maximum number of pages we support up to when doing ranged icache | |
26 | * flushing. Anything exceeding this will simply flush the caches in their | |
27 | * entirety. | |
28 | */ | |
09b5a10c | 29 | #define MAX_ICACHE_PAGES 32 |
28ccf7f9 | 30 | |
a7a7c0e1 | 31 | static void __flush_cache_one(unsigned long addr, unsigned long phys, |
a252710f | 32 | unsigned long exec_offset); |
b638d0b9 | 33 | |
1da177e4 LT |
34 | /* |
35 | * Write back the range of D-cache, and purge the I-cache. | |
36 | * | |
09b5a10c CS |
37 | * Called from kernel/module.c:sys_init_module and routine for a.out format, |
38 | * signal handler code and kprobes code | |
1da177e4 | 39 | */ |
2dc2f8e0 | 40 | static void sh4_flush_icache_range(void *args) |
1da177e4 | 41 | { |
f26b2a56 | 42 | struct flusher_data *data = args; |
f26b2a56 | 43 | unsigned long start, end; |
983f4c51 | 44 | unsigned long flags, v; |
1da177e4 LT |
45 | int i; |
46 | ||
f26b2a56 PM |
47 | start = data->addr1; |
48 | end = data->addr2; | |
49 | ||
682f88ab PM |
50 | /* If there are too many pages then just blow away the caches */ |
51 | if (((end - start) >> PAGE_SHIFT) >= MAX_ICACHE_PAGES) { | |
52 | local_flush_cache_all(NULL); | |
53 | return; | |
54 | } | |
55 | ||
56 | /* | |
57 | * Selectively flush d-cache then invalidate the i-cache. | |
58 | * This is inefficient, so only use this for small ranges. | |
59 | */ | |
60 | start &= ~(L1_CACHE_BYTES-1); | |
61 | end += L1_CACHE_BYTES-1; | |
62 | end &= ~(L1_CACHE_BYTES-1); | |
983f4c51 | 63 | |
682f88ab PM |
64 | local_irq_save(flags); |
65 | jump_to_uncached(); | |
983f4c51 | 66 | |
682f88ab PM |
67 | for (v = start; v < end; v += L1_CACHE_BYTES) { |
68 | unsigned long icacheaddr; | |
a9d244a2 | 69 | int j, n; |
983f4c51 | 70 | |
682f88ab | 71 | __ocbwb(v); |
983f4c51 | 72 | |
682f88ab PM |
73 | icacheaddr = CACHE_IC_ADDRESS_ARRAY | (v & |
74 | cpu_data->icache.entry_mask); | |
09b5a10c | 75 | |
682f88ab | 76 | /* Clear i-cache line valid-bit */ |
a9d244a2 | 77 | n = boot_cpu_data.icache.n_aliases; |
682f88ab | 78 | for (i = 0; i < cpu_data->icache.ways; i++) { |
a9d244a2 MF |
79 | for (j = 0; j < n; j++) |
80 | __raw_writel(0, icacheaddr + (j * PAGE_SIZE)); | |
682f88ab PM |
81 | icacheaddr += cpu_data->icache.way_incr; |
82 | } | |
09b5a10c | 83 | } |
682f88ab PM |
84 | |
85 | back_to_cached(); | |
86 | local_irq_restore(flags); | |
1da177e4 LT |
87 | } |
88 | ||
a7a7c0e1 | 89 | static inline void flush_cache_one(unsigned long start, unsigned long phys) |
1da177e4 | 90 | { |
983f4c51 | 91 | unsigned long flags, exec_offset = 0; |
33573c0e | 92 | |
1da177e4 | 93 | /* |
1f69b6af MF |
94 | * All types of SH-4 require PC to be uncached to operate on the I-cache. |
95 | * Some types of SH-4 require PC to be uncached to operate on the D-cache. | |
1da177e4 | 96 | */ |
7ec9d6f8 | 97 | if ((boot_cpu_data.flags & CPU_HAS_P2_FLUSH_BUG) || |
33573c0e | 98 | (start < CACHE_OC_ADDRESS_ARRAY)) |
1f69b6af | 99 | exec_offset = cached_to_uncached; |
33573c0e | 100 | |
983f4c51 | 101 | local_irq_save(flags); |
a781d1e5 | 102 | __flush_cache_one(start, phys, exec_offset); |
983f4c51 | 103 | local_irq_restore(flags); |
1da177e4 LT |
104 | } |
105 | ||
106 | /* | |
107 | * Write back & invalidate the D-cache of the page. | |
108 | * (To avoid "alias" issues) | |
109 | */ | |
e76a0136 | 110 | static void sh4_flush_dcache_page(void *arg) |
1da177e4 | 111 | { |
e76a0136 | 112 | struct page *page = arg; |
b4c89276 | 113 | unsigned long addr = (unsigned long)page_address(page); |
c139a595 | 114 | #ifndef CONFIG_SMP |
2277ab4a PM |
115 | struct address_space *mapping = page_mapping(page); |
116 | ||
2277ab4a | 117 | if (mapping && !mapping_mapped(mapping)) |
55661fc1 | 118 | clear_bit(PG_dcache_clean, &page->flags); |
2277ab4a PM |
119 | else |
120 | #endif | |
b4c89276 MF |
121 | flush_cache_one(CACHE_OC_ADDRESS_ARRAY | |
122 | (addr & shm_align_mask), page_to_phys(page)); | |
fdfc74f9 PM |
123 | |
124 | wmb(); | |
1da177e4 LT |
125 | } |
126 | ||
28ccf7f9 | 127 | /* TODO: Selective icache invalidation through IC address array.. */ |
2dc2f8e0 | 128 | static void flush_icache_all(void) |
1da177e4 | 129 | { |
983f4c51 | 130 | unsigned long flags, ccr; |
1da177e4 | 131 | |
983f4c51 | 132 | local_irq_save(flags); |
cbaa118e | 133 | jump_to_uncached(); |
1da177e4 LT |
134 | |
135 | /* Flush I-cache */ | |
a5f6ea29 | 136 | ccr = __raw_readl(SH_CCR); |
1da177e4 | 137 | ccr |= CCR_CACHE_ICI; |
a5f6ea29 | 138 | __raw_writel(ccr, SH_CCR); |
1da177e4 | 139 | |
29847622 | 140 | /* |
cbaa118e | 141 | * back_to_cached() will take care of the barrier for us, don't add |
29847622 PM |
142 | * another one! |
143 | */ | |
983f4c51 | 144 | |
cbaa118e | 145 | back_to_cached(); |
983f4c51 | 146 | local_irq_restore(flags); |
1da177e4 LT |
147 | } |
148 | ||
bd6df574 | 149 | static void flush_dcache_all(void) |
1da177e4 | 150 | { |
bd6df574 PM |
151 | unsigned long addr, end_addr, entry_offset; |
152 | ||
153 | end_addr = CACHE_OC_ADDRESS_ARRAY + | |
154 | (current_cpu_data.dcache.sets << | |
155 | current_cpu_data.dcache.entry_shift) * | |
156 | current_cpu_data.dcache.ways; | |
157 | ||
158 | entry_offset = 1 << current_cpu_data.dcache.entry_shift; | |
159 | ||
160 | for (addr = CACHE_OC_ADDRESS_ARRAY; addr < end_addr; ) { | |
161 | __raw_writel(0, addr); addr += entry_offset; | |
162 | __raw_writel(0, addr); addr += entry_offset; | |
163 | __raw_writel(0, addr); addr += entry_offset; | |
164 | __raw_writel(0, addr); addr += entry_offset; | |
165 | __raw_writel(0, addr); addr += entry_offset; | |
166 | __raw_writel(0, addr); addr += entry_offset; | |
167 | __raw_writel(0, addr); addr += entry_offset; | |
168 | __raw_writel(0, addr); addr += entry_offset; | |
169 | } | |
a252710f PM |
170 | } |
171 | ||
/*
 * Flush the whole D-cache first, then the whole I-cache.
 * The argument is not used.
 */
static void sh4_flush_cache_all(void *unused)
{
	flush_dcache_all();
	flush_icache_all();
}
177 | ||
28ccf7f9 PM |
178 | /* |
179 | * Note : (RPC) since the caches are physically tagged, the only point | |
180 | * of flush_cache_mm for SH-4 is to get rid of aliases from the | |
181 | * D-cache. The assumption elsewhere, e.g. flush_cache_range, is that | |
182 | * lines can stay resident so long as the virtual address they were | |
183 | * accessed with (hence cache set) is in accord with the physical | |
654d364e | 184 | * address (i.e. tag). It's no different here. |
28ccf7f9 PM |
185 | * |
186 | * Caller takes mm->mmap_sem. | |
187 | */ | |
f26b2a56 | 188 | static void sh4_flush_cache_mm(void *arg) |
1da177e4 | 189 | { |
f26b2a56 PM |
190 | struct mm_struct *mm = arg; |
191 | ||
e7b8b7f1 PM |
192 | if (cpu_context(smp_processor_id(), mm) == NO_CONTEXT) |
193 | return; | |
194 | ||
654d364e | 195 | flush_dcache_all(); |
1da177e4 LT |
196 | } |
197 | ||
198 | /* | |
199 | * Write back and invalidate I/D-caches for the page. | |
200 | * | |
201 | * ADDR: Virtual Address (U0 address) | |
202 | * PFN: Physical page number | |
203 | */ | |
f26b2a56 | 204 | static void sh4_flush_cache_page(void *args) |
1da177e4 | 205 | { |
f26b2a56 PM |
206 | struct flusher_data *data = args; |
207 | struct vm_area_struct *vma; | |
deaef20e | 208 | struct page *page; |
f26b2a56 | 209 | unsigned long address, pfn, phys; |
deaef20e PM |
210 | int map_coherent = 0; |
211 | pgd_t *pgd; | |
212 | pud_t *pud; | |
213 | pmd_t *pmd; | |
214 | pte_t *pte; | |
215 | void *vaddr; | |
b638d0b9 | 216 | |
f26b2a56 | 217 | vma = data->vma; |
abeaf33a | 218 | address = data->addr1 & PAGE_MASK; |
f26b2a56 PM |
219 | pfn = data->addr2; |
220 | phys = pfn << PAGE_SHIFT; | |
deaef20e | 221 | page = pfn_to_page(pfn); |
f26b2a56 | 222 | |
e7b8b7f1 PM |
223 | if (cpu_context(smp_processor_id(), vma->vm_mm) == NO_CONTEXT) |
224 | return; | |
225 | ||
deaef20e PM |
226 | pgd = pgd_offset(vma->vm_mm, address); |
227 | pud = pud_offset(pgd, address); | |
228 | pmd = pmd_offset(pud, address); | |
229 | pte = pte_offset_kernel(pmd, address); | |
230 | ||
231 | /* If the page isn't present, there is nothing to do here. */ | |
232 | if (!(pte_val(*pte) & _PAGE_PRESENT)) | |
233 | return; | |
1da177e4 | 234 | |
deaef20e PM |
235 | if ((vma->vm_mm == current->active_mm)) |
236 | vaddr = NULL; | |
237 | else { | |
b638d0b9 | 238 | /* |
deaef20e PM |
239 | * Use kmap_coherent or kmap_atomic to do flushes for |
240 | * another ASID than the current one. | |
b638d0b9 | 241 | */ |
deaef20e | 242 | map_coherent = (current_cpu_data.dcache.n_aliases && |
55661fc1 | 243 | test_bit(PG_dcache_clean, &page->flags) && |
e1534ae9 | 244 | page_mapcount(page)); |
deaef20e PM |
245 | if (map_coherent) |
246 | vaddr = kmap_coherent(page, address); | |
247 | else | |
bc3e11be | 248 | vaddr = kmap_atomic(page); |
deaef20e PM |
249 | |
250 | address = (unsigned long)vaddr; | |
251 | } | |
252 | ||
e717cc6c | 253 | flush_cache_one(CACHE_OC_ADDRESS_ARRAY | |
deaef20e PM |
254 | (address & shm_align_mask), phys); |
255 | ||
256 | if (vma->vm_flags & VM_EXEC) | |
257 | flush_icache_all(); | |
258 | ||
259 | if (vaddr) { | |
260 | if (map_coherent) | |
261 | kunmap_coherent(vaddr); | |
262 | else | |
bc3e11be | 263 | kunmap_atomic(vaddr); |
b638d0b9 | 264 | } |
1da177e4 LT |
265 | } |
266 | ||
267 | /* | |
268 | * Write back and invalidate D-caches. | |
269 | * | |
270 | * START, END: Virtual Address (U0 address) | |
271 | * | |
272 | * NOTE: We need to flush the _physical_ page entry. | |
273 | * Flushing the cache lines for U0 only isn't enough. | |
274 | * We need to flush for P1 too, which may contain aliases. | |
275 | */ | |
f26b2a56 | 276 | static void sh4_flush_cache_range(void *args) |
1da177e4 | 277 | { |
f26b2a56 PM |
278 | struct flusher_data *data = args; |
279 | struct vm_area_struct *vma; | |
280 | unsigned long start, end; | |
281 | ||
282 | vma = data->vma; | |
283 | start = data->addr1; | |
284 | end = data->addr2; | |
285 | ||
e7b8b7f1 PM |
286 | if (cpu_context(smp_processor_id(), vma->vm_mm) == NO_CONTEXT) |
287 | return; | |
288 | ||
b638d0b9 RC |
289 | /* |
290 | * If cache is only 4k-per-way, there are never any 'aliases'. Since | |
291 | * the cache is physically tagged, the data can just be left in there. | |
292 | */ | |
7ec9d6f8 | 293 | if (boot_cpu_data.dcache.n_aliases == 0) |
b638d0b9 RC |
294 | return; |
295 | ||
654d364e | 296 | flush_dcache_all(); |
b638d0b9 | 297 | |
654d364e | 298 | if (vma->vm_flags & VM_EXEC) |
1da177e4 LT |
299 | flush_icache_all(); |
300 | } | |
301 | ||
b638d0b9 | 302 | /** |
a7a7c0e1 | 303 | * __flush_cache_one |
b638d0b9 RC |
304 | * |
305 | * @addr: address in memory mapped cache array | |
306 | * @phys: P1 address to flush (has to match tags if addr has 'A' bit | |
307 | * set i.e. associative write) | |
308 | * @exec_offset: set to 0x20000000 if flush has to be executed from P2 | |
309 | * region else 0x0 | |
310 | * | |
311 | * The offset into the cache array implied by 'addr' selects the | |
312 | * 'colour' of the virtual address range that will be flushed. The | |
313 | * operation (purge/write-back) is selected by the lower 2 bits of | |
314 | * 'phys'. | |
315 | */ | |
a7a7c0e1 | 316 | static void __flush_cache_one(unsigned long addr, unsigned long phys, |
b638d0b9 RC |
317 | unsigned long exec_offset) |
318 | { | |
319 | int way_count; | |
320 | unsigned long base_addr = addr; | |
321 | struct cache_info *dcache; | |
322 | unsigned long way_incr; | |
323 | unsigned long a, ea, p; | |
324 | unsigned long temp_pc; | |
325 | ||
7ec9d6f8 | 326 | dcache = &boot_cpu_data.dcache; |
b638d0b9 RC |
327 | /* Write this way for better assembly. */ |
328 | way_count = dcache->ways; | |
329 | way_incr = dcache->way_incr; | |
330 | ||
331 | /* | |
332 | * Apply exec_offset (i.e. branch to P2 if required.). | |
333 | * | |
334 | * FIXME: | |
335 | * | |
336 | * If I write "=r" for the (temp_pc), it puts this in r6 hence | |
337 | * trashing exec_offset before it's been added on - why? Hence | |
338 | * "=&r" as a 'workaround' | |
339 | */ | |
340 | asm volatile("mov.l 1f, %0\n\t" | |
341 | "add %1, %0\n\t" | |
342 | "jmp @%0\n\t" | |
343 | "nop\n\t" | |
344 | ".balign 4\n\t" | |
345 | "1: .long 2f\n\t" | |
346 | "2:\n" : "=&r" (temp_pc) : "r" (exec_offset)); | |
347 | ||
348 | /* | |
349 | * We know there will be >=1 iteration, so write as do-while to avoid | |
350 | * pointless nead-of-loop check for 0 iterations. | |
351 | */ | |
352 | do { | |
353 | ea = base_addr + PAGE_SIZE; | |
354 | a = base_addr; | |
355 | p = phys; | |
356 | ||
357 | do { | |
358 | *(volatile unsigned long *)a = p; | |
359 | /* | |
360 | * Next line: intentionally not p+32, saves an add, p | |
361 | * will do since only the cache tag bits need to | |
362 | * match. | |
363 | */ | |
364 | *(volatile unsigned long *)(a+32) = p; | |
365 | a += 64; | |
366 | p += 64; | |
367 | } while (a < ea); | |
368 | ||
369 | base_addr += way_incr; | |
370 | } while (--way_count != 0); | |
371 | } | |
372 | ||
37443ef3 PM |
373 | extern void __weak sh4__flush_region_init(void); |
374 | ||
375 | /* | |
376 | * SH-4 has virtually indexed and physically tagged cache. | |
377 | */ | |
378 | void __init sh4_cache_init(void) | |
379 | { | |
380 | printk("PVR=%08x CVR=%08x PRR=%08x\n", | |
9d56dd3b PM |
381 | __raw_readl(CCN_PVR), |
382 | __raw_readl(CCN_CVR), | |
383 | __raw_readl(CCN_PRR)); | |
37443ef3 | 384 | |
f26b2a56 PM |
385 | local_flush_icache_range = sh4_flush_icache_range; |
386 | local_flush_dcache_page = sh4_flush_dcache_page; | |
387 | local_flush_cache_all = sh4_flush_cache_all; | |
388 | local_flush_cache_mm = sh4_flush_cache_mm; | |
389 | local_flush_cache_dup_mm = sh4_flush_cache_mm; | |
390 | local_flush_cache_page = sh4_flush_cache_page; | |
391 | local_flush_cache_range = sh4_flush_cache_range; | |
37443ef3 PM |
392 | |
393 | sh4__flush_region_init(); | |
394 | } |