/*
 * arch/arm/mm/cache-feroceon-l2.c - Feroceon L2 cache controller support
 *
 * Copyright (C) 2008 Marvell Semiconductor
 *
 * This file is licensed under the terms of the GNU General Public
 * License version 2. This program is licensed "as is" without any
 * warranty of any kind, whether express or implied.
 *
 * References:
 * - Unified Layer 2 Cache for Feroceon CPU Cores,
 *   Document ID MV-S104858-00, Rev. A, October 23 2007.
 */

#include <linux/init.h>
#include <asm/cacheflush.h>
#include <asm/kmap_types.h>
#include <asm/fixmap.h>
#include <asm/pgtable.h>
#include <asm/tlbflush.h>
#include <plat/cache-feroceon-l2.h>
#include "mm.h"

/*
 * Low-level cache maintenance operations.
 *
 * As well as the regular 'clean/invalidate/flush L2 cache line by
 * MVA' instructions, the Feroceon L2 cache controller also features
 * 'clean/invalidate L2 range by MVA' operations.
 *
 * Cache range operations are initiated by writing the start and
 * end addresses to successive cp15 registers, and process every
 * cache line whose first byte address lies in the inclusive range
 * [start:end].
 *
 * The cache range operations stall the CPU pipeline until completion.
 *
 * The range operations require two successive cp15 writes, in
 * between which we don't want to be preempted.
 */

static inline unsigned long l2_start_va(unsigned long paddr)
{
#ifdef CONFIG_HIGHMEM
	/*
	 * Let's do our own fixmap stuff in a minimal way here.
	 * Because range ops can't be done on physical addresses,
	 * we simply install a temporary virtual mapping so that the
	 * TLB lookup performed by the range operation can succeed.
	 * The mapping is never actually accessed, hence there is no
	 * need to flush the untouched memory mapping. This is
	 * protected by the caller disabling interrupts.
	 */
	unsigned long idx = KM_L2_CACHE + KM_TYPE_NR * smp_processor_id();
	unsigned long vaddr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
	set_pte_ext(TOP_PTE(vaddr), pfn_pte(paddr >> PAGE_SHIFT, PAGE_KERNEL), 0);
	local_flush_tlb_kernel_page(vaddr);
	return vaddr + (paddr & ~PAGE_MASK);
#else
	return __phys_to_virt(paddr);
#endif
}

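/*
 * Single cache line maintenance helpers: callers hand these a physical
 * address directly. The range operations below, by contrast, perform a
 * TLB lookup on the start address and therefore operate on virtual
 * addresses set up by l2_start_va().
 */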
static inline void l2_clean_pa(unsigned long addr)
{
	__asm__("mcr p15, 1, %0, c15, c9, 3" : : "r" (addr));
}

static inline void l2_clean_pa_range(unsigned long start, unsigned long end)
{
	unsigned long va_start, va_end, flags;

	/*
	 * Make sure 'start' and 'end' reference the same page, as
	 * L2 is PIPT and range operations only do a TLB lookup on
	 * the start address.
	 */
	BUG_ON((start ^ end) >> PAGE_SHIFT);

	raw_local_irq_save(flags);
	va_start = l2_start_va(start);
	va_end = va_start + (end - start);
	__asm__("mcr p15, 1, %0, c15, c9, 4\n\t"
		"mcr p15, 1, %1, c15, c9, 5"
		: : "r" (va_start), "r" (va_end));
	raw_local_irq_restore(flags);
}

static inline void l2_clean_inv_pa(unsigned long addr)
{
	__asm__("mcr p15, 1, %0, c15, c10, 3" : : "r" (addr));
}

static inline void l2_inv_pa(unsigned long addr)
{
	__asm__("mcr p15, 1, %0, c15, c11, 3" : : "r" (addr));
}

static inline void l2_inv_pa_range(unsigned long start, unsigned long end)
{
	unsigned long va_start, va_end, flags;

	/*
	 * Make sure 'start' and 'end' reference the same page, as
	 * L2 is PIPT and range operations only do a TLB lookup on
	 * the start address.
	 */
	BUG_ON((start ^ end) >> PAGE_SHIFT);

	raw_local_irq_save(flags);
	va_start = l2_start_va(start);
	va_end = va_start + (end - start);
	__asm__("mcr p15, 1, %0, c15, c11, 4\n\t"
		"mcr p15, 1, %1, c15, c11, 5"
		: : "r" (va_start), "r" (va_end));
	raw_local_irq_restore(flags);
}


/*
 * Linux primitives.
 *
 * Note that the end addresses passed to Linux primitives are
 * noninclusive, while the hardware cache range operations use
 * inclusive start and end addresses.
 */
#define CACHE_LINE_SIZE		32
#define MAX_RANGE_SIZE		1024

static int l2_wt_override;

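/*
 * Given a cache-line-aligned [start, end) interval, return the end of
 * the largest chunk starting at 'start' that a single hardware range
 * operation may cover: at most MAX_RANGE_SIZE bytes, and never
 * crossing a page boundary.
 */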
static unsigned long calc_range_end(unsigned long start, unsigned long end)
{
	unsigned long range_end;

	BUG_ON(start & (CACHE_LINE_SIZE - 1));
	BUG_ON(end & (CACHE_LINE_SIZE - 1));

	/*
	 * Try to process all cache lines between 'start' and 'end'.
	 */
	range_end = end;

	/*
	 * Limit the number of cache lines processed at once,
	 * since cache range operations stall the CPU pipeline
	 * until completion.
	 */
	if (range_end > start + MAX_RANGE_SIZE)
		range_end = start + MAX_RANGE_SIZE;

	/*
	 * Cache range operations can't straddle a page boundary.
	 */
	if (range_end > (start | (PAGE_SIZE - 1)) + 1)
		range_end = (start | (PAGE_SIZE - 1)) + 1;

	return range_end;
}

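/*
 * Partial cache lines at either end of the range are cleaned and
 * invalidated (rather than just invalidated), so that dirty data
 * outside the requested range is written back instead of discarded.
 */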
static void feroceon_l2_inv_range(unsigned long start, unsigned long end)
{
	/*
	 * Clean and invalidate partial first cache line.
	 */
	if (start & (CACHE_LINE_SIZE - 1)) {
		l2_clean_inv_pa(start & ~(CACHE_LINE_SIZE - 1));
		start = (start | (CACHE_LINE_SIZE - 1)) + 1;
	}

	/*
	 * Clean and invalidate partial last cache line.
	 */
	if (start < end && end & (CACHE_LINE_SIZE - 1)) {
		l2_clean_inv_pa(end & ~(CACHE_LINE_SIZE - 1));
		end &= ~(CACHE_LINE_SIZE - 1);
	}

	/*
	 * Invalidate all full cache lines between 'start' and 'end'.
	 */
	while (start < end) {
		unsigned long range_end = calc_range_end(start, end);
		l2_inv_pa_range(start, range_end - CACHE_LINE_SIZE);
		start = range_end;
	}

	dsb();
}

static void feroceon_l2_clean_range(unsigned long start, unsigned long end)
{
	/*
	 * If L2 is forced to WT, the L2 will always be clean and we
	 * don't need to do anything here.
	 */
	if (!l2_wt_override) {
		start &= ~(CACHE_LINE_SIZE - 1);
		end = (end + CACHE_LINE_SIZE - 1) & ~(CACHE_LINE_SIZE - 1);
		while (start != end) {
			unsigned long range_end = calc_range_end(start, end);
			l2_clean_pa_range(start, range_end - CACHE_LINE_SIZE);
			start = range_end;
		}
	}

	dsb();
}

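/*
 * Flush (clean + invalidate) a range. The clean pass is skipped in WT
 * override mode, since the L2 then never holds dirty data.
 */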
static void feroceon_l2_flush_range(unsigned long start, unsigned long end)
{
	start &= ~(CACHE_LINE_SIZE - 1);
	end = (end + CACHE_LINE_SIZE - 1) & ~(CACHE_LINE_SIZE - 1);
	while (start != end) {
		unsigned long range_end = calc_range_end(start, end);
		if (!l2_wt_override)
			l2_clean_pa_range(start, range_end - CACHE_LINE_SIZE);
		l2_inv_pa_range(start, range_end - CACHE_LINE_SIZE);
		start = range_end;
	}

	dsb();
}


/*
 * Routines to disable and re-enable the D-cache and I-cache at run
 * time. These are necessary because the L2 cache can only be enabled
 * or disabled while the L1 Dcache and Icache are both disabled.
 */
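/*
 * Returns 1 if the D-cache was enabled (and has now been flushed and
 * disabled), so that the caller knows whether to re-enable it later.
 */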
static int __init flush_and_disable_dcache(void)
{
	u32 cr;

	cr = get_cr();
	if (cr & CR_C) {
		unsigned long flags;

		raw_local_irq_save(flags);
		flush_cache_all();
		set_cr(cr & ~CR_C);
		raw_local_irq_restore(flags);
		return 1;
	}
	return 0;
}

static void __init enable_dcache(void)
{
	u32 cr;

	cr = get_cr();
	set_cr(cr | CR_C);
}

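/*
 * Invalidate the entire I-cache (cp15 c7, c5, 0).
 */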
static void __init __invalidate_icache(void)
{
	__asm__("mcr p15, 0, %0, c7, c5, 0" : : "r" (0));
}

static int __init invalidate_and_disable_icache(void)
{
	u32 cr;

	cr = get_cr();
	if (cr & CR_I) {
		set_cr(cr & ~CR_I);
		__invalidate_icache();
		return 1;
	}
	return 0;
}

static void __init enable_icache(void)
{
	u32 cr;

	cr = get_cr();
	set_cr(cr | CR_I);
}

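/*
 * Accessors for the CPU Extra Features register (an implementation-
 * specific cp15 register: op1=1, c15, c1, 0), which holds the L2
 * enable and L2 prefetch disable control bits used below.
 */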
static inline u32 read_extra_features(void)
{
	u32 u;

	__asm__("mrc p15, 1, %0, c15, c1, 0" : "=r" (u));

	return u;
}

static inline void write_extra_features(u32 u)
{
	__asm__("mcr p15, 1, %0, c15, c1, 0" : : "r" (u));
}

static void __init disable_l2_prefetch(void)
{
	u32 u;

	/*
	 * Read the CPU Extra Features register and set the 'Disable
	 * L2 Prefetch' bit if it isn't set already.
	 */
	u = read_extra_features();
	if (!(u & 0x01000000)) {
		printk(KERN_INFO "Feroceon L2: Disabling L2 prefetch.\n");
		write_extra_features(u | 0x01000000);
	}
}

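/*
 * Bit 22 (0x00400000) of the Extra Features register is used here as
 * the L2 enable bit. The L1 caches are disabled around the write, as
 * required (see the comment above flush_and_disable_dcache()), and
 * restored to their previous state afterwards.
 */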
static void __init enable_l2(void)
{
	u32 u;

	u = read_extra_features();
	if (!(u & 0x00400000)) {
		int i, d;

		printk(KERN_INFO "Feroceon L2: Enabling L2\n");

		d = flush_and_disable_dcache();
		i = invalidate_and_disable_icache();
		write_extra_features(u | 0x00400000);
		if (i)
			enable_icache();
		if (d)
			enable_dcache();
	}
}

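/*
 * Entry point: record the WT override setting, disable L2 prefetch,
 * hook the Feroceon range operations into the generic outer_cache
 * interface, and finally turn the L2 cache on.
 */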
void __init feroceon_l2_init(int __l2_wt_override)
{
	l2_wt_override = __l2_wt_override;

	disable_l2_prefetch();

	outer_cache.inv_range = feroceon_l2_inv_range;
	outer_cache.clean_range = feroceon_l2_clean_range;
	outer_cache.flush_range = feroceon_l2_flush_range;

	enable_l2();

	printk(KERN_INFO "Feroceon L2: Cache support initialised%s.\n",
	       l2_wt_override ? ", in WT override mode" : "");
}