2 * This file is subject to the terms and conditions of the GNU General Public
3 * License. See the file "COPYING" in the main directory of this archive
6 * Copyright (C) 1999-2006 Helge Deller <deller@gmx.de> (07-13-1999)
7 * Copyright (C) 1999 SuSE GmbH Nuernberg
8 * Copyright (C) 2000 Philipp Rumpf (prumpf@tux.org)
10 * Cache and TLB management
14 #include <linux/init.h>
15 #include <linux/kernel.h>
17 #include <linux/module.h>
18 #include <linux/seq_file.h>
19 #include <linux/pagemap.h>
20 #include <linux/sched.h>
21 #include <linux/sched/mm.h>
23 #include <asm/cache.h>
24 #include <asm/cacheflush.h>
25 #include <asm/tlbflush.h>
27 #include <asm/pgalloc.h>
28 #include <asm/processor.h>
29 #include <asm/sections.h>
30 #include <asm/shmparam.h>
32 int split_tlb __read_mostly
;
33 int dcache_stride __read_mostly
;
34 int icache_stride __read_mostly
;
35 EXPORT_SYMBOL(dcache_stride
);
/*
 * Per-page flush helpers taking the page's physical address and the virtual
 * address it is flushed through.  Their bodies are not part of this file
 * (presumably assembly, going by the _asm suffix -- confirm).
 */
void flush_dcache_page_asm(unsigned long phys_addr, unsigned long vaddr);
EXPORT_SYMBOL(flush_dcache_page_asm);
void flush_icache_page_asm(unsigned long phys_addr, unsigned long vaddr);
/*
 * On some machines (e.g. ones with the Merced bus), there can be
 * only a single PxTLB broadcast at a time; this must be guaranteed
 * by software.  We put a spinlock around all TLB flushes to
 * ensure this.
 */
DEFINE_SPINLOCK(pa_tlb_lock);
49 struct pdc_cache_info cache_info __read_mostly
;
51 static struct pdc_btlb_info btlb_info __read_mostly
;
56 flush_data_cache(void)
58 on_each_cpu(flush_data_cache_local
, NULL
, 1);
61 flush_instruction_cache(void)
63 on_each_cpu(flush_instruction_cache_local
, NULL
, 1);
68 flush_cache_all_local(void)
70 flush_instruction_cache_local(NULL
);
71 flush_data_cache_local(NULL
);
73 EXPORT_SYMBOL(flush_cache_all_local
);
/* Virtual address of page frame number @pfn, i.e. __va() of its PFN_PHYS(). */
#define pfn_va(pfn) __va(PFN_PHYS(pfn))
79 update_mmu_cache(struct vm_area_struct
*vma
, unsigned long address
, pte_t
*ptep
)
81 unsigned long pfn
= pte_pfn(*ptep
);
84 /* We don't have pte special. As a result, we can be called with
85 an invalid pfn and we don't need to flush the kernel dcache page.
86 This occurs with FireGL card in C8000. */
90 page
= pfn_to_page(pfn
);
91 if (page_mapping(page
) && test_bit(PG_dcache_dirty
, &page
->flags
)) {
92 flush_kernel_dcache_page_addr(pfn_va(pfn
));
93 clear_bit(PG_dcache_dirty
, &page
->flags
);
94 } else if (parisc_requires_coherency())
95 flush_kernel_dcache_page_addr(pfn_va(pfn
));
99 show_cache_info(struct seq_file
*m
)
103 seq_printf(m
, "I-cache\t\t: %ld KB\n",
104 cache_info
.ic_size
/1024 );
105 if (cache_info
.dc_loop
!= 1)
106 snprintf(buf
, 32, "%lu-way associative", cache_info
.dc_loop
);
107 seq_printf(m
, "D-cache\t\t: %ld KB (%s%s, %s)\n",
108 cache_info
.dc_size
/1024,
109 (cache_info
.dc_conf
.cc_wt
? "WT":"WB"),
110 (cache_info
.dc_conf
.cc_sh
? ", shared I/D":""),
111 ((cache_info
.dc_loop
== 1) ? "direct mapped" : buf
));
112 seq_printf(m
, "ITLB entries\t: %ld\n" "DTLB entries\t: %ld%s\n",
115 cache_info
.dt_conf
.tc_sh
? " - shared with ITLB":""
119 /* BTLB - Block TLB */
120 if (btlb_info
.max_size
==0) {
121 seq_printf(m
, "BTLB\t\t: not supported\n" );
124 "BTLB fixed\t: max. %d pages, pagesize=%d (%dMB)\n"
125 "BTLB fix-entr.\t: %d instruction, %d data (%d combined)\n"
126 "BTLB var-entr.\t: %d instruction, %d data (%d combined)\n",
127 btlb_info
.max_size
, (int)4096,
128 btlb_info
.max_size
>>8,
129 btlb_info
.fixed_range_info
.num_i
,
130 btlb_info
.fixed_range_info
.num_d
,
131 btlb_info
.fixed_range_info
.num_comb
,
132 btlb_info
.variable_range_info
.num_i
,
133 btlb_info
.variable_range_info
.num_d
,
134 btlb_info
.variable_range_info
.num_comb
141 parisc_cache_init(void)
143 if (pdc_cache_info(&cache_info
) < 0)
144 panic("parisc_cache_init: pdc_cache_info failed");
147 printk("ic_size %lx dc_size %lx it_size %lx\n",
152 printk("DC base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx\n",
154 cache_info
.dc_stride
,
158 printk("dc_conf = 0x%lx alias %d blk %d line %d shift %d\n",
159 *(unsigned long *) (&cache_info
.dc_conf
),
160 cache_info
.dc_conf
.cc_alias
,
161 cache_info
.dc_conf
.cc_block
,
162 cache_info
.dc_conf
.cc_line
,
163 cache_info
.dc_conf
.cc_shift
);
164 printk(" wt %d sh %d cst %d hv %d\n",
165 cache_info
.dc_conf
.cc_wt
,
166 cache_info
.dc_conf
.cc_sh
,
167 cache_info
.dc_conf
.cc_cst
,
168 cache_info
.dc_conf
.cc_hv
);
170 printk("IC base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx\n",
172 cache_info
.ic_stride
,
176 printk("IT base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx off_base 0x%lx off_stride 0x%lx off_count 0x%lx\n",
177 cache_info
.it_sp_base
,
178 cache_info
.it_sp_stride
,
179 cache_info
.it_sp_count
,
181 cache_info
.it_off_base
,
182 cache_info
.it_off_stride
,
183 cache_info
.it_off_count
);
185 printk("DT base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx off_base 0x%lx off_stride 0x%lx off_count 0x%lx\n",
186 cache_info
.dt_sp_base
,
187 cache_info
.dt_sp_stride
,
188 cache_info
.dt_sp_count
,
190 cache_info
.dt_off_base
,
191 cache_info
.dt_off_stride
,
192 cache_info
.dt_off_count
);
194 printk("ic_conf = 0x%lx alias %d blk %d line %d shift %d\n",
195 *(unsigned long *) (&cache_info
.ic_conf
),
196 cache_info
.ic_conf
.cc_alias
,
197 cache_info
.ic_conf
.cc_block
,
198 cache_info
.ic_conf
.cc_line
,
199 cache_info
.ic_conf
.cc_shift
);
200 printk(" wt %d sh %d cst %d hv %d\n",
201 cache_info
.ic_conf
.cc_wt
,
202 cache_info
.ic_conf
.cc_sh
,
203 cache_info
.ic_conf
.cc_cst
,
204 cache_info
.ic_conf
.cc_hv
);
206 printk("D-TLB conf: sh %d page %d cst %d aid %d sr %d\n",
207 cache_info
.dt_conf
.tc_sh
,
208 cache_info
.dt_conf
.tc_page
,
209 cache_info
.dt_conf
.tc_cst
,
210 cache_info
.dt_conf
.tc_aid
,
211 cache_info
.dt_conf
.tc_sr
);
213 printk("I-TLB conf: sh %d page %d cst %d aid %d sr %d\n",
214 cache_info
.it_conf
.tc_sh
,
215 cache_info
.it_conf
.tc_page
,
216 cache_info
.it_conf
.tc_cst
,
217 cache_info
.it_conf
.tc_aid
,
218 cache_info
.it_conf
.tc_sr
);
222 if (cache_info
.dt_conf
.tc_sh
== 0 || cache_info
.dt_conf
.tc_sh
== 2) {
223 if (cache_info
.dt_conf
.tc_sh
== 2)
224 printk(KERN_WARNING
"Unexpected TLB configuration. "
225 "Will flush I/D separately (could be optimized).\n");
/* "New and Improved" version from Jim Hull
 *	(1 << (cc_block-1)) * (cc_line << (4 + cnf.cc_shift))
 * The following CAFL_STRIDE is an optimized version, see
 * http://lists.parisc-linux.org/pipermail/parisc-linux/2004-June/023625.html
 * http://lists.parisc-linux.org/pipermail/parisc-linux/2004-June/023671.html
 *
 * @cnf is an expression yielding a cache configuration with cc_line,
 * cc_block and cc_shift members.  It is parenthesized at every use so
 * that arguments such as *ptr expand correctly.  It is evaluated three
 * times, so it must be free of side effects.
 */
#define CAFL_STRIDE(cnf) ((cnf).cc_line << (3 + (cnf).cc_block + (cnf).cc_shift))
237 dcache_stride
= CAFL_STRIDE(cache_info
.dc_conf
);
238 icache_stride
= CAFL_STRIDE(cache_info
.ic_conf
);
242 if (pdc_btlb_info(&btlb_info
) < 0) {
243 memset(&btlb_info
, 0, sizeof btlb_info
);
247 if ((boot_cpu_data
.pdc
.capabilities
& PDC_MODEL_NVA_MASK
) ==
248 PDC_MODEL_NVA_UNSUPPORTED
) {
249 printk(KERN_WARNING
"parisc_cache_init: Only equivalent aliasing supported!\n");
251 panic("SMP kernel required to avoid non-equivalent aliasing");
256 void disable_sr_hashing(void)
258 int srhash_type
, retval
;
259 unsigned long space_bits
;
261 switch (boot_cpu_data
.cpu_type
) {
262 case pcx
: /* We shouldn't get this far. setup.c should prevent it. */
269 srhash_type
= SRHASH_PCXST
;
273 srhash_type
= SRHASH_PCXL
;
276 case pcxl2
: /* pcxl2 doesn't support space register hashing */
279 default: /* Currently all PA2.0 machines use the same ins. sequence */
280 srhash_type
= SRHASH_PA20
;
284 disable_sr_hashing_asm(srhash_type
);
286 retval
= pdc_spaceid_bits(&space_bits
);
287 /* If this procedure isn't implemented, don't panic. */
288 if (retval
< 0 && retval
!= PDC_BAD_OPTION
)
289 panic("pdc_spaceid_bits call failed.\n");
291 panic("SpaceID hashing is still on!\n");
295 __flush_cache_page(struct vm_area_struct
*vma
, unsigned long vmaddr
,
296 unsigned long physaddr
)
299 flush_dcache_page_asm(physaddr
, vmaddr
);
300 if (vma
->vm_flags
& VM_EXEC
)
301 flush_icache_page_asm(physaddr
, vmaddr
);
305 void flush_dcache_page(struct page
*page
)
307 struct address_space
*mapping
= page_mapping(page
);
308 struct vm_area_struct
*mpnt
;
309 unsigned long offset
;
310 unsigned long addr
, old_addr
= 0;
313 if (mapping
&& !mapping_mapped(mapping
)) {
314 set_bit(PG_dcache_dirty
, &page
->flags
);
318 flush_kernel_dcache_page(page
);
325 /* We have carefully arranged in arch_get_unmapped_area() that
326 * *any* mappings of a file are always congruently mapped (whether
327 * declared as MAP_PRIVATE or MAP_SHARED), so we only need
328 * to flush one address here for them all to become coherent */
330 flush_dcache_mmap_lock(mapping
);
331 vma_interval_tree_foreach(mpnt
, &mapping
->i_mmap
, pgoff
, pgoff
) {
332 offset
= (pgoff
- mpnt
->vm_pgoff
) << PAGE_SHIFT
;
333 addr
= mpnt
->vm_start
+ offset
;
/* The TLB is the engine of coherence on parisc: The
 * CPU is entitled to speculate any page with a TLB
 * mapping, so here we kill the mapping then flush the
 * page along a special flush-only alias mapping.
 * This guarantees that the page is no longer in the
 * cache for any process, nor may it be
 * speculatively read in (until the user or kernel
 * specifically accesses it, of course) */
344 flush_tlb_page(mpnt
, addr
);
345 if (old_addr
== 0 || (old_addr
& (SHM_COLOUR
- 1))
346 != (addr
& (SHM_COLOUR
- 1))) {
347 __flush_cache_page(mpnt
, addr
, page_to_phys(page
));
349 printk(KERN_ERR
"INEQUIVALENT ALIASES 0x%lx and 0x%lx in file %pD\n", old_addr
, addr
, mpnt
->vm_file
);
353 flush_dcache_mmap_unlock(mapping
);
355 EXPORT_SYMBOL(flush_dcache_page
);
/* Defined in arch/parisc/kernel/pacache.S */
EXPORT_SYMBOL(flush_kernel_dcache_range_asm);
EXPORT_SYMBOL(flush_kernel_dcache_page_asm);
EXPORT_SYMBOL(flush_data_cache_local);
EXPORT_SYMBOL(flush_kernel_icache_range_asm);
363 #define FLUSH_THRESHOLD 0x80000 /* 0.5MB */
364 static unsigned long parisc_cache_flush_threshold __read_mostly
= FLUSH_THRESHOLD
;
366 #define FLUSH_TLB_THRESHOLD (2*1024*1024) /* 2MB initial TLB threshold */
367 static unsigned long parisc_tlb_flush_threshold __read_mostly
= FLUSH_TLB_THRESHOLD
;
369 void __init
parisc_setup_cache_timing(void)
371 unsigned long rangetime
, alltime
;
372 unsigned long size
, start
;
373 unsigned long threshold
;
377 alltime
= mfctl(16) - alltime
;
379 size
= (unsigned long)(_end
- _text
);
380 rangetime
= mfctl(16);
381 flush_kernel_dcache_range((unsigned long)_text
, size
);
382 rangetime
= mfctl(16) - rangetime
;
384 printk(KERN_DEBUG
"Whole cache flush %lu cycles, flushing %lu bytes %lu cycles\n",
385 alltime
, size
, rangetime
);
387 threshold
= L1_CACHE_ALIGN(size
* alltime
/ rangetime
);
388 if (threshold
> cache_info
.dc_size
)
389 threshold
= cache_info
.dc_size
;
391 parisc_cache_flush_threshold
= threshold
;
392 printk(KERN_INFO
"Cache flush threshold set to %lu KiB\n",
393 parisc_cache_flush_threshold
/1024);
395 /* calculate TLB flush threshold */
397 /* On SMP machines, skip the TLB measure of kernel text which
398 * has been mapped as huge pages. */
399 if (num_online_cpus() > 1 && !parisc_requires_coherency()) {
400 threshold
= max(cache_info
.it_size
, cache_info
.dt_size
);
401 threshold
*= PAGE_SIZE
;
402 threshold
/= num_online_cpus();
403 goto set_tlb_threshold
;
408 alltime
= mfctl(16) - alltime
;
411 start
= (unsigned long) _text
;
412 rangetime
= mfctl(16);
413 while (start
< (unsigned long) _end
) {
414 flush_tlb_kernel_range(start
, start
+ PAGE_SIZE
);
418 rangetime
= mfctl(16) - rangetime
;
420 printk(KERN_DEBUG
"Whole TLB flush %lu cycles, flushing %lu bytes %lu cycles\n",
421 alltime
, size
, rangetime
);
423 threshold
= PAGE_ALIGN(num_online_cpus() * size
* alltime
/ rangetime
);
427 parisc_tlb_flush_threshold
= threshold
;
428 printk(KERN_INFO
"TLB flush threshold set to %lu KiB\n",
429 parisc_tlb_flush_threshold
/1024);
/*
 * Low-level page helpers implemented outside this file (presumably in
 * assembly, going by the _asm suffix -- confirm).
 */
void purge_kernel_dcache_page_asm(unsigned long);
void clear_user_page_asm(void *, unsigned long);
void copy_user_page_asm(void *, void *, unsigned long);
436 void flush_kernel_dcache_page_addr(void *addr
)
440 flush_kernel_dcache_page_asm(addr
);
441 purge_tlb_start(flags
);
443 purge_tlb_end(flags
);
445 EXPORT_SYMBOL(flush_kernel_dcache_page_addr
);
447 void copy_user_page(void *vto
, void *vfrom
, unsigned long vaddr
,
450 /* Copy using kernel mapping. No coherency is needed (all in
451 kunmap) for the `to' page. However, the `from' page needs to
452 be flushed through a mapping equivalent to the user mapping
453 before it can be accessed through the kernel mapping. */
455 flush_dcache_page_asm(__pa(vfrom
), vaddr
);
456 copy_page_asm(vto
, vfrom
);
459 EXPORT_SYMBOL(copy_user_page
);
461 /* __flush_tlb_range()
463 * returns 1 if all TLBs were flushed.
465 int __flush_tlb_range(unsigned long sid
, unsigned long start
,
468 unsigned long flags
, size
;
470 size
= (end
- start
);
471 if (size
>= parisc_tlb_flush_threshold
) {
476 /* Purge TLB entries for small ranges using the pdtlb and
477 pitlb instructions. These instructions execute locally
478 but cause a purge request to be broadcast to other TLBs. */
479 if (likely(!split_tlb
)) {
480 while (start
< end
) {
481 purge_tlb_start(flags
);
484 purge_tlb_end(flags
);
491 while (start
< end
) {
492 purge_tlb_start(flags
);
496 purge_tlb_end(flags
);
/*
 * on_each_cpu() callback used by flush_cache_all(): flushes the caches of
 * the CPU it runs on.  @dummy is ignored.
 */
static void cacheflush_h_tmp_function(void *dummy)
{
	flush_cache_all_local();
}
507 void flush_cache_all(void)
509 on_each_cpu(cacheflush_h_tmp_function
, NULL
, 1);
512 static inline unsigned long mm_total_size(struct mm_struct
*mm
)
514 struct vm_area_struct
*vma
;
515 unsigned long usize
= 0;
517 for (vma
= mm
->mmap
; vma
; vma
= vma
->vm_next
)
518 usize
+= vma
->vm_end
- vma
->vm_start
;
522 static inline pte_t
*get_ptep(pgd_t
*pgd
, unsigned long addr
)
526 if (!pgd_none(*pgd
)) {
527 pud_t
*pud
= pud_offset(pgd
, addr
);
528 if (!pud_none(*pud
)) {
529 pmd_t
*pmd
= pmd_offset(pud
, addr
);
531 ptep
= pte_offset_map(pmd
, addr
);
537 void flush_cache_mm(struct mm_struct
*mm
)
539 struct vm_area_struct
*vma
;
542 /* Flush the TLB to avoid speculation if coherency is required. */
543 if (parisc_requires_coherency())
546 /* Flushing the whole cache on each cpu takes forever on
547 rp3440, etc. So, avoid it if the mm isn't too big. */
548 if (mm_total_size(mm
) >= parisc_cache_flush_threshold
) {
553 if (mm
->context
== mfsp(3)) {
554 for (vma
= mm
->mmap
; vma
; vma
= vma
->vm_next
) {
555 flush_user_dcache_range_asm(vma
->vm_start
, vma
->vm_end
);
556 if ((vma
->vm_flags
& VM_EXEC
) == 0)
558 flush_user_icache_range_asm(vma
->vm_start
, vma
->vm_end
);
564 for (vma
= mm
->mmap
; vma
; vma
= vma
->vm_next
) {
567 for (addr
= vma
->vm_start
; addr
< vma
->vm_end
;
570 pte_t
*ptep
= get_ptep(pgd
, addr
);
573 pfn
= pte_pfn(*ptep
);
576 __flush_cache_page(vma
, addr
, PFN_PHYS(pfn
));
581 void flush_cache_range(struct vm_area_struct
*vma
,
582 unsigned long start
, unsigned long end
)
584 BUG_ON(!vma
->vm_mm
->context
);
586 /* Flush the TLB to avoid speculation if coherency is required. */
587 if (parisc_requires_coherency())
588 flush_tlb_range(vma
, start
, end
);
590 if ((end
- start
) >= parisc_cache_flush_threshold
591 || vma
->vm_mm
->context
!= mfsp(3)) {
596 flush_user_dcache_range_asm(start
, end
);
597 if (vma
->vm_flags
& VM_EXEC
)
598 flush_user_icache_range_asm(start
, end
);
602 flush_cache_page(struct vm_area_struct
*vma
, unsigned long vmaddr
, unsigned long pfn
)
604 BUG_ON(!vma
->vm_mm
->context
);
606 if (pfn_valid(pfn
)) {
607 if (parisc_requires_coherency())
608 flush_tlb_page(vma
, vmaddr
);
609 __flush_cache_page(vma
, vmaddr
, PFN_PHYS(pfn
));
613 void flush_kernel_vmap_range(void *vaddr
, int size
)
615 unsigned long start
= (unsigned long)vaddr
;
617 if ((unsigned long)size
> parisc_cache_flush_threshold
)
620 flush_kernel_dcache_range_asm(start
, start
+ size
);
622 EXPORT_SYMBOL(flush_kernel_vmap_range
);
624 void invalidate_kernel_vmap_range(void *vaddr
, int size
)
626 unsigned long start
= (unsigned long)vaddr
;
628 if ((unsigned long)size
> parisc_cache_flush_threshold
)
631 flush_kernel_dcache_range_asm(start
, start
+ size
);
633 EXPORT_SYMBOL(invalidate_kernel_vmap_range
);