/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License. See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * Copyright (C) 1999-2006 Helge Deller <deller@gmx.de> (07-13-1999)
 * Copyright (C) 1999 SuSE GmbH Nuernberg
 * Copyright (C) 2000 Philipp Rumpf (prumpf@tux.org)
 *
 * Cache and TLB management
 *
 */

#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/module.h>
#include <linux/seq_file.h>
#include <linux/pagemap.h>
#include <linux/sched.h>
#include <linux/sched/mm.h>
#include <asm/pdc.h>
#include <asm/cache.h>
#include <asm/cacheflush.h>
#include <asm/tlbflush.h>
#include <asm/page.h>
#include <asm/processor.h>
#include <asm/sections.h>
#include <asm/shmparam.h>

int split_tlb __ro_after_init;
int dcache_stride __ro_after_init;
int icache_stride __ro_after_init;
EXPORT_SYMBOL(dcache_stride);

void flush_dcache_page_asm(unsigned long phys_addr, unsigned long vaddr);
EXPORT_SYMBOL(flush_dcache_page_asm);
void purge_dcache_page_asm(unsigned long phys_addr, unsigned long vaddr);
void flush_icache_page_asm(unsigned long phys_addr, unsigned long vaddr);


/* On some machines (e.g., ones with the Merced bus), there can be
 * only a single PxTLB broadcast at a time; this must be guaranteed
 * by software. We need a spinlock around all TLB flushes to ensure
 * this.
 */
DEFINE_SPINLOCK(pa_tlb_flush_lock);

/* Swapper page setup lock. */
DEFINE_SPINLOCK(pa_swapper_pg_lock);

#if defined(CONFIG_64BIT) && defined(CONFIG_SMP)
int pa_serialize_tlb_flushes __ro_after_init;
#endif

struct pdc_cache_info cache_info __ro_after_init;
#ifndef CONFIG_PA20
static struct pdc_btlb_info btlb_info __ro_after_init;
#endif

#ifdef CONFIG_SMP
void
flush_data_cache(void)
{
	on_each_cpu(flush_data_cache_local, NULL, 1);
}
void
flush_instruction_cache(void)
{
	on_each_cpu(flush_instruction_cache_local, NULL, 1);
}
#endif

void
flush_cache_all_local(void)
{
	flush_instruction_cache_local(NULL);
	flush_data_cache_local(NULL);
}
EXPORT_SYMBOL(flush_cache_all_local);

/* Virtual address of pfn. */
#define pfn_va(pfn)	__va(PFN_PHYS(pfn))

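/*
 * Called by the generic MM code when a PTE is installed or updated.
 * If the page was written through its kernel mapping (PG_dcache_dirty
 * set by flush_dcache_page() below), the kernel-space alias must be
 * flushed before a user mapping can observe coherent data.
 */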
void
update_mmu_cache(struct vm_area_struct *vma, unsigned long address, pte_t *ptep)
{
	unsigned long pfn = pte_pfn(*ptep);
	struct page *page;

	/* We don't have pte special. As a result, we can be called with
	   an invalid pfn and we don't need to flush the kernel dcache page.
	   This occurs with FireGL card in C8000. */
	if (!pfn_valid(pfn))
		return;

	page = pfn_to_page(pfn);
	if (page_mapping_file(page) &&
	    test_bit(PG_dcache_dirty, &page->flags)) {
		flush_kernel_dcache_page_addr(pfn_va(pfn));
		clear_bit(PG_dcache_dirty, &page->flags);
	} else if (parisc_requires_coherency())
		flush_kernel_dcache_page_addr(pfn_va(pfn));
}

void
show_cache_info(struct seq_file *m)
{
	char buf[32];

	seq_printf(m, "I-cache\t\t: %ld KB\n",
		cache_info.ic_size/1024 );
	if (cache_info.dc_loop != 1)
		snprintf(buf, 32, "%lu-way associative", cache_info.dc_loop);
	seq_printf(m, "D-cache\t\t: %ld KB (%s%s, %s)\n",
		cache_info.dc_size/1024,
		(cache_info.dc_conf.cc_wt ? "WT":"WB"),
		(cache_info.dc_conf.cc_sh ? ", shared I/D":""),
		((cache_info.dc_loop == 1) ? "direct mapped" : buf));
	seq_printf(m, "ITLB entries\t: %ld\n" "DTLB entries\t: %ld%s\n",
		cache_info.it_size,
		cache_info.dt_size,
		cache_info.dt_conf.tc_sh ? " - shared with ITLB":""
	);

#ifndef CONFIG_PA20
	/* BTLB - Block TLB */
	if (btlb_info.max_size==0) {
		seq_printf(m, "BTLB\t\t: not supported\n" );
	} else {
		seq_printf(m,
		"BTLB fixed\t: max. %d pages, pagesize=%d (%dMB)\n"
		"BTLB fix-entr.\t: %d instruction, %d data (%d combined)\n"
		"BTLB var-entr.\t: %d instruction, %d data (%d combined)\n",
		btlb_info.max_size, (int)4096,
		btlb_info.max_size>>8,
		btlb_info.fixed_range_info.num_i,
		btlb_info.fixed_range_info.num_d,
		btlb_info.fixed_range_info.num_comb,
		btlb_info.variable_range_info.num_i,
		btlb_info.variable_range_info.num_d,
		btlb_info.variable_range_info.num_comb
		);
	}
#endif
}

void __init
parisc_cache_init(void)
{
	if (pdc_cache_info(&cache_info) < 0)
		panic("parisc_cache_init: pdc_cache_info failed");

#if 0
	printk("ic_size %lx dc_size %lx it_size %lx\n",
		cache_info.ic_size,
		cache_info.dc_size,
		cache_info.it_size);

	printk("DC base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx\n",
		cache_info.dc_base,
		cache_info.dc_stride,
		cache_info.dc_count,
		cache_info.dc_loop);

	printk("dc_conf = 0x%lx alias %d blk %d line %d shift %d\n",
		*(unsigned long *) (&cache_info.dc_conf),
		cache_info.dc_conf.cc_alias,
		cache_info.dc_conf.cc_block,
		cache_info.dc_conf.cc_line,
		cache_info.dc_conf.cc_shift);
	printk("	wt %d sh %d cst %d hv %d\n",
		cache_info.dc_conf.cc_wt,
		cache_info.dc_conf.cc_sh,
		cache_info.dc_conf.cc_cst,
		cache_info.dc_conf.cc_hv);

	printk("IC base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx\n",
		cache_info.ic_base,
		cache_info.ic_stride,
		cache_info.ic_count,
		cache_info.ic_loop);

	printk("IT base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx off_base 0x%lx off_stride 0x%lx off_count 0x%lx\n",
		cache_info.it_sp_base,
		cache_info.it_sp_stride,
		cache_info.it_sp_count,
		cache_info.it_loop,
		cache_info.it_off_base,
		cache_info.it_off_stride,
		cache_info.it_off_count);

	printk("DT base 0x%lx stride 0x%lx count 0x%lx loop 0x%lx off_base 0x%lx off_stride 0x%lx off_count 0x%lx\n",
		cache_info.dt_sp_base,
		cache_info.dt_sp_stride,
		cache_info.dt_sp_count,
		cache_info.dt_loop,
		cache_info.dt_off_base,
		cache_info.dt_off_stride,
		cache_info.dt_off_count);

	printk("ic_conf = 0x%lx alias %d blk %d line %d shift %d\n",
		*(unsigned long *) (&cache_info.ic_conf),
		cache_info.ic_conf.cc_alias,
		cache_info.ic_conf.cc_block,
		cache_info.ic_conf.cc_line,
		cache_info.ic_conf.cc_shift);
	printk("	wt %d sh %d cst %d hv %d\n",
		cache_info.ic_conf.cc_wt,
		cache_info.ic_conf.cc_sh,
		cache_info.ic_conf.cc_cst,
		cache_info.ic_conf.cc_hv);

	printk("D-TLB conf: sh %d page %d cst %d aid %d sr %d\n",
		cache_info.dt_conf.tc_sh,
		cache_info.dt_conf.tc_page,
		cache_info.dt_conf.tc_cst,
		cache_info.dt_conf.tc_aid,
		cache_info.dt_conf.tc_sr);

	printk("I-TLB conf: sh %d page %d cst %d aid %d sr %d\n",
		cache_info.it_conf.tc_sh,
		cache_info.it_conf.tc_page,
		cache_info.it_conf.tc_cst,
		cache_info.it_conf.tc_aid,
		cache_info.it_conf.tc_sr);
#endif

	split_tlb = 0;
	if (cache_info.dt_conf.tc_sh == 0 || cache_info.dt_conf.tc_sh == 2) {
		if (cache_info.dt_conf.tc_sh == 2)
			printk(KERN_WARNING "Unexpected TLB configuration. "
			"Will flush I/D separately (could be optimized).\n");

		split_tlb = 1;
	}

	/* "New and Improved" version from Jim Hull
	 *	(1 << (cc_block-1)) * (cc_line << (4 + cnf.cc_shift))
	 * The following CAFL_STRIDE is an optimized version, see
	 * http://lists.parisc-linux.org/pipermail/parisc-linux/2004-June/023625.html
	 * http://lists.parisc-linux.org/pipermail/parisc-linux/2004-June/023671.html
	 */
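	/* Worked example (illustrative values only; the real ones come
	 * from PDC at boot): with cc_line = 2, cc_block = 1 and
	 * cc_shift = 2, CAFL_STRIDE evaluates to 2 << (3 + 1 + 2) = 128,
	 * i.e. 128 bytes between successive cache-line flushes. */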
#define CAFL_STRIDE(cnf) (cnf.cc_line << (3 + cnf.cc_block + cnf.cc_shift))
	dcache_stride = CAFL_STRIDE(cache_info.dc_conf);
	icache_stride = CAFL_STRIDE(cache_info.ic_conf);
#undef CAFL_STRIDE

#ifndef CONFIG_PA20
	if (pdc_btlb_info(&btlb_info) < 0) {
		memset(&btlb_info, 0, sizeof btlb_info);
	}
#endif

	if ((boot_cpu_data.pdc.capabilities & PDC_MODEL_NVA_MASK) ==
						PDC_MODEL_NVA_UNSUPPORTED) {
		printk(KERN_WARNING "parisc_cache_init: Only equivalent aliasing supported!\n");
#if 0
		panic("SMP kernel required to avoid non-equivalent aliasing");
#endif
	}
}

void __init disable_sr_hashing(void)
{
	int srhash_type, retval;
	unsigned long space_bits;

	switch (boot_cpu_data.cpu_type) {
	case pcx:	/* We shouldn't get this far. setup.c should prevent it. */
		BUG();
		return;

	case pcxs:
	case pcxt:
	case pcxt_:
		srhash_type = SRHASH_PCXST;
		break;

	case pcxl:
		srhash_type = SRHASH_PCXL;
		break;

	case pcxl2:	/* pcxl2 doesn't support space register hashing */
		return;

	default:	/* Currently all PA2.0 machines use the same instruction sequence */
		srhash_type = SRHASH_PA20;
		break;
	}

	disable_sr_hashing_asm(srhash_type);

	retval = pdc_spaceid_bits(&space_bits);
	/* If this procedure isn't implemented, don't panic. */
	if (retval < 0 && retval != PDC_BAD_OPTION)
		panic("pdc_spaceid_bits call failed.\n");
	if (space_bits != 0)
		panic("SpaceID hashing is still on!\n");
}

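/*
 * Flush or purge one page of a user mapping through a kernel "tmpalias"
 * mapping congruent with the user's virtual address, so that the right
 * cache lines are hit. Preemption is disabled so the temporary mapping
 * set up by the asm helper stays on this CPU.
 */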
static inline void
__flush_cache_page(struct vm_area_struct *vma, unsigned long vmaddr,
		   unsigned long physaddr)
{
	preempt_disable();
	flush_dcache_page_asm(physaddr, vmaddr);
	if (vma->vm_flags & VM_EXEC)
		flush_icache_page_asm(physaddr, vmaddr);
	preempt_enable();
}

static inline void
__purge_cache_page(struct vm_area_struct *vma, unsigned long vmaddr,
		   unsigned long physaddr)
{
	preempt_disable();
	purge_dcache_page_asm(physaddr, vmaddr);
	if (vma->vm_flags & VM_EXEC)
		flush_icache_page_asm(physaddr, vmaddr);
	preempt_enable();
}

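/*
 * flush_dcache_page() keeps the kernel and user views of a page cache
 * page coherent. If the page has no user mappings yet, the flush is
 * deferred by setting PG_dcache_dirty; update_mmu_cache() above then
 * performs it when the first user mapping is installed.
 */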
void flush_dcache_page(struct page *page)
{
	struct address_space *mapping = page_mapping_file(page);
	struct vm_area_struct *mpnt;
	unsigned long offset;
	unsigned long addr, old_addr = 0;
	pgoff_t pgoff;

	if (mapping && !mapping_mapped(mapping)) {
		set_bit(PG_dcache_dirty, &page->flags);
		return;
	}

	flush_kernel_dcache_page(page);

	if (!mapping)
		return;

	pgoff = page->index;

	/* We have carefully arranged in arch_get_unmapped_area() that
	 * *any* mappings of a file are always congruently mapped (whether
	 * declared as MAP_PRIVATE or MAP_SHARED), so we only need
	 * to flush one address here for them all to become coherent */

	flush_dcache_mmap_lock(mapping);
	vma_interval_tree_foreach(mpnt, &mapping->i_mmap, pgoff, pgoff) {
		offset = (pgoff - mpnt->vm_pgoff) << PAGE_SHIFT;
		addr = mpnt->vm_start + offset;

		/* The TLB is the engine of coherence on parisc: The
		 * CPU is entitled to speculate any page with a TLB
		 * mapping, so here we kill the mapping then flush the
		 * page along a special flush-only alias mapping.
		 * This guarantees that the page is no longer in the
		 * cache for any process, nor may it be speculatively
		 * read in (until the user or kernel specifically
		 * accesses it, of course). */

		flush_tlb_page(mpnt, addr);
		if (old_addr == 0 || (old_addr & (SHM_COLOUR - 1))
				      != (addr & (SHM_COLOUR - 1))) {
			__flush_cache_page(mpnt, addr, page_to_phys(page));
			if (parisc_requires_coherency() && old_addr)
				printk(KERN_ERR "INEQUIVALENT ALIASES 0x%lx and 0x%lx in file %pD\n", old_addr, addr, mpnt->vm_file);
			old_addr = addr;
		}
	}
	flush_dcache_mmap_unlock(mapping);
}
EXPORT_SYMBOL(flush_dcache_page);

/* Defined in arch/parisc/kernel/pacache.S */
EXPORT_SYMBOL(flush_kernel_dcache_range_asm);
EXPORT_SYMBOL(flush_kernel_dcache_page_asm);
EXPORT_SYMBOL(flush_data_cache_local);
EXPORT_SYMBOL(flush_kernel_icache_range_asm);

#define FLUSH_THRESHOLD 0x80000 /* 0.5MB */
static unsigned long parisc_cache_flush_threshold __ro_after_init = FLUSH_THRESHOLD;

#define FLUSH_TLB_THRESHOLD (16*1024) /* 16 KiB minimum TLB threshold */
static unsigned long parisc_tlb_flush_threshold __ro_after_init = FLUSH_TLB_THRESHOLD;

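/*
 * Calibrate the cache and TLB flush thresholds at boot using the CR16
 * interval timer (mfctl(16) reads cycle counts): time a whole-cache
 * flush against a range flush over the kernel image, then pick the
 * crossover size beyond which flushing everything is cheaper.
 */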
void __init parisc_setup_cache_timing(void)
{
	unsigned long rangetime, alltime;
	unsigned long size, start;
	unsigned long threshold;

	alltime = mfctl(16);
	flush_data_cache();
	alltime = mfctl(16) - alltime;

	size = (unsigned long)(_end - _text);
	rangetime = mfctl(16);
	flush_kernel_dcache_range((unsigned long)_text, size);
	rangetime = mfctl(16) - rangetime;

	printk(KERN_DEBUG "Whole cache flush %lu cycles, flushing %lu bytes %lu cycles\n",
		alltime, size, rangetime);

	threshold = L1_CACHE_ALIGN(size * alltime / rangetime);
	if (threshold > cache_info.dc_size)
		threshold = cache_info.dc_size;
	if (threshold)
		parisc_cache_flush_threshold = threshold;
	printk(KERN_INFO "Cache flush threshold set to %lu KiB\n",
		parisc_cache_flush_threshold/1024);

	/* calculate TLB flush threshold */

	/* On SMP machines, skip the TLB flush measurement of kernel text,
	 * which has been mapped with huge pages. */
	if (num_online_cpus() > 1 && !parisc_requires_coherency()) {
		threshold = max(cache_info.it_size, cache_info.dt_size);
		threshold *= PAGE_SIZE;
		threshold /= num_online_cpus();
		goto set_tlb_threshold;
	}

	size = 0;
	start = (unsigned long) _text;
	rangetime = mfctl(16);
	while (start < (unsigned long) _end) {
		flush_tlb_kernel_range(start, start + PAGE_SIZE);
		start += PAGE_SIZE;
		size += PAGE_SIZE;
	}
	rangetime = mfctl(16) - rangetime;

	alltime = mfctl(16);
	flush_tlb_all();
	alltime = mfctl(16) - alltime;

	printk(KERN_INFO "Whole TLB flush %lu cycles, Range flush %lu bytes %lu cycles\n",
		alltime, size, rangetime);

	threshold = PAGE_ALIGN((num_online_cpus() * size * alltime) / rangetime);
	printk(KERN_INFO "Calculated TLB flush threshold %lu KiB\n",
		threshold/1024);

set_tlb_threshold:
	if (threshold > parisc_tlb_flush_threshold)
		parisc_tlb_flush_threshold = threshold;
	printk(KERN_INFO "TLB flush threshold set to %lu KiB\n",
		parisc_tlb_flush_threshold/1024);
}

extern void purge_kernel_dcache_page_asm(unsigned long);
extern void clear_user_page_asm(void *, unsigned long);
extern void copy_user_page_asm(void *, void *, unsigned long);

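/*
 * Flush one page through the kernel mapping and then purge its TLB
 * entry; with the translation gone, the CPU cannot speculatively pull
 * the lines back into the cache.
 */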
void flush_kernel_dcache_page_addr(void *addr)
{
	unsigned long flags;

	flush_kernel_dcache_page_asm(addr);
	purge_tlb_start(flags);
	pdtlb_kernel(addr);
	purge_tlb_end(flags);
}
EXPORT_SYMBOL(flush_kernel_dcache_page_addr);

void copy_user_page(void *vto, void *vfrom, unsigned long vaddr,
	struct page *pg)
{
	/* Copy using kernel mapping. No coherency is needed (all in
	   kunmap) for the `to' page. However, the `from' page needs to
	   be flushed through a mapping equivalent to the user mapping
	   before it can be accessed through the kernel mapping. */
	preempt_disable();
	flush_dcache_page_asm(__pa(vfrom), vaddr);
	copy_page_asm(vto, vfrom);
	preempt_enable();
}
EXPORT_SYMBOL(copy_user_page);

/* __flush_tlb_range()
 *
 * returns 1 if all TLBs were flushed.
 */
int __flush_tlb_range(unsigned long sid, unsigned long start,
		      unsigned long end)
{
	unsigned long flags;

	if ((!IS_ENABLED(CONFIG_SMP) || !arch_irqs_disabled()) &&
	    end - start >= parisc_tlb_flush_threshold) {
		flush_tlb_all();
		return 1;
	}

	/* Purge TLB entries for small ranges using the pdtlb and
	   pitlb instructions. These instructions execute locally
	   but cause a purge request to be broadcast to other TLBs. */
	while (start < end) {
		purge_tlb_start(flags);
		mtsp(sid, 1);
		pdtlb(start);
		pitlb(start);
		purge_tlb_end(flags);
		start += PAGE_SIZE;
	}
	return 0;
}

static void cacheflush_h_tmp_function(void *dummy)
{
	flush_cache_all_local();
}

void flush_cache_all(void)
{
	on_each_cpu(cacheflush_h_tmp_function, NULL, 1);
}

static inline unsigned long mm_total_size(struct mm_struct *mm)
{
	struct vm_area_struct *vma;
	unsigned long usize = 0;

	for (vma = mm->mmap; vma; vma = vma->vm_next)
		usize += vma->vm_end - vma->vm_start;
	return usize;
}

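/*
 * Walk the page tables for @addr and return a pointer to the PTE, or
 * NULL if any level is empty. Callers only read the entry, so no page
 * table lock is taken here.
 */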
static inline pte_t *get_ptep(pgd_t *pgd, unsigned long addr)
{
	pte_t *ptep = NULL;

	if (!pgd_none(*pgd)) {
		p4d_t *p4d = p4d_offset(pgd, addr);
		if (!p4d_none(*p4d)) {
			pud_t *pud = pud_offset(p4d, addr);
			if (!pud_none(*pud)) {
				pmd_t *pmd = pmd_offset(pud, addr);
				if (!pmd_none(*pmd))
					ptep = pte_offset_map(pmd, addr);
			}
		}
	}
	return ptep;
}

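/*
 * Three strategies, cheapest first: flush everything once the mm is
 * larger than the calibrated threshold; use the fast asm range flushes
 * when the mm is the one currently loaded in space register 3 (mfsp(3));
 * otherwise walk the page tables and flush page by page.
 */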
void flush_cache_mm(struct mm_struct *mm)
{
	struct vm_area_struct *vma;
	pgd_t *pgd;

	/* Flushing the whole cache on each cpu takes forever on
	   rp3440, etc. So, avoid it if the mm isn't too big. */
	if ((!IS_ENABLED(CONFIG_SMP) || !arch_irqs_disabled()) &&
	    mm_total_size(mm) >= parisc_cache_flush_threshold) {
		if (mm->context)
			flush_tlb_all();
		flush_cache_all();
		return;
	}

	if (mm->context == mfsp(3)) {
		for (vma = mm->mmap; vma; vma = vma->vm_next) {
			flush_user_dcache_range_asm(vma->vm_start, vma->vm_end);
			if (vma->vm_flags & VM_EXEC)
				flush_user_icache_range_asm(vma->vm_start, vma->vm_end);
			flush_tlb_range(vma, vma->vm_start, vma->vm_end);
		}
		return;
	}

	pgd = mm->pgd;
	for (vma = mm->mmap; vma; vma = vma->vm_next) {
		unsigned long addr;

		for (addr = vma->vm_start; addr < vma->vm_end;
		     addr += PAGE_SIZE) {
			unsigned long pfn;
			pte_t *ptep = get_ptep(pgd, addr);
			if (!ptep)
				continue;
			pfn = pte_pfn(*ptep);
			if (!pfn_valid(pfn))
				continue;
			if (unlikely(mm->context)) {
				flush_tlb_page(vma, addr);
				__flush_cache_page(vma, addr, PFN_PHYS(pfn));
			} else {
				__purge_cache_page(vma, addr, PFN_PHYS(pfn));
			}
		}
	}
}

void flush_cache_range(struct vm_area_struct *vma,
		unsigned long start, unsigned long end)
{
	pgd_t *pgd;
	unsigned long addr;

	if ((!IS_ENABLED(CONFIG_SMP) || !arch_irqs_disabled()) &&
	    end - start >= parisc_cache_flush_threshold) {
		if (vma->vm_mm->context)
			flush_tlb_range(vma, start, end);
		flush_cache_all();
		return;
	}

	if (vma->vm_mm->context == mfsp(3)) {
		flush_user_dcache_range_asm(start, end);
		if (vma->vm_flags & VM_EXEC)
			flush_user_icache_range_asm(start, end);
		flush_tlb_range(vma, start, end);
		return;
	}

	pgd = vma->vm_mm->pgd;
	for (addr = vma->vm_start; addr < vma->vm_end; addr += PAGE_SIZE) {
		unsigned long pfn;
		pte_t *ptep = get_ptep(pgd, addr);
		if (!ptep)
			continue;
		pfn = pte_pfn(*ptep);
		if (pfn_valid(pfn)) {
			if (unlikely(vma->vm_mm->context)) {
				flush_tlb_page(vma, addr);
				__flush_cache_page(vma, addr, PFN_PHYS(pfn));
			} else {
				__purge_cache_page(vma, addr, PFN_PHYS(pfn));
			}
		}
	}
}

void
flush_cache_page(struct vm_area_struct *vma, unsigned long vmaddr, unsigned long pfn)
{
	if (pfn_valid(pfn)) {
		if (likely(vma->vm_mm->context)) {
			flush_tlb_page(vma, vmaddr);
			__flush_cache_page(vma, vmaddr, PFN_PHYS(pfn));
		} else {
			__purge_cache_page(vma, vmaddr, PFN_PHYS(pfn));
		}
	}
}

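/*
 * The vmap helpers below keep a vmalloc/vmap range coherent with the
 * data cache: flush_kernel_vmap_range() writes dirty lines back before
 * the buffer is read by DMA, while invalidate_kernel_vmap_range()
 * discards stale lines after DMA has written into it.
 */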
void flush_kernel_vmap_range(void *vaddr, int size)
{
	unsigned long start = (unsigned long)vaddr;
	unsigned long end = start + size;

	if ((!IS_ENABLED(CONFIG_SMP) || !arch_irqs_disabled()) &&
	    (unsigned long)size >= parisc_cache_flush_threshold) {
		flush_tlb_kernel_range(start, end);
		flush_data_cache();
		return;
	}

	flush_kernel_dcache_range_asm(start, end);
	flush_tlb_kernel_range(start, end);
}
EXPORT_SYMBOL(flush_kernel_vmap_range);

void invalidate_kernel_vmap_range(void *vaddr, int size)
{
	unsigned long start = (unsigned long)vaddr;
	unsigned long end = start + size;

	if ((!IS_ENABLED(CONFIG_SMP) || !arch_irqs_disabled()) &&
	    (unsigned long)size >= parisc_cache_flush_threshold) {
		flush_tlb_kernel_range(start, end);
		flush_data_cache();
		return;
	}

	purge_kernel_dcache_range_asm(start, end);
	flush_tlb_kernel_range(start, end);
}
EXPORT_SYMBOL(invalidate_kernel_vmap_range);