Loading...
1/*
2 * arch/arm/include/asm/tlb.h
3 *
4 * Copyright (C) 2002 Russell King
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 as
8 * published by the Free Software Foundation.
9 *
10 * Experimentation shows that on a StrongARM, it appears to be faster
11 * to use the "invalidate whole tlb" rather than "invalidate single
12 * tlb" for this.
13 *
14 * This appears true for both the process fork+exit case, as well as
15 * the munmap-large-area case.
16 */
17#ifndef __ASMARM_TLB_H
18#define __ASMARM_TLB_H
19
20#include <asm/cacheflush.h>
21
22#ifndef CONFIG_MMU
23
24#include <linux/pagemap.h>
25
26#define tlb_flush(tlb) ((void) tlb)
27
28#include <asm-generic/tlb.h>
29
30#else /* !CONFIG_MMU */
31
32#include <linux/swap.h>
33#include <asm/pgalloc.h>
34#include <asm/tlbflush.h>
35
36/*
37 * We need to delay page freeing for SMP as other CPUs can access pages
38 * which have been removed but not yet had their TLB entries invalidated.
39 * Also, as ARMv7 speculative prefetch can drag new entries into the TLB,
40 * we need to apply this same delaying tactic to ensure correct operation.
41 */
/*
 * tlb_fast_mode() evaluates to 1 when pages may be freed as soon as they
 * are removed, and to 0 when freeing has to be batched until after the
 * TLB flush (any SMP or ARMv7 configuration).
 */
#if !defined(CONFIG_SMP) && !defined(CONFIG_CPU_32v7)
#define tlb_fast_mode(tlb)	1
#else
#define tlb_fast_mode(tlb)	0
#endif
47
48#define MMU_GATHER_BUNDLE 8
49
50/*
51 * TLB handling. This allows us to remove pages from the page
52 * tables, and efficiently handle the TLB issues.
53 */
54struct mmu_gather {
55 struct mm_struct *mm;
56 unsigned int fullmm;
57 struct vm_area_struct *vma;
58 unsigned long range_start;
59 unsigned long range_end;
60 unsigned int nr;
61 unsigned int max;
62 struct page **pages;
63 struct page *local[MMU_GATHER_BUNDLE];
64};
65
66DECLARE_PER_CPU(struct mmu_gather, mmu_gathers);
67
/*
 * This is unnecessarily complex.  There are three ways the TLB shootdown
 * code is used:
 *  1. Unmapping a range of vmas.  See zap_page_range(), unmap_region().
 *     tlb->fullmm = 0, and tlb_start_vma/tlb_end_vma will be called.
 *     tlb->vma will be non-NULL.
 *  2. Unmapping all vmas.  See exit_mmap().
 *     tlb->fullmm = 1, and tlb_start_vma/tlb_end_vma will be called, but
 *     they do nothing in this mode, so tlb->vma stays NULL.
 *     Additionally, page tables will be freed.
 *  3. Unmapping argument pages.  See shift_arg_pages().
 *     tlb->fullmm = 0, but tlb_start_vma/tlb_end_vma will not be called.
 *     tlb->vma will be NULL.
 */
81static inline void tlb_flush(struct mmu_gather *tlb)
82{
83 if (tlb->fullmm || !tlb->vma)
84 flush_tlb_mm(tlb->mm);
85 else if (tlb->range_end > 0) {
86 flush_tlb_range(tlb->vma, tlb->range_start, tlb->range_end);
87 tlb->range_start = TASK_SIZE;
88 tlb->range_end = 0;
89 }
90}
91
92static inline void tlb_add_flush(struct mmu_gather *tlb, unsigned long addr)
93{
94 if (!tlb->fullmm) {
95 if (addr < tlb->range_start)
96 tlb->range_start = addr;
97 if (addr + PAGE_SIZE > tlb->range_end)
98 tlb->range_end = addr + PAGE_SIZE;
99 }
100}
101
102static inline void __tlb_alloc_page(struct mmu_gather *tlb)
103{
104 unsigned long addr = __get_free_pages(GFP_NOWAIT | __GFP_NOWARN, 0);
105
106 if (addr) {
107 tlb->pages = (void *)addr;
108 tlb->max = PAGE_SIZE / sizeof(struct page *);
109 }
110}
111
112static inline void tlb_flush_mmu(struct mmu_gather *tlb)
113{
114 tlb_flush(tlb);
115 if (!tlb_fast_mode(tlb)) {
116 free_pages_and_swap_cache(tlb->pages, tlb->nr);
117 tlb->nr = 0;
118 if (tlb->pages == tlb->local)
119 __tlb_alloc_page(tlb);
120 }
121}
122
123static inline void
124tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm, unsigned int fullmm)
125{
126 tlb->mm = mm;
127 tlb->fullmm = fullmm;
128 tlb->vma = NULL;
129 tlb->max = ARRAY_SIZE(tlb->local);
130 tlb->pages = tlb->local;
131 tlb->nr = 0;
132 __tlb_alloc_page(tlb);
133}
134
135static inline void
136tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start, unsigned long end)
137{
138 tlb_flush_mmu(tlb);
139
140 /* keep the page table cache within bounds */
141 check_pgt_cache();
142
143 if (tlb->pages != tlb->local)
144 free_pages((unsigned long)tlb->pages, 0);
145}
146
147/*
148 * Memorize the range for the TLB flush.
149 */
150static inline void
151tlb_remove_tlb_entry(struct mmu_gather *tlb, pte_t *ptep, unsigned long addr)
152{
153 tlb_add_flush(tlb, addr);
154}
155
156/*
157 * In the case of tlb vma handling, we can optimise these away in the
158 * case where we're doing a full MM flush. When we're doing a munmap,
159 * the vmas are adjusted to only cover the region to be torn down.
160 */
161static inline void
162tlb_start_vma(struct mmu_gather *tlb, struct vm_area_struct *vma)
163{
164 if (!tlb->fullmm) {
165 flush_cache_range(vma, vma->vm_start, vma->vm_end);
166 tlb->vma = vma;
167 tlb->range_start = TASK_SIZE;
168 tlb->range_end = 0;
169 }
170}
171
172static inline void
173tlb_end_vma(struct mmu_gather *tlb, struct vm_area_struct *vma)
174{
175 if (!tlb->fullmm)
176 tlb_flush(tlb);
177}
178
179static inline int __tlb_remove_page(struct mmu_gather *tlb, struct page *page)
180{
181 if (tlb_fast_mode(tlb)) {
182 free_page_and_swap_cache(page);
183 return 1; /* avoid calling tlb_flush_mmu */
184 }
185
186 tlb->pages[tlb->nr++] = page;
187 VM_BUG_ON(tlb->nr > tlb->max);
188 return tlb->max - tlb->nr;
189}
190
/*
 * Hand @page over for freeing and flush the gather structure as soon as
 * its queue has no room left.
 */
static inline void tlb_remove_page(struct mmu_gather *tlb, struct page *page)
{
	int slots_left = __tlb_remove_page(tlb, page);

	if (slots_left == 0)
		tlb_flush_mmu(tlb);
}
196
197static inline void __pte_free_tlb(struct mmu_gather *tlb, pgtable_t pte,
198 unsigned long addr)
199{
200 pgtable_page_dtor(pte);
201 tlb_add_flush(tlb, addr);
202 tlb_remove_page(tlb, pte);
203}
204
/* Page table freeing hooks: pte tables are batched, pmds are freed directly. */
#define pte_free_tlb(tlb, ptep, addr)	__pte_free_tlb(tlb, ptep, addr)
#define pmd_free_tlb(tlb, pmdp, addr)	pmd_free((tlb)->mm, pmdp)

/* Expands to an empty statement. */
#define tlb_migrate_finish(mm)		do { } while (0)
209
210#endif /* CONFIG_MMU */
211#endif
1/*
2 * arch/arm/include/asm/tlb.h
3 *
4 * Copyright (C) 2002 Russell King
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 as
8 * published by the Free Software Foundation.
9 *
10 * Experimentation shows that on a StrongARM, it appears to be faster
11 * to use the "invalidate whole tlb" rather than "invalidate single
12 * tlb" for this.
13 *
14 * This appears true for both the process fork+exit case, as well as
15 * the munmap-large-area case.
16 */
17#ifndef __ASMARM_TLB_H
18#define __ASMARM_TLB_H
19
20#include <asm/cacheflush.h>
21
22#ifndef CONFIG_MMU
23
24#include <linux/pagemap.h>
25
26#define tlb_flush(tlb) ((void) tlb)
27
28#include <asm-generic/tlb.h>
29
30#else /* !CONFIG_MMU */
31
32#include <linux/swap.h>
33#include <asm/pgalloc.h>
34#include <asm/tlbflush.h>
35
36#define MMU_GATHER_BUNDLE 8
37
38#ifdef CONFIG_HAVE_RCU_TABLE_FREE
/*
 * Free one page table that was queued through the table batching code.
 * @_table is the struct page of the table, passed as an opaque pointer.
 */
static inline void __tlb_remove_table(void *_table)
{
	struct page *table_page = _table;

	free_page_and_swap_cache(table_page);
}
43
44struct mmu_table_batch {
45 struct rcu_head rcu;
46 unsigned int nr;
47 void *tables[0];
48};
49
50#define MAX_TABLE_BATCH \
51 ((PAGE_SIZE - sizeof(struct mmu_table_batch)) / sizeof(void *))
52
53extern void tlb_table_flush(struct mmu_gather *tlb);
54extern void tlb_remove_table(struct mmu_gather *tlb, void *table);
55
56#define tlb_remove_entry(tlb, entry) tlb_remove_table(tlb, entry)
57#else
58#define tlb_remove_entry(tlb, entry) tlb_remove_page(tlb, entry)
59#endif /* CONFIG_HAVE_RCU_TABLE_FREE */
60
61/*
62 * TLB handling. This allows us to remove pages from the page
63 * tables, and efficiently handle the TLB issues.
64 */
65struct mmu_gather {
66 struct mm_struct *mm;
67#ifdef CONFIG_HAVE_RCU_TABLE_FREE
68 struct mmu_table_batch *batch;
69 unsigned int need_flush;
70#endif
71 unsigned int fullmm;
72 struct vm_area_struct *vma;
73 unsigned long start, end;
74 unsigned long range_start;
75 unsigned long range_end;
76 unsigned int nr;
77 unsigned int max;
78 struct page **pages;
79 struct page *local[MMU_GATHER_BUNDLE];
80};
81
82DECLARE_PER_CPU(struct mmu_gather, mmu_gathers);
83
/*
 * This is unnecessarily complex.  There are three ways the TLB shootdown
 * code is used:
 *  1. Unmapping a range of vmas.  See zap_page_range(), unmap_region().
 *     tlb->fullmm = 0, and tlb_start_vma/tlb_end_vma will be called.
 *     tlb->vma will be non-NULL.
 *  2. Unmapping all vmas.  See exit_mmap().
 *     tlb->fullmm = 1, and tlb_start_vma/tlb_end_vma will be called, but
 *     they do nothing in this mode, so tlb->vma stays NULL.
 *     Additionally, page tables will be freed.
 *  3. Unmapping argument pages.  See shift_arg_pages().
 *     tlb->fullmm = 0, but tlb_start_vma/tlb_end_vma will not be called.
 *     tlb->vma will be NULL.
 */
97static inline void tlb_flush(struct mmu_gather *tlb)
98{
99 if (tlb->fullmm || !tlb->vma)
100 flush_tlb_mm(tlb->mm);
101 else if (tlb->range_end > 0) {
102 flush_tlb_range(tlb->vma, tlb->range_start, tlb->range_end);
103 tlb->range_start = TASK_SIZE;
104 tlb->range_end = 0;
105 }
106}
107
108static inline void tlb_add_flush(struct mmu_gather *tlb, unsigned long addr)
109{
110 if (!tlb->fullmm) {
111 if (addr < tlb->range_start)
112 tlb->range_start = addr;
113 if (addr + PAGE_SIZE > tlb->range_end)
114 tlb->range_end = addr + PAGE_SIZE;
115 }
116}
117
118static inline void __tlb_alloc_page(struct mmu_gather *tlb)
119{
120 unsigned long addr = __get_free_pages(GFP_NOWAIT | __GFP_NOWARN, 0);
121
122 if (addr) {
123 tlb->pages = (void *)addr;
124 tlb->max = PAGE_SIZE / sizeof(struct page *);
125 }
126}
127
/*
 * Perform only the invalidation half of a flush: the TLB itself and,
 * when table batching is configured, the pending page table batch.
 * Queued pages are not freed here.
 */
static inline void tlb_flush_mmu_tlbonly(struct mmu_gather *tlb)
{
	tlb_flush(tlb);

#ifdef CONFIG_HAVE_RCU_TABLE_FREE
	/* Must follow the TLB flush above. */
	tlb_table_flush(tlb);
#endif
}
135
136static inline void tlb_flush_mmu_free(struct mmu_gather *tlb)
137{
138 free_pages_and_swap_cache(tlb->pages, tlb->nr);
139 tlb->nr = 0;
140 if (tlb->pages == tlb->local)
141 __tlb_alloc_page(tlb);
142}
143
/*
 * Full flush of @tlb: invalidate first, then free the queued pages.
 * The order matters - pages are only released once no TLB entry can
 * still refer to them.
 */
static inline void tlb_flush_mmu(struct mmu_gather *tlb)
{
	/* Step 1: TLB (and table batch) invalidation. */
	tlb_flush_mmu_tlbonly(tlb);

	/* Step 2: give the queued pages back. */
	tlb_flush_mmu_free(tlb);
}
149
150static inline void
151tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm, unsigned long start, unsigned long end)
152{
153 tlb->mm = mm;
154 tlb->fullmm = !(start | (end+1));
155 tlb->start = start;
156 tlb->end = end;
157 tlb->vma = NULL;
158 tlb->max = ARRAY_SIZE(tlb->local);
159 tlb->pages = tlb->local;
160 tlb->nr = 0;
161 __tlb_alloc_page(tlb);
162
163#ifdef CONFIG_HAVE_RCU_TABLE_FREE
164 tlb->batch = NULL;
165#endif
166}
167
168static inline void
169tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start, unsigned long end)
170{
171 tlb_flush_mmu(tlb);
172
173 /* keep the page table cache within bounds */
174 check_pgt_cache();
175
176 if (tlb->pages != tlb->local)
177 free_pages((unsigned long)tlb->pages, 0);
178}
179
180/*
181 * Memorize the range for the TLB flush.
182 */
183static inline void
184tlb_remove_tlb_entry(struct mmu_gather *tlb, pte_t *ptep, unsigned long addr)
185{
186 tlb_add_flush(tlb, addr);
187}
188
189/*
190 * In the case of tlb vma handling, we can optimise these away in the
191 * case where we're doing a full MM flush. When we're doing a munmap,
192 * the vmas are adjusted to only cover the region to be torn down.
193 */
194static inline void
195tlb_start_vma(struct mmu_gather *tlb, struct vm_area_struct *vma)
196{
197 if (!tlb->fullmm) {
198 flush_cache_range(vma, vma->vm_start, vma->vm_end);
199 tlb->vma = vma;
200 tlb->range_start = TASK_SIZE;
201 tlb->range_end = 0;
202 }
203}
204
205static inline void
206tlb_end_vma(struct mmu_gather *tlb, struct vm_area_struct *vma)
207{
208 if (!tlb->fullmm)
209 tlb_flush(tlb);
210}
211
212static inline int __tlb_remove_page(struct mmu_gather *tlb, struct page *page)
213{
214 tlb->pages[tlb->nr++] = page;
215 VM_BUG_ON(tlb->nr > tlb->max);
216 return tlb->max - tlb->nr;
217}
218
/*
 * Hand @page over for freeing and flush the gather structure as soon as
 * its queue has no room left.
 */
static inline void tlb_remove_page(struct mmu_gather *tlb, struct page *page)
{
	int slots_left = __tlb_remove_page(tlb, page);

	if (slots_left == 0)
		tlb_flush_mmu(tlb);
}
224
225static inline void __pte_free_tlb(struct mmu_gather *tlb, pgtable_t pte,
226 unsigned long addr)
227{
228 pgtable_page_dtor(pte);
229
230#ifdef CONFIG_ARM_LPAE
231 tlb_add_flush(tlb, addr);
232#else
233 /*
234 * With the classic ARM MMU, a pte page has two corresponding pmd
235 * entries, each covering 1MB.
236 */
237 addr &= PMD_MASK;
238 tlb_add_flush(tlb, addr + SZ_1M - PAGE_SIZE);
239 tlb_add_flush(tlb, addr + SZ_1M);
240#endif
241
242 tlb_remove_entry(tlb, pte);
243}
244
245static inline void __pmd_free_tlb(struct mmu_gather *tlb, pmd_t *pmdp,
246 unsigned long addr)
247{
248#ifdef CONFIG_ARM_LPAE
249 tlb_add_flush(tlb, addr);
250 tlb_remove_entry(tlb, virt_to_page(pmdp));
251#endif
252}
253
254static inline void
255tlb_remove_pmd_tlb_entry(struct mmu_gather *tlb, pmd_t *pmdp, unsigned long addr)
256{
257 tlb_add_flush(tlb, addr);
258}
259
/* Page table freeing hooks: pte and pmd tables go through the gather, puds are freed directly. */
#define pte_free_tlb(tlb, ptep, addr)	__pte_free_tlb(tlb, ptep, addr)
#define pmd_free_tlb(tlb, pmdp, addr)	__pmd_free_tlb(tlb, pmdp, addr)
#define pud_free_tlb(tlb, pudp, addr)	pud_free((tlb)->mm, pudp)

/* Expands to an empty statement. */
#define tlb_migrate_finish(mm)		do { } while (0)
265
266#endif /* CONFIG_MMU */
267#endif