#ifndef _ASM_IA64_TLB_H
#define _ASM_IA64_TLB_H
/*
 * Based on <asm-generic/tlb.h>.
 *
 * Copyright (C) 2002-2003 Hewlett-Packard Co
 *	David Mosberger-Tang <davidm@hpl.hp.com>
 */
/*
 * Removing a translation from a page table (including TLB-shootdown) is a four-step
 * procedure:
 *
 *	(1) Flush (virtual) caches --- ensures virtual memory is coherent with kernel memory
 *	    (this is a no-op on ia64).
 *	(2) Clear the relevant portions of the page-table
 *	(3) Flush the TLBs --- ensures that stale content is gone from CPU TLBs
 *	(4) Release the pages that were freed up in step (2).
 *
 * Note that the ordering of these steps is crucial to avoid races on MP machines.
 *
 * The Linux kernel defines several platform-specific hooks for TLB-shootdown.  When
 * unmapping a portion of the virtual address space, these hooks are called according to
 * the following template:
 *
 *	tlb <- tlb_gather_mmu(mm, full_mm_flush);	// start unmap for address space MM
 *	{
 *	  for each vma that needs a shootdown do {
 *	    tlb_start_vma(tlb, vma);
 *	    for each page-table-entry PTE that needs to be removed do {
 *	      tlb_remove_tlb_entry(tlb, pte, address);
 *	      if (pte refers to a normal page) {
 *	        tlb_remove_page(tlb, page);
 *	      }
 *	    }
 *	    tlb_end_vma(tlb, vma);
 *	  }
 *	}
 *	tlb_finish_mmu(tlb, start, end);	// finish unmap for address space MM
 */
#include <linux/mm.h>
#include <linux/pagemap.h>
#include <linux/swap.h>

#include <asm/pgalloc.h>
#include <asm/processor.h>
#include <asm/tlbflush.h>
#include <asm/machvec.h>

#ifdef CONFIG_SMP
# define tlb_fast_mode(tlb)	((tlb)->nr == ~0U)
#else
# define tlb_fast_mode(tlb)	(1)
#endif

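/*
 * In fast mode (used when only one CPU is online, see tlb_gather_mmu()
 * below) there are no remote TLBs to shoot down, so __tlb_remove_page()
 * frees each page immediately instead of gathering it for a deferred
 * release after the flush.
 */
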
/*
 * If we can't allocate a page to make a big batch of page pointers
 * to work on, then just handle a few from the on-stack structure.
 */
#define IA64_GATHER_BUNDLE	8

struct mmu_gather {
	struct mm_struct	*mm;
	unsigned int		nr;		/* == ~0U => fast mode */
	unsigned int		max;
	unsigned char		fullmm;		/* non-zero means full mm flush */
	unsigned char		need_flush;	/* really unmapped some PTEs? */
	unsigned long		start_addr;
	unsigned long		end_addr;
	struct page		**pages;
	struct page		*local[IA64_GATHER_BUNDLE];
};

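/*
 * tlb->pages initially points at the small on-stack local[] array; once a
 * batch outgrows it, __tlb_alloc_page() below switches to a full page of
 * page pointers and raises tlb->max to match.
 */
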
struct ia64_tr_entry {
	u64 ifa;
	u64 itir;
	u64 pte;
	u64 rr;
}; /* record of a translation register (TR) entry */

extern int ia64_itr_entry(u64 target_mask, u64 va, u64 pte, u64 log_size);
extern void ia64_ptr_entry(u64 target_mask, int slot);

extern struct ia64_tr_entry *ia64_idtrs[NR_CPUS];

/*
 * Region register (RR) macros.
 */
#define RR_TO_VE(val)	(((val) >> 0) & 0x0000000000000001)
#define RR_VE(val)	(((val) & 0x0000000000000001) << 0)
#define RR_VE_MASK	0x0000000000000001L
#define RR_VE_SHIFT	0
#define RR_TO_PS(val)	(((val) >> 2) & 0x000000000000003f)
#define RR_PS(val)	(((val) & 0x000000000000003f) << 2)
#define RR_PS_MASK	0x00000000000000fcL
#define RR_PS_SHIFT	2
#define RR_RID_MASK	0x00000000ffffff00L
#define RR_TO_RID(val)	((val >> 8) & 0xffffff)

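/*
 * Worked example (illustrative value only): for a region register holding
 * 0x1235, RR_TO_VE() yields 1 (VHPT walker enable, bit 0), RR_TO_PS()
 * yields 0x0d (bits 2..7, i.e. a preferred page size of 2^13 = 8KB), and
 * RR_TO_RID() yields region ID 0x12 (bits 8..31).
 */
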
/*
 * Flush the TLB for address range START to END and, if not in fast mode, release the
 * freed pages that were gathered up to this point.
 */
static inline void
ia64_tlb_flush_mmu (struct mmu_gather *tlb, unsigned long start, unsigned long end)
{
	unsigned int nr;

	if (!tlb->need_flush)
		return;
	tlb->need_flush = 0;

	if (tlb->fullmm) {
		/*
		 * Tearing down the entire address space.  This happens both as a result
		 * of exit() and execve().  The latter case necessitates the call to
		 * flush_tlb_mm() here.
		 */
		flush_tlb_mm(tlb->mm);
	} else if (unlikely (end - start >= 1024*1024*1024*1024UL
			     || REGION_NUMBER(start) != REGION_NUMBER(end - 1)))
	{
		/*
		 * If we flush more than a tera-byte or across regions, we're probably
		 * better off just flushing the entire TLB(s).  This should be very rare
		 * and is not worth optimizing for.
		 */
		flush_tlb_all();
	} else {
		/*
		 * XXX fix me: flush_tlb_range() should take an mm pointer instead of a
		 * vma pointer.
		 */
		struct vm_area_struct vma;

		vma.vm_mm = tlb->mm;
		/* flush the address range from the tlb: */
		flush_tlb_range(&vma, start, end);
		/* now flush the virt. page-table area mapping the address range: */
		flush_tlb_range(&vma, ia64_thash(start), ia64_thash(end));
	}

	/* lastly, release the freed pages */
	nr = tlb->nr;
	if (!tlb_fast_mode(tlb)) {
		unsigned long i;
		tlb->nr = 0;
		tlb->start_addr = ~0UL;
		for (i = 0; i < nr; ++i)
			free_page_and_swap_cache(tlb->pages[i]);
	}
}

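/*
 * REGION_NUMBER() extracts the top three address bits, so the cross-region
 * test above fires whenever [start, end) straddles a 2^61-byte region
 * boundary.  For example (illustrative addresses), start = 0x1ffffffffffff000
 * (region 0) and end = 0x2000000000001000 (region 1) take the
 * flush_tlb_all() path even though the range itself is tiny.
 */
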
static inline void __tlb_alloc_page(struct mmu_gather *tlb)
{
	unsigned long addr = __get_free_pages(GFP_NOWAIT | __GFP_NOWARN, 0);

	if (addr) {
		tlb->pages = (void *)addr;
		tlb->max = PAGE_SIZE / sizeof(void *);
	}
}


static inline void
tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm, unsigned int full_mm_flush)
{
	tlb->mm = mm;
	tlb->max = ARRAY_SIZE(tlb->local);
	tlb->pages = tlb->local;
	/*
	 * Use fast mode if only 1 CPU is online.
	 *
	 * It would be tempting to turn on fast-mode for full_mm_flush as well.  But this
	 * doesn't work because of speculative accesses and software prefetching: the page
	 * table of "mm" may be (and usually is) the currently active page table and even
	 * though the kernel won't do any user-space accesses during the TLB shoot down, a
	 * compiler might use speculation or lfetch.fault on what happens to be a valid
	 * user-space address.  This in turn could trigger a TLB miss fault (or a VHPT
	 * walk) and re-insert a TLB entry we just removed.  Slow mode avoids such
	 * problems.  (We could make fast-mode work by switching the current task to a
	 * different "mm" during the shootdown.) --davidm 08/02/2002
	 */
	tlb->nr = (num_online_cpus() == 1) ? ~0U : 0;
	tlb->fullmm = full_mm_flush;
	tlb->start_addr = ~0UL;
}

/*
 * Called at the end of the shootdown operation to free up any resources that were
 * collected.
 */
static inline void
tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start, unsigned long end)
{
	/*
	 * Note: tlb->nr may be 0 at this point, so we can't rely on tlb->start_addr and
	 * tlb->end_addr.
	 */
	ia64_tlb_flush_mmu(tlb, start, end);

	/* keep the page table cache within bounds */
	check_pgt_cache();

	if (tlb->pages != tlb->local)
		free_pages((unsigned long)tlb->pages, 0);
}

/*
 * Logically, this routine frees PAGE.  On MP machines, the actual freeing of the page
 * must be delayed until after the TLB has been flushed (see comments at the beginning of
 * this file).
 */
static inline int __tlb_remove_page(struct mmu_gather *tlb, struct page *page)
{
	tlb->need_flush = 1;

	if (tlb_fast_mode(tlb)) {
		free_page_and_swap_cache(page);
		return 1; /* avoid calling tlb_flush_mmu */
	}

	if (!tlb->nr && tlb->pages == tlb->local)
		__tlb_alloc_page(tlb);

	tlb->pages[tlb->nr++] = page;
	VM_BUG_ON(tlb->nr > tlb->max);

	return tlb->max - tlb->nr;
}

static inline void tlb_flush_mmu(struct mmu_gather *tlb)
{
	ia64_tlb_flush_mmu(tlb, tlb->start_addr, tlb->end_addr);
}

static inline void tlb_remove_page(struct mmu_gather *tlb, struct page *page)
{
	if (!__tlb_remove_page(tlb, page))
		tlb_flush_mmu(tlb);
}

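/*
 * The return value of __tlb_remove_page() is the remaining capacity of the
 * gather array (tlb->max - tlb->nr), or a non-zero dummy in fast mode;
 * tlb_remove_page() treats 0 as "batch full" and drains it through
 * tlb_flush_mmu() before any further pages can be queued.
 */
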
/*
 * Remove TLB entry for PTE mapped at virtual address ADDRESS.  This is called for any
 * PTE, not just those pointing to (normal) physical memory.
 */
static inline void
__tlb_remove_tlb_entry (struct mmu_gather *tlb, pte_t *ptep, unsigned long address)
{
	if (tlb->start_addr == ~0UL)
		tlb->start_addr = address;
	tlb->end_addr = address + PAGE_SIZE;
}

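/*
 * Note that this range tracking assumes PTEs are removed in ascending
 * address order: start_addr latches the first address seen after a flush,
 * while end_addr simply follows the most recent one.
 */
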
#define tlb_migrate_finish(mm)	platform_tlb_migrate_finish(mm)

#define tlb_start_vma(tlb, vma)			do { } while (0)
#define tlb_end_vma(tlb, vma)			do { } while (0)

#define tlb_remove_tlb_entry(tlb, ptep, addr)		\
do {							\
	tlb->need_flush = 1;				\
	__tlb_remove_tlb_entry(tlb, ptep, addr);	\
} while (0)

#define pte_free_tlb(tlb, ptep, address)		\
do {							\
	tlb->need_flush = 1;				\
	__pte_free_tlb(tlb, ptep, address);		\
} while (0)

#define pmd_free_tlb(tlb, ptep, address)		\
do {							\
	tlb->need_flush = 1;				\
	__pmd_free_tlb(tlb, ptep, address);		\
} while (0)

#define pud_free_tlb(tlb, pudp, address)		\
do {							\
	tlb->need_flush = 1;				\
	__pud_free_tlb(tlb, pudp, address);		\
} while (0)

#endif /* _ASM_IA64_TLB_H */