]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blame - arch/x86/include/asm/pgtable_types.h
x86: require x86-64 for automatic NUMA balancing
[mirror_ubuntu-bionic-kernel.git] / arch / x86 / include / asm / pgtable_types.h
CommitLineData
8d19c99f
JF
1#ifndef _ASM_X86_PGTABLE_DEFS_H
2#define _ASM_X86_PGTABLE_DEFS_H
3
4#include <linux/const.h>
e43623b4 5#include <asm/page_types.h>
8d19c99f
JF
6
7#define FIRST_USER_ADDRESS 0
8
9#define _PAGE_BIT_PRESENT 0 /* is present */
10#define _PAGE_BIT_RW 1 /* writeable */
11#define _PAGE_BIT_USER 2 /* userspace addressable */
12#define _PAGE_BIT_PWT 3 /* page write through */
13#define _PAGE_BIT_PCD 4 /* page cache disabled */
14#define _PAGE_BIT_ACCESSED 5 /* was accessed (raised by CPU) */
15#define _PAGE_BIT_DIRTY 6 /* was written to (raised by CPU) */
16#define _PAGE_BIT_PSE 7 /* 4 MB (or 2MB) page */
17#define _PAGE_BIT_PAT 7 /* on 4KB pages */
18#define _PAGE_BIT_GLOBAL 8 /* Global TLB entry PPro+ */
19#define _PAGE_BIT_UNUSED1 9 /* available for programmer */
20#define _PAGE_BIT_IOMAP 10 /* flag used to indicate IO mapping */
dfec072e 21#define _PAGE_BIT_HIDDEN 11 /* hidden by kmemcheck */
8d19c99f
JF
22#define _PAGE_BIT_PAT_LARGE 12 /* On 2MB or 1GB pages */
23#define _PAGE_BIT_SPECIAL _PAGE_BIT_UNUSED1
24#define _PAGE_BIT_CPA_TEST _PAGE_BIT_UNUSED1
5f6e8da7 25#define _PAGE_BIT_SPLITTING _PAGE_BIT_UNUSED1 /* only valid on a PSE pmd */
8d19c99f
JF
26#define _PAGE_BIT_NX 63 /* No execute: only valid after cpuid check */
27
28/* If _PAGE_BIT_PRESENT is clear, we use these: */
29/* - if the user mapped it with PROT_NONE; pte_present gives true */
30#define _PAGE_BIT_PROTNONE _PAGE_BIT_GLOBAL
31/* - set: nonlinear file mapping, saved PTE; unset:swap */
32#define _PAGE_BIT_FILE _PAGE_BIT_DIRTY
33
34#define _PAGE_PRESENT (_AT(pteval_t, 1) << _PAGE_BIT_PRESENT)
35#define _PAGE_RW (_AT(pteval_t, 1) << _PAGE_BIT_RW)
36#define _PAGE_USER (_AT(pteval_t, 1) << _PAGE_BIT_USER)
37#define _PAGE_PWT (_AT(pteval_t, 1) << _PAGE_BIT_PWT)
38#define _PAGE_PCD (_AT(pteval_t, 1) << _PAGE_BIT_PCD)
39#define _PAGE_ACCESSED (_AT(pteval_t, 1) << _PAGE_BIT_ACCESSED)
40#define _PAGE_DIRTY (_AT(pteval_t, 1) << _PAGE_BIT_DIRTY)
41#define _PAGE_PSE (_AT(pteval_t, 1) << _PAGE_BIT_PSE)
42#define _PAGE_GLOBAL (_AT(pteval_t, 1) << _PAGE_BIT_GLOBAL)
43#define _PAGE_UNUSED1 (_AT(pteval_t, 1) << _PAGE_BIT_UNUSED1)
44#define _PAGE_IOMAP (_AT(pteval_t, 1) << _PAGE_BIT_IOMAP)
8d19c99f
JF
45#define _PAGE_PAT (_AT(pteval_t, 1) << _PAGE_BIT_PAT)
46#define _PAGE_PAT_LARGE (_AT(pteval_t, 1) << _PAGE_BIT_PAT_LARGE)
47#define _PAGE_SPECIAL (_AT(pteval_t, 1) << _PAGE_BIT_SPECIAL)
48#define _PAGE_CPA_TEST (_AT(pteval_t, 1) << _PAGE_BIT_CPA_TEST)
5f6e8da7 49#define _PAGE_SPLITTING (_AT(pteval_t, 1) << _PAGE_BIT_SPLITTING)
8d19c99f
JF
50#define __HAVE_ARCH_PTE_SPECIAL
51
9d31c506
JF
52#ifdef CONFIG_KMEMCHECK
53#define _PAGE_HIDDEN (_AT(pteval_t, 1) << _PAGE_BIT_HIDDEN)
54#else
55#define _PAGE_HIDDEN (_AT(pteval_t, 0))
56#endif
57
0f8975ec
PE
58/*
59 * The same hidden bit is used by kmemcheck, but since kmemcheck
60 * works on kernel pages while the soft-dirty engine works on user
61 * space pages, they do not conflict with each other.
62 */
63
41bb3476
CG
64#define _PAGE_BIT_SOFT_DIRTY _PAGE_BIT_HIDDEN
65
0f8975ec 66#ifdef CONFIG_MEM_SOFT_DIRTY
41bb3476 67#define _PAGE_SOFT_DIRTY (_AT(pteval_t, 1) << _PAGE_BIT_SOFT_DIRTY)
0f8975ec
PE
68#else
69#define _PAGE_SOFT_DIRTY (_AT(pteval_t, 0))
70#endif
71
179ef71c
CG
72/*
73 * Tracking the soft dirty bit when a page goes to swap is tricky.
74 * We need a bit which can be stored in the pte _and_ does not conflict
75 * with the swap entry format. On x86 bits 6 and 7 are *not* involved
76 * in swap entry computation, but bit 6 is used for nonlinear
77 * file mapping, so we borrow bit 7 for soft dirty tracking.
fa0f281c
CG
78 *
79 * Please note that this bit must be treated as swap dirty page
80 * mark if and only if the PTE has present bit clear!
179ef71c
CG
81 */
82#ifdef CONFIG_MEM_SOFT_DIRTY
83#define _PAGE_SWP_SOFT_DIRTY _PAGE_PSE
84#else
85#define _PAGE_SWP_SOFT_DIRTY (_AT(pteval_t, 0))
86#endif
87
8d19c99f
JF
88#if defined(CONFIG_X86_64) || defined(CONFIG_X86_PAE)
89#define _PAGE_NX (_AT(pteval_t, 1) << _PAGE_BIT_NX)
90#else
91#define _PAGE_NX (_AT(pteval_t, 0))
92#endif
93
94#define _PAGE_FILE (_AT(pteval_t, 1) << _PAGE_BIT_FILE)
95#define _PAGE_PROTNONE (_AT(pteval_t, 1) << _PAGE_BIT_PROTNONE)
96
dbe4d203
AA
97/*
98 * _PAGE_NUMA indicates that this page will trigger a numa hinting
99 * minor page fault to gather numa placement statistics (see
100 * pte_numa()). The bit picked (8) is within the range between
101 * _PAGE_FILE (6) and _PAGE_PROTNONE (8) bits. Therefore, it doesn't
102 * require changes to the swp entry format because that bit is always
103 * zero when the pte is not present.
104 *
105 * The bit picked must always be zero both when the pmd is present and
106 * when it is not present, so that we don't lose information when we set
107 * it while atomically clearing the present bit.
108 *
109 * Because we shared the same bit (8) with _PAGE_PROTNONE this can be
110 * interpreted as _PAGE_NUMA only in places that _PAGE_PROTNONE
111 * couldn't reach, like handle_mm_fault() (see access_error in
112 * arch/x86/mm/fault.c, the vma protection must not be PROT_NONE for
113 * handle_mm_fault() to be invoked).
114 */
115#define _PAGE_NUMA _PAGE_PROTNONE
116
8d19c99f
JF
117#define _PAGE_TABLE (_PAGE_PRESENT | _PAGE_RW | _PAGE_USER | \
118 _PAGE_ACCESSED | _PAGE_DIRTY)
119#define _KERNPG_TABLE (_PAGE_PRESENT | _PAGE_RW | _PAGE_ACCESSED | \
120 _PAGE_DIRTY)
121
122/* Set of bits not changed in pte_modify */
123#define _PAGE_CHG_MASK (PTE_PFN_MASK | _PAGE_PCD | _PAGE_PWT | \
24f91eba
AV
124 _PAGE_SPECIAL | _PAGE_ACCESSED | _PAGE_DIRTY | \
125 _PAGE_SOFT_DIRTY)
c489f125 126#define _HPAGE_CHG_MASK (_PAGE_CHG_MASK | _PAGE_PSE)
8d19c99f
JF
127
128#define _PAGE_CACHE_MASK (_PAGE_PCD | _PAGE_PWT)
129#define _PAGE_CACHE_WB (0)
130#define _PAGE_CACHE_WC (_PAGE_PWT)
131#define _PAGE_CACHE_UC_MINUS (_PAGE_PCD)
132#define _PAGE_CACHE_UC (_PAGE_PCD | _PAGE_PWT)
133
134#define PAGE_NONE __pgprot(_PAGE_PROTNONE | _PAGE_ACCESSED)
135#define PAGE_SHARED __pgprot(_PAGE_PRESENT | _PAGE_RW | _PAGE_USER | \
136 _PAGE_ACCESSED | _PAGE_NX)
137
138#define PAGE_SHARED_EXEC __pgprot(_PAGE_PRESENT | _PAGE_RW | \
139 _PAGE_USER | _PAGE_ACCESSED)
140#define PAGE_COPY_NOEXEC __pgprot(_PAGE_PRESENT | _PAGE_USER | \
141 _PAGE_ACCESSED | _PAGE_NX)
142#define PAGE_COPY_EXEC __pgprot(_PAGE_PRESENT | _PAGE_USER | \
143 _PAGE_ACCESSED)
144#define PAGE_COPY PAGE_COPY_NOEXEC
145#define PAGE_READONLY __pgprot(_PAGE_PRESENT | _PAGE_USER | \
146 _PAGE_ACCESSED | _PAGE_NX)
147#define PAGE_READONLY_EXEC __pgprot(_PAGE_PRESENT | _PAGE_USER | \
148 _PAGE_ACCESSED)
149
150#define __PAGE_KERNEL_EXEC \
151 (_PAGE_PRESENT | _PAGE_RW | _PAGE_DIRTY | _PAGE_ACCESSED | _PAGE_GLOBAL)
152#define __PAGE_KERNEL (__PAGE_KERNEL_EXEC | _PAGE_NX)
153
154#define __PAGE_KERNEL_RO (__PAGE_KERNEL & ~_PAGE_RW)
155#define __PAGE_KERNEL_RX (__PAGE_KERNEL_EXEC & ~_PAGE_RW)
156#define __PAGE_KERNEL_EXEC_NOCACHE (__PAGE_KERNEL_EXEC | _PAGE_PCD | _PAGE_PWT)
157#define __PAGE_KERNEL_WC (__PAGE_KERNEL | _PAGE_CACHE_WC)
158#define __PAGE_KERNEL_NOCACHE (__PAGE_KERNEL | _PAGE_PCD | _PAGE_PWT)
159#define __PAGE_KERNEL_UC_MINUS (__PAGE_KERNEL | _PAGE_PCD)
160#define __PAGE_KERNEL_VSYSCALL (__PAGE_KERNEL_RX | _PAGE_USER)
9fd67b4e 161#define __PAGE_KERNEL_VVAR (__PAGE_KERNEL_RO | _PAGE_USER)
d319bb79 162#define __PAGE_KERNEL_VVAR_NOCACHE (__PAGE_KERNEL_VVAR | _PAGE_PCD | _PAGE_PWT)
8d19c99f
JF
163#define __PAGE_KERNEL_LARGE (__PAGE_KERNEL | _PAGE_PSE)
164#define __PAGE_KERNEL_LARGE_NOCACHE (__PAGE_KERNEL | _PAGE_CACHE_UC | _PAGE_PSE)
165#define __PAGE_KERNEL_LARGE_EXEC (__PAGE_KERNEL_EXEC | _PAGE_PSE)
166
167#define __PAGE_KERNEL_IO (__PAGE_KERNEL | _PAGE_IOMAP)
168#define __PAGE_KERNEL_IO_NOCACHE (__PAGE_KERNEL_NOCACHE | _PAGE_IOMAP)
169#define __PAGE_KERNEL_IO_UC_MINUS (__PAGE_KERNEL_UC_MINUS | _PAGE_IOMAP)
170#define __PAGE_KERNEL_IO_WC (__PAGE_KERNEL_WC | _PAGE_IOMAP)
171
172#define PAGE_KERNEL __pgprot(__PAGE_KERNEL)
173#define PAGE_KERNEL_RO __pgprot(__PAGE_KERNEL_RO)
174#define PAGE_KERNEL_EXEC __pgprot(__PAGE_KERNEL_EXEC)
175#define PAGE_KERNEL_RX __pgprot(__PAGE_KERNEL_RX)
176#define PAGE_KERNEL_WC __pgprot(__PAGE_KERNEL_WC)
177#define PAGE_KERNEL_NOCACHE __pgprot(__PAGE_KERNEL_NOCACHE)
178#define PAGE_KERNEL_UC_MINUS __pgprot(__PAGE_KERNEL_UC_MINUS)
179#define PAGE_KERNEL_EXEC_NOCACHE __pgprot(__PAGE_KERNEL_EXEC_NOCACHE)
180#define PAGE_KERNEL_LARGE __pgprot(__PAGE_KERNEL_LARGE)
181#define PAGE_KERNEL_LARGE_NOCACHE __pgprot(__PAGE_KERNEL_LARGE_NOCACHE)
182#define PAGE_KERNEL_LARGE_EXEC __pgprot(__PAGE_KERNEL_LARGE_EXEC)
183#define PAGE_KERNEL_VSYSCALL __pgprot(__PAGE_KERNEL_VSYSCALL)
9fd67b4e 184#define PAGE_KERNEL_VVAR __pgprot(__PAGE_KERNEL_VVAR)
d319bb79 185#define PAGE_KERNEL_VVAR_NOCACHE __pgprot(__PAGE_KERNEL_VVAR_NOCACHE)
8d19c99f
JF
186
187#define PAGE_KERNEL_IO __pgprot(__PAGE_KERNEL_IO)
188#define PAGE_KERNEL_IO_NOCACHE __pgprot(__PAGE_KERNEL_IO_NOCACHE)
189#define PAGE_KERNEL_IO_UC_MINUS __pgprot(__PAGE_KERNEL_IO_UC_MINUS)
190#define PAGE_KERNEL_IO_WC __pgprot(__PAGE_KERNEL_IO_WC)
191
192/* xwr */
193#define __P000 PAGE_NONE
194#define __P001 PAGE_READONLY
195#define __P010 PAGE_COPY
196#define __P011 PAGE_COPY
197#define __P100 PAGE_READONLY_EXEC
198#define __P101 PAGE_READONLY_EXEC
199#define __P110 PAGE_COPY_EXEC
200#define __P111 PAGE_COPY_EXEC
201
202#define __S000 PAGE_NONE
203#define __S001 PAGE_READONLY
204#define __S010 PAGE_SHARED
205#define __S011 PAGE_SHARED
206#define __S100 PAGE_READONLY_EXEC
207#define __S101 PAGE_READONLY_EXEC
208#define __S110 PAGE_SHARED_EXEC
209#define __S111 PAGE_SHARED_EXEC
210
211/*
212 * early identity mapping pte attrib macros.
213 */
214#ifdef CONFIG_X86_64
215#define __PAGE_KERNEL_IDENT_LARGE_EXEC __PAGE_KERNEL_LARGE_EXEC
216#else
8d19c99f 217#define PTE_IDENT_ATTR 0x003 /* PRESENT+RW */
7dda0387 218#define PDE_IDENT_ATTR 0x063 /* PRESENT+RW+DIRTY+ACCESSED */
8d19c99f
JF
219#define PGD_IDENT_ATTR 0x001 /* PRESENT (no other attributes) */
220#endif
221
54321d94 222#ifdef CONFIG_X86_32
a1ce3928 223# include <asm/pgtable_32_types.h>
54321d94 224#else
a1ce3928 225# include <asm/pgtable_64_types.h>
54321d94
JF
226#endif
227
8d19c99f
JF
228#ifndef __ASSEMBLY__
229
54321d94
JF
230#include <linux/types.h>
231
9b3651cb
JF
232/* PTE_PFN_MASK extracts the PFN from a (pte|pmd|pud|pgd)val_t */
233#define PTE_PFN_MASK ((pteval_t)PHYSICAL_PAGE_MASK)
234
235/* PTE_FLAGS_MASK extracts the flags from a (pte|pmd|pud|pgd)val_t */
236#define PTE_FLAGS_MASK (~PTE_PFN_MASK)
237
54321d94
JF
238typedef struct pgprot { pgprotval_t pgprot; } pgprot_t;
239
240typedef struct { pgdval_t pgd; } pgd_t;
241
242static inline pgd_t native_make_pgd(pgdval_t val)
243{
244 return (pgd_t) { val };
245}
246
247static inline pgdval_t native_pgd_val(pgd_t pgd)
248{
249 return pgd.pgd;
250}
251
252static inline pgdval_t pgd_flags(pgd_t pgd)
253{
254 return native_pgd_val(pgd) & PTE_FLAGS_MASK;
255}
256
257#if PAGETABLE_LEVELS > 3
258typedef struct { pudval_t pud; } pud_t;
259
260static inline pud_t native_make_pud(pmdval_t val)
261{
262 return (pud_t) { val };
263}
264
265static inline pudval_t native_pud_val(pud_t pud)
266{
267 return pud.pud;
268}
269#else
270#include <asm-generic/pgtable-nopud.h>
271
272static inline pudval_t native_pud_val(pud_t pud)
273{
274 return native_pgd_val(pud.pgd);
275}
276#endif
277
278#if PAGETABLE_LEVELS > 2
279typedef struct { pmdval_t pmd; } pmd_t;
280
281static inline pmd_t native_make_pmd(pmdval_t val)
282{
283 return (pmd_t) { val };
284}
285
286static inline pmdval_t native_pmd_val(pmd_t pmd)
287{
288 return pmd.pmd;
289}
290#else
291#include <asm-generic/pgtable-nopmd.h>
292
293static inline pmdval_t native_pmd_val(pmd_t pmd)
294{
295 return native_pgd_val(pmd.pud.pgd);
296}
297#endif
298
299static inline pudval_t pud_flags(pud_t pud)
300{
301 return native_pud_val(pud) & PTE_FLAGS_MASK;
302}
303
304static inline pmdval_t pmd_flags(pmd_t pmd)
305{
306 return native_pmd_val(pmd) & PTE_FLAGS_MASK;
307}
308
309static inline pte_t native_make_pte(pteval_t val)
310{
311 return (pte_t) { .pte = val };
312}
313
314static inline pteval_t native_pte_val(pte_t pte)
315{
316 return pte.pte;
317}
318
319static inline pteval_t pte_flags(pte_t pte)
320{
321 return native_pte_val(pte) & PTE_FLAGS_MASK;
322}
323
324#define pgprot_val(x) ((x).pgprot)
325#define __pgprot(x) ((pgprot_t) { (x) } )
326
327
328typedef struct page *pgtable_t;
329
8d19c99f 330extern pteval_t __supported_pte_mask;
c44c9ec0 331extern void set_nx(void);
54321d94 332extern int nx_enabled;
8d19c99f
JF
333
334#define pgprot_writecombine pgprot_writecombine
335extern pgprot_t pgprot_writecombine(pgprot_t prot);
336
337/* Indicate that x86 has its own track and untrack pfn vma functions */
338#define __HAVE_PFNMAP_TRACKING
339
340#define __HAVE_PHYS_MEM_ACCESS_PROT
341struct file;
342pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,
343 unsigned long size, pgprot_t vma_prot);
344int phys_mem_access_prot_allowed(struct file *file, unsigned long pfn,
345 unsigned long size, pgprot_t *vma_prot);
346
347/* Install a pte for a particular vaddr in kernel space. */
348void set_pte_vaddr(unsigned long vaddr, pte_t pte);
349
350#ifdef CONFIG_X86_32
7737b215 351extern void native_pagetable_init(void);
8d19c99f 352#else
843b8ed2 353#define native_pagetable_init paging_init
8d19c99f
JF
354#endif
355
356struct seq_file;
357extern void arch_report_meminfo(struct seq_file *m);
358
/*
 * Identifiers for page-mapping levels.  The values are consecutive
 * starting at zero, so PG_LEVEL_NUM equals the number of enumerators
 * that precede it.
 */
enum pg_level {
	PG_LEVEL_NONE = 0,
	PG_LEVEL_4K   = 1,
	PG_LEVEL_2M   = 2,
	PG_LEVEL_1G   = 3,
	PG_LEVEL_NUM  = 4,
};
366
/*
 * update_page_count(): with CONFIG_PROC_FS the function is only declared
 * here and defined elsewhere; without it, calls resolve to the empty
 * inline stub below.
 */
#ifndef CONFIG_PROC_FS
static inline void update_page_count(int level, unsigned long pages)
{
}
#else
extern void update_page_count(int level, unsigned long pages);
#endif
372
373/*
374 * Helper function that returns the kernel pagetable entry controlling
375 * the virtual address 'address'. NULL means no pagetable entry present.
376 * NOTE: the return type is pte_t but if the pmd is PSE then we return it
377 * as a pte too.
378 */
379extern pte_t *lookup_address(unsigned long address, unsigned int *level);
426e34cc
MF
380extern pte_t *lookup_address_in_pgd(pgd_t *pgd, unsigned long address,
381 unsigned int *level);
d7656534 382extern phys_addr_t slow_virt_to_phys(void *__address);
d2f7cbe7
BP
383extern int kernel_map_pages_in_pgd(pgd_t *pgd, u64 pfn, unsigned long address,
384 unsigned numpages, unsigned long page_flags);
42a54772
BP
385void kernel_unmap_pages_in_pgd(pgd_t *root, unsigned long address,
386 unsigned numpages);
8d19c99f
JF
387#endif /* !__ASSEMBLY__ */
388
389#endif /* _ASM_X86_PGTABLE_DEFS_H */