]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - mm/Kconfig
mm/mmap.c: don't unlock VMAs in remap_file_pages()
[mirror_ubuntu-jammy-kernel.git] / mm / Kconfig
CommitLineData
ec8f24b7 1# SPDX-License-Identifier: GPL-2.0-only
59e0b520
CH
2
3menu "Memory Management options"
4
e1785e85
DH
5config SELECT_MEMORY_MODEL
6 def_bool y
a8826eeb 7 depends on ARCH_SELECT_MEMORY_MODEL
e1785e85 8
3a9da765
DH
9choice
10 prompt "Memory model"
e1785e85 11 depends on SELECT_MEMORY_MODEL
d41dee36 12 default SPARSEMEM_MANUAL if ARCH_SPARSEMEM_DEFAULT
e1785e85 13 default FLATMEM_MANUAL
d66d109d
MR
14 help
15 This option allows you to change some of the ways that
16 Linux manages its memory internally. Most users will
17 only have one option here selected by the architecture
18 configuration. This is normal.
3a9da765 19
e1785e85 20config FLATMEM_MANUAL
3a9da765 21 bool "Flat Memory"
c898ec16 22 depends on !(ARCH_DISCONTIGMEM_ENABLE || ARCH_SPARSEMEM_ENABLE) || ARCH_FLATMEM_ENABLE
3a9da765 23 help
d66d109d
MR
24 This option is best suited for non-NUMA systems with
25 flat address space. The FLATMEM is the most efficient
26 system in terms of performance and resource consumption
27 and it is the best option for smaller systems.
28
29 For systems that have holes in their physical address
30 spaces and for features like NUMA and memory hotplug,
dd33d29a 31 choose "Sparse Memory".
d41dee36
AW
32
33 If unsure, choose this option (Flat Memory) over any other.
3a9da765 34
e1785e85 35config DISCONTIGMEM_MANUAL
f3519f91 36 bool "Discontiguous Memory"
3a9da765
DH
37 depends on ARCH_DISCONTIGMEM_ENABLE
38 help
785dcd44
DH
39 This option provides enhanced support for discontiguous
40 memory systems, over FLATMEM. These systems have holes
41 in their physical address spaces, and this option provides
d66d109d 42 more efficient handling of these holes.
785dcd44 43
d66d109d
MR
44 Although "Discontiguous Memory" is still used by several
45 architectures, it is considered deprecated in favor of
46 "Sparse Memory".
785dcd44 47
d66d109d 48 If unsure, choose "Sparse Memory" over this option.
3a9da765 49
d41dee36
AW
50config SPARSEMEM_MANUAL
51 bool "Sparse Memory"
52 depends on ARCH_SPARSEMEM_ENABLE
53 help
54 This will be the only option for some systems, including
d66d109d 55 memory hot-plug systems. This is normal.
d41dee36 56
d66d109d
MR
57 This option provides efficient support for systems with
58 holes in their physical address space and allows memory
59 hot-plug and hot-remove.
d41dee36 60
d66d109d 61 If unsure, choose "Flat Memory" over this option.
d41dee36 62
3a9da765
DH
63endchoice
64
e1785e85
DH
65config DISCONTIGMEM
66 def_bool y
67 depends on (!SELECT_MEMORY_MODEL && ARCH_DISCONTIGMEM_ENABLE) || DISCONTIGMEM_MANUAL
68
d41dee36
AW
69config SPARSEMEM
70 def_bool y
1a83e175 71 depends on (!SELECT_MEMORY_MODEL && ARCH_SPARSEMEM_ENABLE) || SPARSEMEM_MANUAL
d41dee36 72
e1785e85
DH
73config FLATMEM
74 def_bool y
d41dee36
AW
75 depends on (!DISCONTIGMEM && !SPARSEMEM) || FLATMEM_MANUAL
76
77config FLAT_NODE_MEM_MAP
78 def_bool y
79 depends on !SPARSEMEM
e1785e85 80
93b7504e
DH
81#
82# Both the NUMA code and DISCONTIGMEM use arrays of pg_data_t's
83# to represent different areas of memory. This variable allows
84# those dependencies to exist individually.
85#
86config NEED_MULTIPLE_NODES
87 def_bool y
88 depends on DISCONTIGMEM || NUMA
af705362 89
3e347261
BP
90#
91# SPARSEMEM_EXTREME (which is the default) does some bootmem
c89ab04f 92# allocations when sparse_init() is called. If this cannot
3e347261
BP
93# be done on your architecture, select this option. However,
94# statically allocating the mem_section[] array can potentially
95# consume vast quantities of .bss, so be careful.
96#
97# This option will also potentially produce smaller runtime code
98# with gcc 3.4 and later.
99#
100config SPARSEMEM_STATIC
9ba16087 101 bool
3e347261 102
802f192e 103#
44c09201 104# Architecture platforms which require a two level mem_section in SPARSEMEM
802f192e
BP
105# must select this option. This is usually for architecture platforms with
106# an extremely sparse physical address space.
107#
3e347261
BP
108config SPARSEMEM_EXTREME
109 def_bool y
110 depends on SPARSEMEM && !SPARSEMEM_STATIC
4c21e2f2 111
29c71111 112config SPARSEMEM_VMEMMAP_ENABLE
9ba16087 113 bool
29c71111
AW
114
115config SPARSEMEM_VMEMMAP
a5ee6daa
GL
116 bool "Sparse Memory virtual memmap"
117 depends on SPARSEMEM && SPARSEMEM_VMEMMAP_ENABLE
118 default y
119 help
19fa40a0
KK
120 SPARSEMEM_VMEMMAP uses a virtually mapped memmap to optimise
121 pfn_to_page and page_to_pfn operations. This is the most
122 efficient option when sufficient kernel resources are available.
29c71111 123
70210ed9 124config HAVE_MEMBLOCK_PHYS_MAP
6341e62b 125 bool
70210ed9 126
67a929e0 127config HAVE_FAST_GUP
050a9adc 128 depends on MMU
6341e62b 129 bool
2667f50e 130
52219aea
DH
131# Don't discard allocated memory used to track "memory" and "reserved" memblocks
132# after early boot, so it can still be used to test for validity of memory.
133# Also, memblocks are updated with memory hot(un)plug.
350e88ba 134config ARCH_KEEP_MEMBLOCK
6341e62b 135 bool
c378ddd5 136
1e5d8e1e
DW
137# Keep arch NUMA mapping infrastructure post-init.
138config NUMA_KEEP_MEMINFO
139 bool
140
ee6f509c 141config MEMORY_ISOLATION
6341e62b 142 bool
ee6f509c 143
46723bfa
YI
144#
145# Only be set on architectures that have completely implemented memory hotplug
146# feature. If you are not sure, don't touch it.
147#
148config HAVE_BOOTMEM_INFO_NODE
149 def_bool n
150
3947be19
DH
151# eventually, we can have this option just 'select SPARSEMEM'
152config MEMORY_HOTPLUG
153 bool "Allow for memory hot-add"
b30c5927 154 select MEMORY_ISOLATION
ec69acbb 155 depends on SPARSEMEM || X86_64_ACPI_NUMA
40b31360 156 depends on ARCH_ENABLE_MEMORY_HOTPLUG
b59d02ed 157 depends on 64BIT || BROKEN
1e5d8e1e 158 select NUMA_KEEP_MEMINFO if NUMA
3947be19 159
ec69acbb
KM
160config MEMORY_HOTPLUG_SPARSE
161 def_bool y
162 depends on SPARSEMEM && MEMORY_HOTPLUG
163
8604d9e5 164config MEMORY_HOTPLUG_DEFAULT_ONLINE
19fa40a0
KK
165 bool "Online the newly added memory blocks by default"
166 depends on MEMORY_HOTPLUG
167 help
8604d9e5
VK
168 This option sets the default policy setting for memory hotplug
169 onlining policy (/sys/devices/system/memory/auto_online_blocks) which
170 determines what happens to newly added memory regions. Policy setting
171 can always be changed at runtime.
cb1aaebe 172 See Documentation/admin-guide/mm/memory-hotplug.rst for more information.
8604d9e5
VK
173
174 Say Y here if you want all hot-plugged memory blocks to appear in
175 'online' state by default.
176 Say N here if you want the default policy to keep all hot-plugged
177 memory blocks in 'offline' state.
178
0c0e6195
KH
179config MEMORY_HOTREMOVE
180 bool "Allow for memory hot remove"
f7e3334a 181 select HAVE_BOOTMEM_INFO_NODE if (X86_64 || PPC64)
0c0e6195
KH
182 depends on MEMORY_HOTPLUG && ARCH_ENABLE_MEMORY_HOTREMOVE
183 depends on MIGRATION
184
4c21e2f2
HD
185# Heavily threaded applications may benefit from splitting the mm-wide
186# page_table_lock, so that faults on different parts of the user address
187# space can be handled with less contention: split it at this NR_CPUS.
188# Default to 4 for wider testing, though 8 might be more appropriate.
189# ARM's adjust_pte (unused if VIPT) depends on mm-wide page_table_lock.
7b6ac9df 190# PA-RISC 7xxx's spinlock_t would enlarge struct page from 32 to 44 bytes.
60bccaa6
WD
191# SPARC32 allocates multiple pte tables within a single page, and therefore
192# a per-page lock leads to problems when multiple tables need to be locked
193# at the same time (e.g. copy_page_range()).
a70caa8b 194# DEBUG_SPINLOCK and DEBUG_LOCK_ALLOC spinlock_t also enlarge struct page.
4c21e2f2
HD
195#
196config SPLIT_PTLOCK_CPUS
197 int
9164550e 198 default "999999" if !MMU
a70caa8b
HD
199 default "999999" if ARM && !CPU_CACHE_VIPT
200 default "999999" if PARISC && !PA20
60bccaa6 201 default "999999" if SPARC32
4c21e2f2 202 default "4"
7cbe34cf 203
e009bb30 204config ARCH_ENABLE_SPLIT_PMD_PTLOCK
6341e62b 205 bool
e009bb30 206
09316c09
KK
207#
208# support for memory balloon
209config MEMORY_BALLOON
6341e62b 210 bool
09316c09 211
18468d93
RA
212#
213# support for memory balloon compaction
214config BALLOON_COMPACTION
215 bool "Allow for balloon memory compaction/migration"
216 def_bool y
09316c09 217 depends on COMPACTION && MEMORY_BALLOON
18468d93
RA
218 help
219 Memory fragmentation introduced by ballooning might reduce
220 significantly the number of 2MB contiguous memory blocks that can be
221 used within a guest, thus imposing performance penalties associated
222 with the reduced number of transparent huge pages that could be used
223 by the guest workload. Allowing the compaction & migration for memory
224 pages enlisted as being part of memory balloon devices avoids the
225 scenario aforementioned and helps improve memory defragmentation.
226
e9e96b39
MG
227#
228# support for memory compaction
229config COMPACTION
230 bool "Allow for memory compaction"
05106e6a 231 def_bool y
e9e96b39 232 select MIGRATION
33a93877 233 depends on MMU
e9e96b39 234 help
19fa40a0
KK
235 Compaction is the only memory management component to form
236 high order (larger physically contiguous) memory blocks
237 reliably. The page allocator relies on compaction heavily and
238 the lack of the feature can lead to unexpected OOM killer
239 invocations for high order memory requests. You shouldn't
240 disable this option unless there really is a strong reason for
241 it and then we would be really interested to hear about that at
242 linux-mm@kvack.org.
e9e96b39 243
36e66c55
AD
244#
245# support for free page reporting
246config PAGE_REPORTING
247 bool "Free page reporting"
248 def_bool n
249 help
250 Free page reporting allows for the incremental acquisition of
251 free pages from the buddy allocator for the purpose of reporting
252 those pages to another entity, such as a hypervisor, so that the
253 memory can be freed within the host for other uses.
254
7cbe34cf
CL
255#
256# support for page migration
257#
258config MIGRATION
b20a3503 259 bool "Page migration"
6c5240ae 260 def_bool y
de32a817 261 depends on (NUMA || ARCH_ENABLE_MEMORY_HOTREMOVE || COMPACTION || CMA) && MMU
b20a3503
CL
262 help
263 Allows the migration of the physical location of pages of processes
e9e96b39
MG
264 while the virtual addresses are not changed. This is useful in
265 two situations. The first is on NUMA systems to put pages nearer
266 to the processors accessing them. The second is when allocating huge
267 pages as migration can relocate pages to satisfy a huge page
268 allocation instead of reclaiming.
6550e07f 269
c177c81e 270config ARCH_ENABLE_HUGEPAGE_MIGRATION
6341e62b 271 bool
c177c81e 272
9c670ea3
NH
273config ARCH_ENABLE_THP_MIGRATION
274 bool
275
4bfb68a0
AK
276config HUGETLB_PAGE_SIZE_VARIABLE
277 def_bool n
278 help
279 Allows the pageblock_order value to be dynamic instead of just standard
280 HUGETLB_PAGE_ORDER when there are multiple HugeTLB page sizes available
281 on a platform.
282
8df995f6 283config CONTIG_ALLOC
19fa40a0 284 def_bool (MEMORY_ISOLATION && COMPACTION) || CMA
8df995f6 285
600715dc 286config PHYS_ADDR_T_64BIT
d4a451d5 287 def_bool 64BIT
600715dc 288
2a7326b5 289config BOUNCE
9ca24e2e
VM
290 bool "Enable bounce buffers"
291 default y
ce288e05 292 depends on BLOCK && MMU && HIGHMEM
9ca24e2e 293 help
ce288e05
CH
294 Enable bounce buffers for devices that cannot access the full range of
295 memory available to the CPU. Enabled by default when HIGHMEM is
296 selected, but you may say n to override this.
2a7326b5 297
f057eac0 298config VIRT_TO_BUS
4febd95a
SR
299 bool
300 help
301 An architecture should select this if it implements the
302 deprecated interface virt_to_bus(). All new architectures
303 should probably not select this.
304
cddb8a5c
AA
305
306config MMU_NOTIFIER
307 bool
83fe27ea 308 select SRCU
99cb252f 309 select INTERVAL_TREE
fc4d5c29 310
f8af4da3
HD
311config KSM
312 bool "Enable KSM for page merging"
313 depends on MMU
59e1a2f4 314 select XXHASH
f8af4da3
HD
315 help
316 Enable Kernel Samepage Merging: KSM periodically scans those areas
317 of an application's address space that an app has advised may be
318 mergeable. When it finds pages of identical content, it replaces
d0f209f6 319 the many instances by a single page with that content, so
f8af4da3
HD
320 saving memory until one or another app needs to modify the content.
321 Recommended for use with KVM, or with other duplicative applications.
ad56b738 322 See Documentation/vm/ksm.rst for more information: KSM is inactive
c73602ad
HD
323 until a program has madvised that an area is MADV_MERGEABLE, and
324 root has set /sys/kernel/mm/ksm/run to 1 (if CONFIG_SYSFS is set).
f8af4da3 325
e0a94c2a 326config DEFAULT_MMAP_MIN_ADDR
19fa40a0 327 int "Low address space to protect from user allocation"
6e141546 328 depends on MMU
19fa40a0
KK
329 default 4096
330 help
e0a94c2a
CL
331 This is the portion of low virtual memory which should be protected
332 from userspace allocation. Keeping a user from writing to low pages
333 can help reduce the impact of kernel NULL pointer bugs.
334
335 For most ia64, ppc64 and x86 users with lots of address space
336 a value of 65536 is reasonable and should cause no problems.
337 On arm and other archs it should not be higher than 32768.
788084ab
EP
338 Programs which use vm86 functionality or have some need to map
339 this low address space will need CAP_SYS_RAWIO or disable this
340 protection by setting the value to 0.
e0a94c2a
CL
341
342 This value can be changed after boot using the
343 /proc/sys/vm/mmap_min_addr tunable.
344
d949f36f
LT
345config ARCH_SUPPORTS_MEMORY_FAILURE
346 bool
e0a94c2a 347
6a46079c
AK
348config MEMORY_FAILURE
349 depends on MMU
d949f36f 350 depends on ARCH_SUPPORTS_MEMORY_FAILURE
6a46079c 351 bool "Enable recovery from hardware memory errors"
ee6f509c 352 select MEMORY_ISOLATION
97f0b134 353 select RAS
6a46079c
AK
354 help
355 Enables code to recover from some memory failures on systems
356 with MCA recovery. This allows a system to continue running
357 even when some of its memory has uncorrected errors. This requires
358 special hardware support and typically ECC memory.
359
cae681fc 360config HWPOISON_INJECT
413f9efb 361 tristate "HWPoison pages injector"
27df5068 362 depends on MEMORY_FAILURE && DEBUG_KERNEL && PROC_FS
478c5ffc 363 select PROC_PAGE_MONITOR
cae681fc 364
fc4d5c29
DH
365config NOMMU_INITIAL_TRIM_EXCESS
366 int "Turn on mmap() excess space trimming before booting"
367 depends on !MMU
368 default 1
369 help
370 The NOMMU mmap() frequently needs to allocate large contiguous chunks
371 of memory on which to store mappings, but it can only ask the system
372 allocator for chunks in 2^N*PAGE_SIZE amounts - which is frequently
373 more than it requires. To deal with this, mmap() is able to trim off
374 the excess and return it to the allocator.
375
376 If trimming is enabled, the excess is trimmed off and returned to the
377 system allocator, which can cause extra fragmentation, particularly
378 if there are a lot of transient processes.
379
380 If trimming is disabled, the excess is kept, but not used, which for
381 long-term mappings means that the space is wasted.
382
383 Trimming can be dynamically controlled through a sysctl option
384 (/proc/sys/vm/nr_trim_pages) which specifies the minimum number of
385 excess pages there must be before trimming should occur, or zero if
386 no trimming is to occur.
387
388 This option specifies the initial value of this option. The default
389 of 1 says that all excess pages should be trimmed.
390
dd19d293 391 See Documentation/admin-guide/mm/nommu-mmap.rst for more information.
bbddff05 392
4c76d9d1 393config TRANSPARENT_HUGEPAGE
13ece886 394 bool "Transparent Hugepage Support"
15626062 395 depends on HAVE_ARCH_TRANSPARENT_HUGEPAGE
5d689240 396 select COMPACTION
3a08cd52 397 select XARRAY_MULTI
4c76d9d1
AA
398 help
399 Transparent Hugepages allows the kernel to use huge pages and
400 huge tlb transparently to the applications whenever possible.
401 This feature can improve computing performance to certain
402 applications by speeding up page faults during memory
403 allocation, by reducing the number of tlb misses and by speeding
404 up the pagetable walking.
405
406 If memory constrained on embedded, you may want to say N.
407
13ece886
AA
408choice
409 prompt "Transparent Hugepage Support sysfs defaults"
410 depends on TRANSPARENT_HUGEPAGE
411 default TRANSPARENT_HUGEPAGE_ALWAYS
412 help
413 Selects the sysfs defaults for Transparent Hugepage Support.
414
415 config TRANSPARENT_HUGEPAGE_ALWAYS
416 bool "always"
417 help
418 Enabling Transparent Hugepage always, can increase the
419 memory footprint of applications without a guaranteed
420 benefit but it will work automatically for all applications.
421
422 config TRANSPARENT_HUGEPAGE_MADVISE
423 bool "madvise"
424 help
425 Enabling Transparent Hugepage madvise, will only provide a
426 performance improvement benefit to the applications using
427 madvise(MADV_HUGEPAGE) but it won't risk to increase the
428 memory footprint of applications without a guaranteed
429 benefit.
430endchoice
431
38d8b4e6 432config ARCH_WANTS_THP_SWAP
19fa40a0 433 def_bool n
38d8b4e6
HY
434
435config THP_SWAP
436 def_bool y
14fef284 437 depends on TRANSPARENT_HUGEPAGE && ARCH_WANTS_THP_SWAP && SWAP
38d8b4e6
HY
438 help
439 Swap transparent huge pages in one piece, without splitting.
14fef284
HY
440 XXX: For now, swap cluster backing transparent huge page
441 will be split after swapout.
38d8b4e6
HY
442
443 For selection by architectures with reasonable THP sizes.
444
bbddff05
TH
445#
446# UP and nommu archs use km based percpu allocator
447#
448config NEED_PER_CPU_KM
449 depends on !SMP
450 bool
451 default y
077b1f83
DM
452
453config CLEANCACHE
454 bool "Enable cleancache driver to cache clean pages if tmem is present"
077b1f83
DM
455 help
456 Cleancache can be thought of as a page-granularity victim cache
457 for clean pages that the kernel's pageframe replacement algorithm
458 (PFRA) would like to keep around, but can't since there isn't enough
459 memory. So when the PFRA "evicts" a page, it first attempts to use
140a1ef2 460 cleancache code to put the data contained in that page into
077b1f83
DM
461 "transcendent memory", memory that is not directly accessible or
462 addressable by the kernel and is of unknown and possibly
463 time-varying size. And when a cleancache-enabled
464 filesystem wishes to access a page in a file on disk, it first
465 checks cleancache to see if it already contains it; if it does,
466 the page is copied into the kernel and a disk access is avoided.
467 When a transcendent memory driver is available (such as zcache or
468 Xen transcendent memory), a significant I/O reduction
469 may be achieved. When none is available, all cleancache calls
470 are reduced to a single pointer-compare-against-NULL resulting
471 in a negligible performance hit.
472
473 If unsure, say Y to enable cleancache.
27c6aec2
DM
474
475config FRONTSWAP
476 bool "Enable frontswap to cache swap pages if tmem is present"
477 depends on SWAP
27c6aec2
DM
478 help
479 Frontswap is so named because it can be thought of as the opposite
480 of a "backing" store for a swap device. The data is stored into
481 "transcendent memory", memory that is not directly accessible or
482 addressable by the kernel and is of unknown and possibly
483 time-varying size. When space in transcendent memory is available,
484 a significant swap I/O reduction may be achieved. When none is
485 available, all frontswap calls are reduced to a single pointer-
486 compare-against-NULL resulting in a negligible performance hit
487 and swap data is stored as normal on the matching swap device.
488
489 If unsure, say Y to enable frontswap.
f825c736
AK
490
491config CMA
492 bool "Contiguous Memory Allocator"
aca52c39 493 depends on MMU
f825c736
AK
494 select MIGRATION
495 select MEMORY_ISOLATION
496 help
497 This enables the Contiguous Memory Allocator which allows other
498 subsystems to allocate big physically-contiguous blocks of memory.
499 CMA reserves a region of memory and allows only movable pages to
500 be allocated from it. This way, the kernel can use the memory for
501 pagecache and when a subsystem requests for contiguous area, the
502 allocated pages are migrated away to serve the contiguous request.
503
504 If unsure, say "n".
505
506config CMA_DEBUG
507 bool "CMA debug messages (DEVELOPMENT)"
508 depends on DEBUG_KERNEL && CMA
509 help
510 Turns on debug messages in CMA. This produces KERN_DEBUG
511 messages for every CMA call as well as various messages while
512 processing calls such as dma_alloc_from_contiguous().
513 This option does not affect warning and error messages.
bf550fc9 514
28b24c1f
SL
515config CMA_DEBUGFS
516 bool "CMA debugfs interface"
517 depends on CMA && DEBUG_FS
518 help
519 Turns on the DebugFS interface for CMA.
520
43ca106f
MK
521config CMA_SYSFS
522 bool "CMA information through sysfs interface"
523 depends on CMA && SYSFS
524 help
525 This option exposes some sysfs attributes to get information
526 from CMA.
527
a254129e
JK
528config CMA_AREAS
529 int "Maximum count of the CMA areas"
530 depends on CMA
b7176c26 531 default 19 if NUMA
a254129e
JK
532 default 7
533 help
534 CMA allows creating CMA areas for a particular purpose, mainly
535 for use as a device private area. This parameter sets the maximum
536 number of CMA areas in the system.
537
b7176c26 538 If unsure, leave the default value "7" in UMA and "19" in NUMA.
a254129e 539
af8d417a
DS
540config MEM_SOFT_DIRTY
541 bool "Track memory changes"
542 depends on CHECKPOINT_RESTORE && HAVE_ARCH_SOFT_DIRTY && PROC_FS
543 select PROC_PAGE_MONITOR
4e2e2770 544 help
af8d417a
DS
545 This option enables memory changes tracking by introducing a
546 soft-dirty bit on pte-s. This bit is set when someone writes
547 into a page just as regular dirty bit, but unlike the latter
548 it can be cleared by hand.
549
1ad1335d 550 See Documentation/admin-guide/mm/soft-dirty.rst for more details.
4e2e2770 551
2b281117
SJ
552config ZSWAP
553 bool "Compressed cache for swap pages (EXPERIMENTAL)"
554 depends on FRONTSWAP && CRYPTO=y
12d79d64 555 select ZPOOL
2b281117
SJ
556 help
557 A lightweight compressed cache for swap pages. It takes
558 pages that are in the process of being swapped out and attempts to
559 compress them into a dynamically allocated RAM-based memory pool.
560 This can result in a significant I/O reduction on swap device and,
561 in the case where decompressing from RAM is faster than swap device
562 reads, can also improve workload performance.
563
564 This is marked experimental because it is a new feature (as of
565 v3.11) that interacts heavily with memory reclaim. While these
566 interactions don't cause any known issues on simple memory setups,
567 they have not been fully explored on the large set of potential
568 configurations and workloads that exist.
569
bb8b93b5
MS
570choice
571 prompt "Compressed cache for swap pages default compressor"
572 depends on ZSWAP
573 default ZSWAP_COMPRESSOR_DEFAULT_LZO
574 help
575 Selects the default compression algorithm for the compressed cache
576 for swap pages.
577
578 For an overview of what kind of performance can be expected from
579 a particular compression algorithm please refer to the benchmarks
580 available at the following LWN page:
581 https://lwn.net/Articles/751795/
582
583 If in doubt, select 'LZO'.
584
585 The selection made here can be overridden by using the kernel
586 command line 'zswap.compressor=' option.
587
588config ZSWAP_COMPRESSOR_DEFAULT_DEFLATE
589 bool "Deflate"
590 select CRYPTO_DEFLATE
591 help
592 Use the Deflate algorithm as the default compression algorithm.
593
594config ZSWAP_COMPRESSOR_DEFAULT_LZO
595 bool "LZO"
596 select CRYPTO_LZO
597 help
598 Use the LZO algorithm as the default compression algorithm.
599
600config ZSWAP_COMPRESSOR_DEFAULT_842
601 bool "842"
602 select CRYPTO_842
603 help
604 Use the 842 algorithm as the default compression algorithm.
605
606config ZSWAP_COMPRESSOR_DEFAULT_LZ4
607 bool "LZ4"
608 select CRYPTO_LZ4
609 help
610 Use the LZ4 algorithm as the default compression algorithm.
611
612config ZSWAP_COMPRESSOR_DEFAULT_LZ4HC
613 bool "LZ4HC"
614 select CRYPTO_LZ4HC
615 help
616 Use the LZ4HC algorithm as the default compression algorithm.
617
618config ZSWAP_COMPRESSOR_DEFAULT_ZSTD
619 bool "zstd"
620 select CRYPTO_ZSTD
621 help
622 Use the zstd algorithm as the default compression algorithm.
623endchoice
624
625config ZSWAP_COMPRESSOR_DEFAULT
626 string
627 depends on ZSWAP
628 default "deflate" if ZSWAP_COMPRESSOR_DEFAULT_DEFLATE
629 default "lzo" if ZSWAP_COMPRESSOR_DEFAULT_LZO
630 default "842" if ZSWAP_COMPRESSOR_DEFAULT_842
631 default "lz4" if ZSWAP_COMPRESSOR_DEFAULT_LZ4
632 default "lz4hc" if ZSWAP_COMPRESSOR_DEFAULT_LZ4HC
633 default "zstd" if ZSWAP_COMPRESSOR_DEFAULT_ZSTD
634 default ""
635
636choice
637 prompt "Compressed cache for swap pages default allocator"
638 depends on ZSWAP
639 default ZSWAP_ZPOOL_DEFAULT_ZBUD
640 help
641 Selects the default allocator for the compressed cache for
642 swap pages.
643 The default is 'zbud' for compatibility, however please do
644 read the description of each of the allocators below before
645 making a right choice.
646
647 The selection made here can be overridden by using the kernel
648 command line 'zswap.zpool=' option.
649
650config ZSWAP_ZPOOL_DEFAULT_ZBUD
651 bool "zbud"
652 select ZBUD
653 help
654 Use the zbud allocator as the default allocator.
655
656config ZSWAP_ZPOOL_DEFAULT_Z3FOLD
657 bool "z3fold"
658 select Z3FOLD
659 help
660 Use the z3fold allocator as the default allocator.
661
662config ZSWAP_ZPOOL_DEFAULT_ZSMALLOC
663 bool "zsmalloc"
664 select ZSMALLOC
665 help
666 Use the zsmalloc allocator as the default allocator.
667endchoice
668
669config ZSWAP_ZPOOL_DEFAULT
670 string
671 depends on ZSWAP
672 default "zbud" if ZSWAP_ZPOOL_DEFAULT_ZBUD
673 default "z3fold" if ZSWAP_ZPOOL_DEFAULT_Z3FOLD
674 default "zsmalloc" if ZSWAP_ZPOOL_DEFAULT_ZSMALLOC
675 default ""
676
677config ZSWAP_DEFAULT_ON
678 bool "Enable the compressed cache for swap pages by default"
679 depends on ZSWAP
680 help
681 If selected, the compressed cache for swap pages will be enabled
682 at boot, otherwise it will be disabled.
683
684 The selection made here can be overridden by using the kernel
685 command line 'zswap.enabled=' option.
686
af8d417a
DS
687config ZPOOL
688 tristate "Common API for compressed memory storage"
0f8975ec 689 help
af8d417a
DS
690 Compressed memory storage API. This allows using zbud, z3fold or
691 zsmalloc.
0f8975ec 692
af8d417a 693config ZBUD
9a001fc1 694 tristate "Low (Up to 2x) density storage for compressed pages"
af8d417a
DS
695 help
696 A special purpose allocator for storing compressed pages.
697 It is designed to store up to two compressed pages per physical
698 page. While this design limits storage density, it has simple and
699 deterministic reclaim properties that make it preferable to a higher
700 density approach when reclaim will be used.
bcf1647d 701
9a001fc1
VW
702config Z3FOLD
703 tristate "Up to 3x density storage for compressed pages"
704 depends on ZPOOL
9a001fc1
VW
705 help
706 A special purpose allocator for storing compressed pages.
707 It is designed to store up to three compressed pages per physical
708 page. It is a ZBUD derivative so the simplicity and determinism are
709 still there.
710
bcf1647d 711config ZSMALLOC
d867f203 712 tristate "Memory allocator for compressed pages"
bcf1647d 713 depends on MMU
bcf1647d
MK
714 help
715 zsmalloc is a slab-based memory allocator designed to store
716 compressed RAM pages. zsmalloc uses virtual memory mapping
717 in order to reduce fragmentation. However, this results in a
718 non-standard allocator interface where a handle, not a pointer, is
719 returned by an alloc(). This handle must be mapped in order to
720 access the allocated space.
721
0f050d99
GM
722config ZSMALLOC_STAT
723 bool "Export zsmalloc statistics"
724 depends on ZSMALLOC
725 select DEBUG_FS
726 help
727 This option enables code in the zsmalloc to collect various
01ab1ede 728 statistics about what's happening in zsmalloc and exports that
0f050d99
GM
729 information to userspace via debugfs.
730 If unsure, say N.
731
9e5c33d7
MS
732config GENERIC_EARLY_IOREMAP
733 bool
042d27ac 734
22ee3ea5
HD
735config STACK_MAX_DEFAULT_SIZE_MB
736 int "Default maximum user stack size for 32-bit processes (MB)"
737 default 100
042d27ac
HD
738 range 8 2048
739 depends on STACK_GROWSUP && (!64BIT || COMPAT)
740 help
741 This is the maximum stack size in Megabytes in the VM layout of 32-bit
742 user processes when the stack grows upwards (currently only on parisc
22ee3ea5 743 arch) when the RLIMIT_STACK hard limit is unlimited.
042d27ac 744
22ee3ea5 745 A sane initial value is 100 MB.
3a80a7fa 746
3a80a7fa 747config DEFERRED_STRUCT_PAGE_INIT
1ce22103 748 bool "Defer initialisation of struct pages to kthreads"
d39f8fb4 749 depends on SPARSEMEM
ab1e8d89 750 depends on !NEED_PER_CPU_KM
889c695d 751 depends on 64BIT
e4443149 752 select PADATA
3a80a7fa
MG
753 help
754 Ordinarily all struct pages are initialised during early boot in a
755 single thread. On very large machines this can take a considerable
756 amount of time. If this option is set, large machines will bring up
e4443149
DJ
757 a subset of memmap at boot and then initialise the rest in parallel.
758 This has a potential performance impact on tasks running early in the
1ce22103
VB
759 lifetime of the system until these kthreads finish the
760 initialisation.
033fbae9 761
33c3fc71
VD
762config IDLE_PAGE_TRACKING
763 bool "Enable idle page tracking"
764 depends on SYSFS && MMU
765 select PAGE_EXTENSION if !64BIT
766 help
767 This feature allows to estimate the amount of user pages that have
768 not been touched during a given period of time. This information can
769 be useful to tune memory cgroup limits and/or for job placement
770 within a compute cluster.
771
1ad1335d
MR
772 See Documentation/admin-guide/mm/idle_page_tracking.rst for
773 more details.
33c3fc71 774
17596731 775config ARCH_HAS_PTE_DEVMAP
65f7d049
OH
776 bool
777
033fbae9 778config ZONE_DEVICE
5042db43 779 bool "Device memory (pmem, HMM, etc...) hotplug support"
033fbae9
DW
780 depends on MEMORY_HOTPLUG
781 depends on MEMORY_HOTREMOVE
99490f16 782 depends on SPARSEMEM_VMEMMAP
17596731 783 depends on ARCH_HAS_PTE_DEVMAP
3a08cd52 784 select XARRAY_MULTI
033fbae9
DW
785
786 help
787 Device memory hotplug support allows for establishing pmem,
788 or other device driver discovered memory regions, in the
789 memmap. This allows pfn_to_page() lookups of otherwise
790 "device-physical" addresses which is needed for using a DAX
791 mapping in an O_DIRECT operation, among other things.
792
793 If FS_DAX is enabled, then say Y.
06a660ad 794
e7638488
DW
795config DEV_PAGEMAP_OPS
796 bool
797
9c240a7b
CH
798#
799# Helpers to mirror range of the CPU page tables of a process into device page
800# tables.
801#
c0b12405 802config HMM_MIRROR
9c240a7b 803 bool
f442c283 804 depends on MMU
c0b12405 805
5042db43
JG
806config DEVICE_PRIVATE
807 bool "Unaddressable device memory (GPU memory, ...)"
7328d9cc 808 depends on ZONE_DEVICE
e7638488 809 select DEV_PAGEMAP_OPS
5042db43
JG
810
811 help
812 Allows creation of struct pages to represent unaddressable device
813 memory; i.e., memory that is only accessible from the device (or
814 group of devices). You likely also want to select HMM_MIRROR.
815
3e9a9e25
CH
816config VMAP_PFN
817 bool
818
63c17fb8
DH
819config ARCH_USES_HIGH_VMA_FLAGS
820 bool
66d37570
DH
821config ARCH_HAS_PKEYS
822 bool
30a5b536
DZ
823
824config PERCPU_STATS
825 bool "Collect percpu memory statistics"
30a5b536
DZ
826 help
827 This feature collects and exposes statistics via debugfs. The
828 information includes global and per chunk statistics, which can
829 be used to help understand percpu memory usage.
64c349f4 830
9c84f229
JH
831config GUP_TEST
832 bool "Enable infrastructure for get_user_pages()-related unit tests"
d0de8241 833 depends on DEBUG_FS
64c349f4 834 help
9c84f229
JH
835 Provides /sys/kernel/debug/gup_test, which in turn provides a way
836 to make ioctl calls that can launch kernel-based unit tests for
837 the get_user_pages*() and pin_user_pages*() family of API calls.
64c349f4 838
9c84f229
JH
839 These tests include benchmark testing of the _fast variants of
840 get_user_pages*() and pin_user_pages*(), as well as smoke tests of
841 the non-_fast variants.
842
f4f9bda4
JH
843 There is also a sub-test that allows running dump_page() on any
844 of up to eight pages (selected by command line args) within the
845 range of user-space addresses. These pages are either pinned via
846 pin_user_pages*(), or pinned via get_user_pages*(), as specified
847 by other command line arguments.
848
9c84f229 849 See tools/testing/selftests/vm/gup_test.c
3010a5ea 850
d0de8241
BS
851comment "GUP_TEST needs to have DEBUG_FS enabled"
852 depends on !GUP_TEST && !DEBUG_FS
3010a5ea 853
39656e83
CH
854config GUP_GET_PTE_LOW_HIGH
855 bool
856
99cb0dbd
SL
857config READ_ONLY_THP_FOR_FS
858 bool "Read-only THP for filesystems (EXPERIMENTAL)"
396bcc52 859 depends on TRANSPARENT_HUGEPAGE && SHMEM
99cb0dbd
SL
860
861 help
862 Allow khugepaged to put read-only file-backed pages in THP.
863
864 This is marked experimental because it is a new feature. Write
865 support of file THPs will be developed in the next few release
866 cycles.
867
3010a5ea
LD
868config ARCH_HAS_PTE_SPECIAL
869 bool
59e0b520 870
cbd34da7
CH
871#
872# Some architectures require a special hugepage directory format that is
873# required to support multiple hugepage sizes. For example a4fe3ce76
874# "powerpc/mm: Allow more flexible layouts for hugepage pagetables"
875# introduced it on powerpc. This allows for more flexible hugepage
876# pagetable layouts.
877#
878config ARCH_HAS_HUGEPD
879 bool
880
c5acad84
TH
881config MAPPING_DIRTY_HELPERS
882 bool
883
298fa1ad
TG
884config KMAP_LOCAL
885 bool
886
1fbaf8fc
CH
887# struct io_mapping based helper. Selected by drivers that need them
888config IO_MAPPING
889 bool
59e0b520 890endmenu