git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blob - include/linux/vmstat.h
Merge git://git.kernel.org/pub/scm/linux/kernel/git/netdev/net
[mirror_ubuntu-jammy-kernel.git] / include / linux / vmstat.h
1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _LINUX_VMSTAT_H
3 #define _LINUX_VMSTAT_H
4
5 #include <linux/types.h>
6 #include <linux/percpu.h>
7 #include <linux/mmzone.h>
8 #include <linux/vm_event_item.h>
9 #include <linux/atomic.h>
10 #include <linux/static_key.h>
11
/* Defined outside this header. */
extern int sysctl_stat_interval;

#ifdef CONFIG_NUMA
/* NOTE(review): presumably the two values sysctl_vm_numa_stat takes - confirm. */
#define ENABLE_NUMA_STAT   1
#define DISABLE_NUMA_STAT  0

extern int sysctl_vm_numa_stat;
DECLARE_STATIC_KEY_TRUE(vm_numa_stat_key);

/* sysctl handler for sysctl_vm_numa_stat; implemented outside this header. */
int sysctl_vm_numa_stat_handler(struct ctl_table *table, int write,
				void __user *buffer, size_t *length,
				loff_t *ppos);
#endif /* CONFIG_NUMA */
22
/*
 * Counters describing one reclaim pass. The fields are filled in by code
 * outside this header; nr_activate holds two slots.
 */
struct reclaim_stat {
	unsigned int nr_dirty;
	unsigned int nr_unqueued_dirty;
	unsigned int nr_congested;
	unsigned int nr_writeback;
	unsigned int nr_immediate;
	unsigned int nr_activate[2];
	unsigned int nr_ref_keep;
	unsigned int nr_unmap_fail;
};
33
/* Indices of the writeback threshold entries. */
enum writeback_stat_item {
	NR_DIRTY_THRESHOLD = 0,
	NR_DIRTY_BG_THRESHOLD,
	NR_VM_WRITEBACK_STAT_ITEMS,	/* count of the items above; keep last */
};
39
40 #ifdef CONFIG_VM_EVENT_COUNTERS
41 /*
42 * Light weight per cpu counter implementation.
43 *
44 * Counters should only be incremented and no critical kernel component
45 * should rely on the counter values.
46 *
47 * Counters are handled completely inline. On many platforms the code
48 * generated will simply be the increment of a global address.
49 */
50
51 struct vm_event_state {
52 unsigned long event[NR_VM_EVENT_ITEMS];
53 };
54
55 DECLARE_PER_CPU(struct vm_event_state, vm_event_states);
56
57 /*
58 * vm counters are allowed to be racy. Use raw_cpu_ops to avoid the
59 * local_irq_disable overhead.
60 */
61 static inline void __count_vm_event(enum vm_event_item item)
62 {
63 raw_cpu_inc(vm_event_states.event[item]);
64 }
65
66 static inline void count_vm_event(enum vm_event_item item)
67 {
68 this_cpu_inc(vm_event_states.event[item]);
69 }
70
71 static inline void __count_vm_events(enum vm_event_item item, long delta)
72 {
73 raw_cpu_add(vm_event_states.event[item], delta);
74 }
75
76 static inline void count_vm_events(enum vm_event_item item, long delta)
77 {
78 this_cpu_add(vm_event_states.event[item], delta);
79 }
80
/* Implemented outside this header when event counters are enabled. */
void all_vm_events(unsigned long *ret);
void vm_events_fold_cpu(int cpu);
84
85 #else
86
87 /* Disable counters */
88 static inline void count_vm_event(enum vm_event_item item)
89 {
90 }
91 static inline void count_vm_events(enum vm_event_item item, long delta)
92 {
93 }
94 static inline void __count_vm_event(enum vm_event_item item)
95 {
96 }
97 static inline void __count_vm_events(enum vm_event_item item, long delta)
98 {
99 }
100 static inline void all_vm_events(unsigned long *ret)
101 {
102 }
103 static inline void vm_events_fold_cpu(int cpu)
104 {
105 }
106
107 #endif /* CONFIG_VM_EVENT_COUNTERS */
108
/*
 * NUMA balancing event counters.
 *
 * With CONFIG_NUMA_BALANCING they forward to count_vm_event() and
 * count_vm_events(). Without it they expand to empty statements: the
 * event argument is dropped, while the plural form still evaluates its
 * second argument exactly once.
 */
#ifndef CONFIG_NUMA_BALANCING
#define count_vm_numa_event(x) do {} while (0)
#define count_vm_numa_events(x, y) do { (void)(y); } while (0)
#else
#define count_vm_numa_event(x) count_vm_event(x)
#define count_vm_numa_events(x, y) count_vm_events(x, y)
#endif /* !CONFIG_NUMA_BALANCING */
116
/*
 * TLB flush event counters.
 *
 * With CONFIG_DEBUG_TLBFLUSH they forward to count_vm_event() and
 * count_vm_events(). Without it they expand to empty statements: the
 * event argument is dropped, while the plural form still evaluates its
 * second argument exactly once.
 */
#ifndef CONFIG_DEBUG_TLBFLUSH
#define count_vm_tlb_event(x) do {} while (0)
#define count_vm_tlb_events(x, y) do { (void)(y); } while (0)
#else
#define count_vm_tlb_event(x) count_vm_event(x)
#define count_vm_tlb_events(x, y) count_vm_events(x, y)
#endif /* !CONFIG_DEBUG_TLBFLUSH */
124
/*
 * vmacache event counter: forwards to count_vm_event() with
 * CONFIG_DEBUG_VM_VMACACHE, otherwise expands to an empty statement that
 * does not evaluate its argument.
 */
#ifndef CONFIG_DEBUG_VM_VMACACHE
#define count_vm_vmacache_event(x) do {} while (0)
#else
#define count_vm_vmacache_event(x) count_vm_event(x)
#endif /* !CONFIG_DEBUG_VM_VMACACHE */
130
/*
 * Count @delta against the per-zone flavour of an event: the event index is
 * item##_NORMAL shifted by the distance of @zid from ZONE_NORMAL.
 *
 * @zid is parenthesized so that an expression argument (for example a
 * conditional expression) is added as a whole instead of being split by
 * operator precedence.
 */
#define __count_zid_vm_events(item, zid, delta) \
	__count_vm_events(item##_NORMAL - ZONE_NORMAL + (zid), delta)
133
134 /*
135 * Zone and node-based page accounting with per cpu differentials.
136 */
137 extern atomic_long_t vm_zone_stat[NR_VM_ZONE_STAT_ITEMS];
138 extern atomic_long_t vm_numa_stat[NR_VM_NUMA_STAT_ITEMS];
139 extern atomic_long_t vm_node_stat[NR_VM_NODE_STAT_ITEMS];
140
141 #ifdef CONFIG_NUMA
142 static inline void zone_numa_state_add(long x, struct zone *zone,
143 enum numa_stat_item item)
144 {
145 atomic_long_add(x, &zone->vm_numa_stat[item]);
146 atomic_long_add(x, &vm_numa_stat[item]);
147 }
148
149 static inline unsigned long global_numa_state(enum numa_stat_item item)
150 {
151 long x = atomic_long_read(&vm_numa_stat[item]);
152
153 return x;
154 }
155
156 static inline unsigned long zone_numa_state_snapshot(struct zone *zone,
157 enum numa_stat_item item)
158 {
159 long x = atomic_long_read(&zone->vm_numa_stat[item]);
160 int cpu;
161
162 for_each_online_cpu(cpu)
163 x += per_cpu_ptr(zone->pageset, cpu)->vm_numa_stat_diff[item];
164
165 return x;
166 }
167 #endif /* CONFIG_NUMA */
168
169 static inline void zone_page_state_add(long x, struct zone *zone,
170 enum zone_stat_item item)
171 {
172 atomic_long_add(x, &zone->vm_stat[item]);
173 atomic_long_add(x, &vm_zone_stat[item]);
174 }
175
176 static inline void node_page_state_add(long x, struct pglist_data *pgdat,
177 enum node_stat_item item)
178 {
179 atomic_long_add(x, &pgdat->vm_stat[item]);
180 atomic_long_add(x, &vm_node_stat[item]);
181 }
182
183 static inline unsigned long global_zone_page_state(enum zone_stat_item item)
184 {
185 long x = atomic_long_read(&vm_zone_stat[item]);
186 #ifdef CONFIG_SMP
187 if (x < 0)
188 x = 0;
189 #endif
190 return x;
191 }
192
193 static inline unsigned long global_node_page_state(enum node_stat_item item)
194 {
195 long x = atomic_long_read(&vm_node_stat[item]);
196 #ifdef CONFIG_SMP
197 if (x < 0)
198 x = 0;
199 #endif
200 return x;
201 }
202
203 static inline unsigned long zone_page_state(struct zone *zone,
204 enum zone_stat_item item)
205 {
206 long x = atomic_long_read(&zone->vm_stat[item]);
207 #ifdef CONFIG_SMP
208 if (x < 0)
209 x = 0;
210 #endif
211 return x;
212 }
213
214 /*
215 * More accurate version that also considers the currently pending
216 * deltas. For that we need to loop over all cpus to find the current
217 * deltas. There is no synchronization so the result cannot be
218 * exactly accurate either.
219 */
220 static inline unsigned long zone_page_state_snapshot(struct zone *zone,
221 enum zone_stat_item item)
222 {
223 long x = atomic_long_read(&zone->vm_stat[item]);
224
225 #ifdef CONFIG_SMP
226 int cpu;
227 for_each_online_cpu(cpu)
228 x += per_cpu_ptr(zone->pageset, cpu)->vm_stat_diff[item];
229
230 if (x < 0)
231 x = 0;
232 #endif
233 return x;
234 }
235
/*
 * Per-node readers. Without CONFIG_NUMA the node argument is ignored and
 * the readers collapse to the global ones; with it they are real functions
 * implemented outside this header.
 */
#ifndef CONFIG_NUMA
#define sum_zone_node_page_state(node, item) global_zone_page_state(item)
#define node_page_state(node, item) global_node_page_state(item)
#else
void __inc_numa_state(struct zone *zone, enum numa_stat_item item);
unsigned long sum_zone_node_page_state(int node, enum zone_stat_item item);
unsigned long sum_zone_numa_state(int node, enum numa_stat_item item);
unsigned long node_page_state(struct pglist_data *pgdat,
			      enum node_stat_item item);
#endif /* !CONFIG_NUMA */
247
248 #ifdef CONFIG_SMP
249 void __mod_zone_page_state(struct zone *, enum zone_stat_item item, long);
250 void __inc_zone_page_state(struct page *, enum zone_stat_item);
251 void __dec_zone_page_state(struct page *, enum zone_stat_item);
252
253 void __mod_node_page_state(struct pglist_data *, enum node_stat_item item, long);
254 void __inc_node_page_state(struct page *, enum node_stat_item);
255 void __dec_node_page_state(struct page *, enum node_stat_item);
256
257 void mod_zone_page_state(struct zone *, enum zone_stat_item, long);
258 void inc_zone_page_state(struct page *, enum zone_stat_item);
259 void dec_zone_page_state(struct page *, enum zone_stat_item);
260
261 void mod_node_page_state(struct pglist_data *, enum node_stat_item, long);
262 void inc_node_page_state(struct page *, enum node_stat_item);
263 void dec_node_page_state(struct page *, enum node_stat_item);
264
265 extern void inc_node_state(struct pglist_data *, enum node_stat_item);
266 extern void __inc_zone_state(struct zone *, enum zone_stat_item);
267 extern void __inc_node_state(struct pglist_data *, enum node_stat_item);
268 extern void dec_zone_state(struct zone *, enum zone_stat_item);
269 extern void __dec_zone_state(struct zone *, enum zone_stat_item);
270 extern void __dec_node_state(struct pglist_data *, enum node_stat_item);
271
272 void quiet_vmstat(void);
273 void cpu_vm_stats_fold(int cpu);
274 void refresh_zone_stat_thresholds(void);
275
276 struct ctl_table;
277 int vmstat_refresh(struct ctl_table *, int write,
278 void __user *buffer, size_t *lenp, loff_t *ppos);
279
280 void drain_zonestat(struct zone *zone, struct per_cpu_pageset *);
281
282 int calculate_pressure_threshold(struct zone *zone);
283 int calculate_normal_threshold(struct zone *zone);
284 void set_pgdat_percpu_threshold(pg_data_t *pgdat,
285 int (*calculate_pressure)(struct zone *));
286 #else /* CONFIG_SMP */
287
288 /*
289 * We do not maintain differentials in a single processor configuration.
290 * The functions directly modify the zone and global counters.
291 */
292 static inline void __mod_zone_page_state(struct zone *zone,
293 enum zone_stat_item item, long delta)
294 {
295 zone_page_state_add(delta, zone, item);
296 }
297
298 static inline void __mod_node_page_state(struct pglist_data *pgdat,
299 enum node_stat_item item, int delta)
300 {
301 node_page_state_add(delta, pgdat, item);
302 }
303
304 static inline void __inc_zone_state(struct zone *zone, enum zone_stat_item item)
305 {
306 atomic_long_inc(&zone->vm_stat[item]);
307 atomic_long_inc(&vm_zone_stat[item]);
308 }
309
310 static inline void __inc_node_state(struct pglist_data *pgdat, enum node_stat_item item)
311 {
312 atomic_long_inc(&pgdat->vm_stat[item]);
313 atomic_long_inc(&vm_node_stat[item]);
314 }
315
316 static inline void __dec_zone_state(struct zone *zone, enum zone_stat_item item)
317 {
318 atomic_long_dec(&zone->vm_stat[item]);
319 atomic_long_dec(&vm_zone_stat[item]);
320 }
321
322 static inline void __dec_node_state(struct pglist_data *pgdat, enum node_stat_item item)
323 {
324 atomic_long_dec(&pgdat->vm_stat[item]);
325 atomic_long_dec(&vm_node_stat[item]);
326 }
327
328 static inline void __inc_zone_page_state(struct page *page,
329 enum zone_stat_item item)
330 {
331 __inc_zone_state(page_zone(page), item);
332 }
333
334 static inline void __inc_node_page_state(struct page *page,
335 enum node_stat_item item)
336 {
337 __inc_node_state(page_pgdat(page), item);
338 }
339
340
341 static inline void __dec_zone_page_state(struct page *page,
342 enum zone_stat_item item)
343 {
344 __dec_zone_state(page_zone(page), item);
345 }
346
347 static inline void __dec_node_page_state(struct page *page,
348 enum node_stat_item item)
349 {
350 __dec_node_state(page_pgdat(page), item);
351 }
352
353
/*
 * On UP the counters are only ever updated with atomic operations, so
 * interrupts need not be disabled and the plain names can simply alias the
 * double-underscore variants.
 */
#define mod_zone_page_state __mod_zone_page_state
#define inc_zone_page_state __inc_zone_page_state
#define dec_zone_page_state __dec_zone_page_state

#define mod_node_page_state __mod_node_page_state
#define inc_node_page_state __inc_node_page_state
#define dec_node_page_state __dec_node_page_state

#define inc_zone_state __inc_zone_state
#define dec_zone_state __dec_zone_state
#define inc_node_state __inc_node_state
369
/*
 * UP stub: expands to an empty statement and evaluates neither argument.
 * Written as do { } while (0) so that the usual "macro(...);" form is a
 * single statement and stays valid in an unbraced if/else.
 */
#define set_pgdat_percpu_threshold(pgdat, callback) do { } while (0)
371
/* UP stubs: these maintenance entry points do nothing here. */
static inline void refresh_zone_stat_thresholds(void)
{
}

static inline void cpu_vm_stats_fold(int cpu)
{
}

static inline void quiet_vmstat(void)
{
}

static inline void drain_zonestat(struct zone *zone,
				  struct per_cpu_pageset *pset)
{
}
378 #endif /* CONFIG_SMP */
379
380 static inline void __mod_zone_freepage_state(struct zone *zone, int nr_pages,
381 int migratetype)
382 {
383 __mod_zone_page_state(zone, NR_FREE_PAGES, nr_pages);
384 if (is_migrate_cma(migratetype))
385 __mod_zone_page_state(zone, NR_FREE_CMA_PAGES, nr_pages);
386 }
387
388 extern const char * const vmstat_text[];
389
390 static inline const char *zone_stat_name(enum zone_stat_item item)
391 {
392 return vmstat_text[item];
393 }
394
395 #ifdef CONFIG_NUMA
396 static inline const char *numa_stat_name(enum numa_stat_item item)
397 {
398 return vmstat_text[NR_VM_ZONE_STAT_ITEMS +
399 item];
400 }
401 #endif /* CONFIG_NUMA */
402
403 static inline const char *node_stat_name(enum node_stat_item item)
404 {
405 return vmstat_text[NR_VM_ZONE_STAT_ITEMS +
406 NR_VM_NUMA_STAT_ITEMS +
407 item];
408 }
409
410 static inline const char *lru_list_name(enum lru_list lru)
411 {
412 return node_stat_name(NR_LRU_BASE + lru) + 3; // skip "nr_"
413 }
414
415 static inline const char *writeback_stat_name(enum writeback_stat_item item)
416 {
417 return vmstat_text[NR_VM_ZONE_STAT_ITEMS +
418 NR_VM_NUMA_STAT_ITEMS +
419 NR_VM_NODE_STAT_ITEMS +
420 item];
421 }
422
#if defined(CONFIG_VM_EVENT_COUNTERS) || defined(CONFIG_MEMCG)
/*
 * Name of vm event @item; event names form the last section of vmstat_text,
 * after the zone, NUMA, node and writeback names.
 */
static inline const char *vm_event_name(enum vm_event_item item)
{
	const char * const *event_names =
		&vmstat_text[NR_VM_ZONE_STAT_ITEMS +
			     NR_VM_NUMA_STAT_ITEMS +
			     NR_VM_NODE_STAT_ITEMS +
			     NR_VM_WRITEBACK_STAT_ITEMS];

	return event_names[item];
}
#endif /* CONFIG_VM_EVENT_COUNTERS || CONFIG_MEMCG */
433
434 #endif /* _LINUX_VMSTAT_H */