1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _LINUX_VMSTAT_H
3 #define _LINUX_VMSTAT_H
4
5 #include <linux/types.h>
6 #include <linux/percpu.h>
7 #include <linux/mmzone.h>
8 #include <linux/vm_event_item.h>
9 #include <linux/atomic.h>
10 #include <linux/static_key.h>
11
12 extern int sysctl_stat_interval;
13
14 #ifdef CONFIG_NUMA
15 #define ENABLE_NUMA_STAT 1
16 #define DISABLE_NUMA_STAT 0
17 extern int sysctl_vm_numa_stat;
18 DECLARE_STATIC_KEY_TRUE(vm_numa_stat_key);
19 extern int sysctl_vm_numa_stat_handler(struct ctl_table *table,
20 int write, void __user *buffer, size_t *length, loff_t *ppos);
21 #endif
22
23 struct reclaim_stat {
24 unsigned nr_dirty;
25 unsigned nr_unqueued_dirty;
26 unsigned nr_congested;
27 unsigned nr_writeback;
28 unsigned nr_immediate;
29 unsigned nr_activate;
30 unsigned nr_ref_keep;
31 unsigned nr_unmap_fail;
32 };
33
34 #ifdef CONFIG_VM_EVENT_COUNTERS
35 /*
36 * Light weight per cpu counter implementation.
37 *
38 * Counters should only be incremented and no critical kernel component
39 * should rely on the counter values.
40 *
41 * Counters are handled completely inline. On many platforms the code
42 * generated will simply be the increment of a global address.
43 */
44
45 struct vm_event_state {
46 unsigned long event[NR_VM_EVENT_ITEMS];
47 };
48
49 DECLARE_PER_CPU(struct vm_event_state, vm_event_states);
50
51 /*
52 * vm counters are allowed to be racy. Use raw_cpu_ops to avoid the
53 * local_irq_disable overhead.
54 */
__count_vm_event(enum vm_event_item item)55 static inline void __count_vm_event(enum vm_event_item item)
56 {
57 raw_cpu_inc(vm_event_states.event[item]);
58 }
59
count_vm_event(enum vm_event_item item)60 static inline void count_vm_event(enum vm_event_item item)
61 {
62 this_cpu_inc(vm_event_states.event[item]);
63 }
64
__count_vm_events(enum vm_event_item item,long delta)65 static inline void __count_vm_events(enum vm_event_item item, long delta)
66 {
67 raw_cpu_add(vm_event_states.event[item], delta);
68 }
69
count_vm_events(enum vm_event_item item,long delta)70 static inline void count_vm_events(enum vm_event_item item, long delta)
71 {
72 this_cpu_add(vm_event_states.event[item], delta);
73 }
74
75 extern void all_vm_events(unsigned long *);
76
77 extern void vm_events_fold_cpu(int cpu);
78
79 #else
80
81 /* Disable counters */
count_vm_event(enum vm_event_item item)82 static inline void count_vm_event(enum vm_event_item item)
83 {
84 }
count_vm_events(enum vm_event_item item,long delta)85 static inline void count_vm_events(enum vm_event_item item, long delta)
86 {
87 }
__count_vm_event(enum vm_event_item item)88 static inline void __count_vm_event(enum vm_event_item item)
89 {
90 }
__count_vm_events(enum vm_event_item item,long delta)91 static inline void __count_vm_events(enum vm_event_item item, long delta)
92 {
93 }
all_vm_events(unsigned long * ret)94 static inline void all_vm_events(unsigned long *ret)
95 {
96 }
vm_events_fold_cpu(int cpu)97 static inline void vm_events_fold_cpu(int cpu)
98 {
99 }
100
101 #endif /* CONFIG_VM_EVENT_COUNTERS */
102
103 #ifdef CONFIG_NUMA_BALANCING
104 #define count_vm_numa_event(x) count_vm_event(x)
105 #define count_vm_numa_events(x, y) count_vm_events(x, y)
106 #else
107 #define count_vm_numa_event(x) do {} while (0)
108 #define count_vm_numa_events(x, y) do { (void)(y); } while (0)
109 #endif /* CONFIG_NUMA_BALANCING */
110
111 #ifdef CONFIG_DEBUG_TLBFLUSH
112 #define count_vm_tlb_event(x) count_vm_event(x)
113 #define count_vm_tlb_events(x, y) count_vm_events(x, y)
114 #else
115 #define count_vm_tlb_event(x) do {} while (0)
116 #define count_vm_tlb_events(x, y) do { (void)(y); } while (0)
117 #endif
118
119 #ifdef CONFIG_DEBUG_VM_VMACACHE
120 #define count_vm_vmacache_event(x) count_vm_event(x)
121 #else
122 #define count_vm_vmacache_event(x) do {} while (0)
123 #endif
124
125 #define __count_zid_vm_events(item, zid, delta) \
126 __count_vm_events(item##_NORMAL - ZONE_NORMAL + zid, delta)
127
128 /*
129 * Zone and node-based page accounting with per cpu differentials.
130 */
131 extern atomic_long_t vm_zone_stat[NR_VM_ZONE_STAT_ITEMS];
132 extern atomic_long_t vm_numa_stat[NR_VM_NUMA_STAT_ITEMS];
133 extern atomic_long_t vm_node_stat[NR_VM_NODE_STAT_ITEMS];
134
135 #ifdef CONFIG_NUMA
zone_numa_state_add(long x,struct zone * zone,enum numa_stat_item item)136 static inline void zone_numa_state_add(long x, struct zone *zone,
137 enum numa_stat_item item)
138 {
139 atomic_long_add(x, &zone->vm_numa_stat[item]);
140 atomic_long_add(x, &vm_numa_stat[item]);
141 }
142
global_numa_state(enum numa_stat_item item)143 static inline unsigned long global_numa_state(enum numa_stat_item item)
144 {
145 long x = atomic_long_read(&vm_numa_stat[item]);
146
147 return x;
148 }
149
zone_numa_state_snapshot(struct zone * zone,enum numa_stat_item item)150 static inline unsigned long zone_numa_state_snapshot(struct zone *zone,
151 enum numa_stat_item item)
152 {
153 long x = atomic_long_read(&zone->vm_numa_stat[item]);
154 int cpu;
155
156 for_each_online_cpu(cpu)
157 x += per_cpu_ptr(zone->pageset, cpu)->vm_numa_stat_diff[item];
158
159 return x;
160 }
161 #endif /* CONFIG_NUMA */
162
zone_page_state_add(long x,struct zone * zone,enum zone_stat_item item)163 static inline void zone_page_state_add(long x, struct zone *zone,
164 enum zone_stat_item item)
165 {
166 atomic_long_add(x, &zone->vm_stat[item]);
167 atomic_long_add(x, &vm_zone_stat[item]);
168 }
169
node_page_state_add(long x,struct pglist_data * pgdat,enum node_stat_item item)170 static inline void node_page_state_add(long x, struct pglist_data *pgdat,
171 enum node_stat_item item)
172 {
173 atomic_long_add(x, &pgdat->vm_stat[item]);
174 atomic_long_add(x, &vm_node_stat[item]);
175 }
176
global_zone_page_state(enum zone_stat_item item)177 static inline unsigned long global_zone_page_state(enum zone_stat_item item)
178 {
179 long x = atomic_long_read(&vm_zone_stat[item]);
180 #ifdef CONFIG_SMP
181 if (x < 0)
182 x = 0;
183 #endif
184 return x;
185 }
186
global_node_page_state(enum node_stat_item item)187 static inline unsigned long global_node_page_state(enum node_stat_item item)
188 {
189 long x = atomic_long_read(&vm_node_stat[item]);
190 #ifdef CONFIG_SMP
191 if (x < 0)
192 x = 0;
193 #endif
194 return x;
195 }
196
zone_page_state(struct zone * zone,enum zone_stat_item item)197 static inline unsigned long zone_page_state(struct zone *zone,
198 enum zone_stat_item item)
199 {
200 long x = atomic_long_read(&zone->vm_stat[item]);
201 #ifdef CONFIG_SMP
202 if (x < 0)
203 x = 0;
204 #endif
205 return x;
206 }
207
208 /*
209 * More accurate version that also considers the currently pending
210 * deltas. For that we need to loop over all cpus to find the current
211 * deltas. There is no synchronization so the result cannot be
212 * exactly accurate either.
213 */
zone_page_state_snapshot(struct zone * zone,enum zone_stat_item item)214 static inline unsigned long zone_page_state_snapshot(struct zone *zone,
215 enum zone_stat_item item)
216 {
217 long x = atomic_long_read(&zone->vm_stat[item]);
218
219 #ifdef CONFIG_SMP
220 int cpu;
221 for_each_online_cpu(cpu)
222 x += per_cpu_ptr(zone->pageset, cpu)->vm_stat_diff[item];
223
224 if (x < 0)
225 x = 0;
226 #endif
227 return x;
228 }
229
230 #ifdef CONFIG_NUMA
231 extern void __inc_numa_state(struct zone *zone, enum numa_stat_item item);
232 extern unsigned long sum_zone_node_page_state(int node,
233 enum zone_stat_item item);
234 extern unsigned long sum_zone_numa_state(int node, enum numa_stat_item item);
235 extern unsigned long node_page_state(struct pglist_data *pgdat,
236 enum node_stat_item item);
237 #else
238 #define sum_zone_node_page_state(node, item) global_zone_page_state(item)
239 #define node_page_state(node, item) global_node_page_state(item)
240 #endif /* CONFIG_NUMA */
241
242 #define add_zone_page_state(__z, __i, __d) mod_zone_page_state(__z, __i, __d)
243 #define sub_zone_page_state(__z, __i, __d) mod_zone_page_state(__z, __i, -(__d))
244 #define add_node_page_state(__p, __i, __d) mod_node_page_state(__p, __i, __d)
245 #define sub_node_page_state(__p, __i, __d) mod_node_page_state(__p, __i, -(__d))
246
247 #ifdef CONFIG_SMP
248 void __mod_zone_page_state(struct zone *, enum zone_stat_item item, long);
249 void __inc_zone_page_state(struct page *, enum zone_stat_item);
250 void __dec_zone_page_state(struct page *, enum zone_stat_item);
251
252 void __mod_node_page_state(struct pglist_data *, enum node_stat_item item, long);
253 void __inc_node_page_state(struct page *, enum node_stat_item);
254 void __dec_node_page_state(struct page *, enum node_stat_item);
255
256 void mod_zone_page_state(struct zone *, enum zone_stat_item, long);
257 void inc_zone_page_state(struct page *, enum zone_stat_item);
258 void dec_zone_page_state(struct page *, enum zone_stat_item);
259
260 void mod_node_page_state(struct pglist_data *, enum node_stat_item, long);
261 void inc_node_page_state(struct page *, enum node_stat_item);
262 void dec_node_page_state(struct page *, enum node_stat_item);
263
264 extern void inc_node_state(struct pglist_data *, enum node_stat_item);
265 extern void __inc_zone_state(struct zone *, enum zone_stat_item);
266 extern void __inc_node_state(struct pglist_data *, enum node_stat_item);
267 extern void dec_zone_state(struct zone *, enum zone_stat_item);
268 extern void __dec_zone_state(struct zone *, enum zone_stat_item);
269 extern void __dec_node_state(struct pglist_data *, enum node_stat_item);
270
271 void quiet_vmstat(void);
272 void cpu_vm_stats_fold(int cpu);
273 void refresh_zone_stat_thresholds(void);
274
275 struct ctl_table;
276 int vmstat_refresh(struct ctl_table *, int write,
277 void __user *buffer, size_t *lenp, loff_t *ppos);
278
279 void drain_zonestat(struct zone *zone, struct per_cpu_pageset *);
280
281 int calculate_pressure_threshold(struct zone *zone);
282 int calculate_normal_threshold(struct zone *zone);
283 void set_pgdat_percpu_threshold(pg_data_t *pgdat,
284 int (*calculate_pressure)(struct zone *));
285 #else /* CONFIG_SMP */
286
287 /*
288 * We do not maintain differentials in a single processor configuration.
289 * The functions directly modify the zone and global counters.
290 */
__mod_zone_page_state(struct zone * zone,enum zone_stat_item item,long delta)291 static inline void __mod_zone_page_state(struct zone *zone,
292 enum zone_stat_item item, long delta)
293 {
294 zone_page_state_add(delta, zone, item);
295 }
296
__mod_node_page_state(struct pglist_data * pgdat,enum node_stat_item item,int delta)297 static inline void __mod_node_page_state(struct pglist_data *pgdat,
298 enum node_stat_item item, int delta)
299 {
300 node_page_state_add(delta, pgdat, item);
301 }
302
__inc_zone_state(struct zone * zone,enum zone_stat_item item)303 static inline void __inc_zone_state(struct zone *zone, enum zone_stat_item item)
304 {
305 atomic_long_inc(&zone->vm_stat[item]);
306 atomic_long_inc(&vm_zone_stat[item]);
307 }
308
__inc_node_state(struct pglist_data * pgdat,enum node_stat_item item)309 static inline void __inc_node_state(struct pglist_data *pgdat, enum node_stat_item item)
310 {
311 atomic_long_inc(&pgdat->vm_stat[item]);
312 atomic_long_inc(&vm_node_stat[item]);
313 }
314
__dec_zone_state(struct zone * zone,enum zone_stat_item item)315 static inline void __dec_zone_state(struct zone *zone, enum zone_stat_item item)
316 {
317 atomic_long_dec(&zone->vm_stat[item]);
318 atomic_long_dec(&vm_zone_stat[item]);
319 }
320
__dec_node_state(struct pglist_data * pgdat,enum node_stat_item item)321 static inline void __dec_node_state(struct pglist_data *pgdat, enum node_stat_item item)
322 {
323 atomic_long_dec(&pgdat->vm_stat[item]);
324 atomic_long_dec(&vm_node_stat[item]);
325 }
326
__inc_zone_page_state(struct page * page,enum zone_stat_item item)327 static inline void __inc_zone_page_state(struct page *page,
328 enum zone_stat_item item)
329 {
330 __inc_zone_state(page_zone(page), item);
331 }
332
__inc_node_page_state(struct page * page,enum node_stat_item item)333 static inline void __inc_node_page_state(struct page *page,
334 enum node_stat_item item)
335 {
336 __inc_node_state(page_pgdat(page), item);
337 }
338
339
__dec_zone_page_state(struct page * page,enum zone_stat_item item)340 static inline void __dec_zone_page_state(struct page *page,
341 enum zone_stat_item item)
342 {
343 __dec_zone_state(page_zone(page), item);
344 }
345
__dec_node_page_state(struct page * page,enum node_stat_item item)346 static inline void __dec_node_page_state(struct page *page,
347 enum node_stat_item item)
348 {
349 __dec_node_state(page_pgdat(page), item);
350 }
351
352
353 /*
354 * We only use atomic operations to update counters. So there is no need to
355 * disable interrupts.
356 */
357 #define inc_zone_page_state __inc_zone_page_state
358 #define dec_zone_page_state __dec_zone_page_state
359 #define mod_zone_page_state __mod_zone_page_state
360
361 #define inc_node_page_state __inc_node_page_state
362 #define dec_node_page_state __dec_node_page_state
363 #define mod_node_page_state __mod_node_page_state
364
365 #define inc_zone_state __inc_zone_state
366 #define inc_node_state __inc_node_state
367 #define dec_zone_state __dec_zone_state
368
369 #define set_pgdat_percpu_threshold(pgdat, callback) { }
370
refresh_zone_stat_thresholds(void)371 static inline void refresh_zone_stat_thresholds(void) { }
cpu_vm_stats_fold(int cpu)372 static inline void cpu_vm_stats_fold(int cpu) { }
quiet_vmstat(void)373 static inline void quiet_vmstat(void) { }
374
drain_zonestat(struct zone * zone,struct per_cpu_pageset * pset)375 static inline void drain_zonestat(struct zone *zone,
376 struct per_cpu_pageset *pset) { }
377 #endif /* CONFIG_SMP */
378
__mod_zone_freepage_state(struct zone * zone,int nr_pages,int migratetype)379 static inline void __mod_zone_freepage_state(struct zone *zone, int nr_pages,
380 int migratetype)
381 {
382 __mod_zone_page_state(zone, NR_FREE_PAGES, nr_pages);
383 if (is_migrate_cma(migratetype))
384 __mod_zone_page_state(zone, NR_FREE_CMA_PAGES, nr_pages);
385 }
386
387 extern const char * const vmstat_text[];
388
389 #endif /* _LINUX_VMSTAT_H */
390