Loading...
1/*
2 * Fast batching percpu counters.
3 */
4
5#include <linux/percpu_counter.h>
6#include <linux/notifier.h>
7#include <linux/mutex.h>
8#include <linux/init.h>
9#include <linux/cpu.h>
10#include <linux/module.h>
11#include <linux/debugobjects.h>
12
#ifdef CONFIG_HOTPLUG_CPU
/* Every initialised counter is linked here so the CPU hotplug callback can walk them. */
static LIST_HEAD(percpu_counters);
/* Held around every addition to, removal from and walk of percpu_counters. */
static DEFINE_SPINLOCK(percpu_counters_lock);
#endif
17
18#ifdef CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER
19
20static struct debug_obj_descr percpu_counter_debug_descr;
21
22static int percpu_counter_fixup_free(void *addr, enum debug_obj_state state)
23{
24 struct percpu_counter *fbc = addr;
25
26 switch (state) {
27 case ODEBUG_STATE_ACTIVE:
28 percpu_counter_destroy(fbc);
29 debug_object_free(fbc, &percpu_counter_debug_descr);
30 return 1;
31 default:
32 return 0;
33 }
34}
35
/*
 * debugobjects descriptor used for every percpu counter tracked by this file;
 * only the free-time fixup hook is provided.
 */
static struct debug_obj_descr percpu_counter_debug_descr = {
	.name = "percpu_counter",
	.fixup_free = percpu_counter_fixup_free,
};
40
41static inline void debug_percpu_counter_activate(struct percpu_counter *fbc)
42{
43 debug_object_init(fbc, &percpu_counter_debug_descr);
44 debug_object_activate(fbc, &percpu_counter_debug_descr);
45}
46
47static inline void debug_percpu_counter_deactivate(struct percpu_counter *fbc)
48{
49 debug_object_deactivate(fbc, &percpu_counter_debug_descr);
50 debug_object_free(fbc, &percpu_counter_debug_descr);
51}
52
53#else /* CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER */
/* No-op variant used when CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER is not set. */
static inline void debug_percpu_counter_activate(struct percpu_counter *fbc)
{ }
/* No-op variant used when CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER is not set. */
static inline void debug_percpu_counter_deactivate(struct percpu_counter *fbc)
{ }
58#endif /* CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER */
59
60void percpu_counter_set(struct percpu_counter *fbc, s64 amount)
61{
62 int cpu;
63 unsigned long flags;
64
65 raw_spin_lock_irqsave(&fbc->lock, flags);
66 for_each_possible_cpu(cpu) {
67 s32 *pcount = per_cpu_ptr(fbc->counters, cpu);
68 *pcount = 0;
69 }
70 fbc->count = amount;
71 raw_spin_unlock_irqrestore(&fbc->lock, flags);
72}
73EXPORT_SYMBOL(percpu_counter_set);
74
75void __percpu_counter_add(struct percpu_counter *fbc, s64 amount, s32 batch)
76{
77 s64 count;
78
79 preempt_disable();
80 count = __this_cpu_read(*fbc->counters) + amount;
81 if (count >= batch || count <= -batch) {
82 unsigned long flags;
83 raw_spin_lock_irqsave(&fbc->lock, flags);
84 fbc->count += count;
85 __this_cpu_sub(*fbc->counters, count - amount);
86 raw_spin_unlock_irqrestore(&fbc->lock, flags);
87 } else {
88 this_cpu_add(*fbc->counters, amount);
89 }
90 preempt_enable();
91}
92EXPORT_SYMBOL(__percpu_counter_add);
93
94/*
95 * Add up all the per-cpu counts, return the result. This is a more accurate
96 * but much slower version of percpu_counter_read_positive()
97 */
98s64 __percpu_counter_sum(struct percpu_counter *fbc)
99{
100 s64 ret;
101 int cpu;
102 unsigned long flags;
103
104 raw_spin_lock_irqsave(&fbc->lock, flags);
105 ret = fbc->count;
106 for_each_online_cpu(cpu) {
107 s32 *pcount = per_cpu_ptr(fbc->counters, cpu);
108 ret += *pcount;
109 }
110 raw_spin_unlock_irqrestore(&fbc->lock, flags);
111 return ret;
112}
113EXPORT_SYMBOL(__percpu_counter_sum);
114
115int __percpu_counter_init(struct percpu_counter *fbc, s64 amount,
116 struct lock_class_key *key)
117{
118 raw_spin_lock_init(&fbc->lock);
119 lockdep_set_class(&fbc->lock, key);
120 fbc->count = amount;
121 fbc->counters = alloc_percpu(s32);
122 if (!fbc->counters)
123 return -ENOMEM;
124
125 debug_percpu_counter_activate(fbc);
126
127#ifdef CONFIG_HOTPLUG_CPU
128 INIT_LIST_HEAD(&fbc->list);
129 spin_lock(&percpu_counters_lock);
130 list_add(&fbc->list, &percpu_counters);
131 spin_unlock(&percpu_counters_lock);
132#endif
133 return 0;
134}
135EXPORT_SYMBOL(__percpu_counter_init);
136
137void percpu_counter_destroy(struct percpu_counter *fbc)
138{
139 if (!fbc->counters)
140 return;
141
142 debug_percpu_counter_deactivate(fbc);
143
144#ifdef CONFIG_HOTPLUG_CPU
145 spin_lock(&percpu_counters_lock);
146 list_del(&fbc->list);
147 spin_unlock(&percpu_counters_lock);
148#endif
149 free_percpu(fbc->counters);
150 fbc->counters = NULL;
151}
152EXPORT_SYMBOL(percpu_counter_destroy);
153
/* Batch size; starts at 32 and is recomputed by compute_batch_value(). */
int percpu_counter_batch __read_mostly = 32;
EXPORT_SYMBOL(percpu_counter_batch);
156
157static void compute_batch_value(void)
158{
159 int nr = num_online_cpus();
160
161 percpu_counter_batch = max(32, nr*2);
162}
163
164static int percpu_counter_hotcpu_callback(struct notifier_block *nb,
165 unsigned long action, void *hcpu)
166{
167#ifdef CONFIG_HOTPLUG_CPU
168 unsigned int cpu;
169 struct percpu_counter *fbc;
170
171 compute_batch_value();
172 if (action != CPU_DEAD && action != CPU_DEAD_FROZEN)
173 return NOTIFY_OK;
174
175 cpu = (unsigned long)hcpu;
176 spin_lock(&percpu_counters_lock);
177 list_for_each_entry(fbc, &percpu_counters, list) {
178 s32 *pcount;
179 unsigned long flags;
180
181 raw_spin_lock_irqsave(&fbc->lock, flags);
182 pcount = per_cpu_ptr(fbc->counters, cpu);
183 fbc->count += *pcount;
184 *pcount = 0;
185 raw_spin_unlock_irqrestore(&fbc->lock, flags);
186 }
187 spin_unlock(&percpu_counters_lock);
188#endif
189 return NOTIFY_OK;
190}
191
192/*
193 * Compare counter against given value.
194 * Return 1 if greater, 0 if equal and -1 if less
195 */
196int percpu_counter_compare(struct percpu_counter *fbc, s64 rhs)
197{
198 s64 count;
199
200 count = percpu_counter_read(fbc);
201 /* Check to see if rough count will be sufficient for comparison */
202 if (abs(count - rhs) > (percpu_counter_batch*num_online_cpus())) {
203 if (count > rhs)
204 return 1;
205 else
206 return -1;
207 }
208 /* Need to use precise count */
209 count = percpu_counter_sum(fbc);
210 if (count > rhs)
211 return 1;
212 else if (count < rhs)
213 return -1;
214 else
215 return 0;
216}
217EXPORT_SYMBOL(percpu_counter_compare);
218
/*
 * Boot-time setup: compute the initial batch size and register
 * percpu_counter_hotcpu_callback() as a CPU hotplug notifier with priority 0.
 * Always returns 0.
 */
static int __init percpu_counter_startup(void)
{
	compute_batch_value();
	hotcpu_notifier(percpu_counter_hotcpu_callback, 0);
	return 0;
}
module_init(percpu_counter_startup);
1// SPDX-License-Identifier: GPL-2.0
2/*
3 * Fast batching percpu counters.
4 */
5
6#include <linux/percpu_counter.h>
7#include <linux/notifier.h>
8#include <linux/mutex.h>
9#include <linux/init.h>
10#include <linux/cpu.h>
11#include <linux/module.h>
12#include <linux/debugobjects.h>
13
#ifdef CONFIG_HOTPLUG_CPU
/* Every initialised counter is linked here so the CPU-dead callback can walk them. */
static LIST_HEAD(percpu_counters);
/* Held (with interrupts disabled) around every change to or walk of percpu_counters. */
static DEFINE_SPINLOCK(percpu_counters_lock);
#endif
18
19#ifdef CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER
20
21static struct debug_obj_descr percpu_counter_debug_descr;
22
23static bool percpu_counter_fixup_free(void *addr, enum debug_obj_state state)
24{
25 struct percpu_counter *fbc = addr;
26
27 switch (state) {
28 case ODEBUG_STATE_ACTIVE:
29 percpu_counter_destroy(fbc);
30 debug_object_free(fbc, &percpu_counter_debug_descr);
31 return true;
32 default:
33 return false;
34 }
35}
36
/*
 * debugobjects descriptor used for every percpu counter tracked by this file;
 * only the free-time fixup hook is provided.
 */
static struct debug_obj_descr percpu_counter_debug_descr = {
	.name = "percpu_counter",
	.fixup_free = percpu_counter_fixup_free,
};
41
42static inline void debug_percpu_counter_activate(struct percpu_counter *fbc)
43{
44 debug_object_init(fbc, &percpu_counter_debug_descr);
45 debug_object_activate(fbc, &percpu_counter_debug_descr);
46}
47
48static inline void debug_percpu_counter_deactivate(struct percpu_counter *fbc)
49{
50 debug_object_deactivate(fbc, &percpu_counter_debug_descr);
51 debug_object_free(fbc, &percpu_counter_debug_descr);
52}
53
54#else /* CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER */
/* No-op variant used when CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER is not set. */
static inline void debug_percpu_counter_activate(struct percpu_counter *fbc)
{ }
/* No-op variant used when CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER is not set. */
static inline void debug_percpu_counter_deactivate(struct percpu_counter *fbc)
{ }
59#endif /* CONFIG_DEBUG_OBJECTS_PERCPU_COUNTER */
60
61void percpu_counter_set(struct percpu_counter *fbc, s64 amount)
62{
63 int cpu;
64 unsigned long flags;
65
66 raw_spin_lock_irqsave(&fbc->lock, flags);
67 for_each_possible_cpu(cpu) {
68 s32 *pcount = per_cpu_ptr(fbc->counters, cpu);
69 *pcount = 0;
70 }
71 fbc->count = amount;
72 raw_spin_unlock_irqrestore(&fbc->lock, flags);
73}
74EXPORT_SYMBOL(percpu_counter_set);
75
76/**
77 * This function is both preempt and irq safe. The former is due to explicit
78 * preemption disable. The latter is guaranteed by the fact that the slow path
79 * is explicitly protected by an irq-safe spinlock whereas the fast patch uses
80 * this_cpu_add which is irq-safe by definition. Hence there is no need muck
81 * with irq state before calling this one
82 */
83void percpu_counter_add_batch(struct percpu_counter *fbc, s64 amount, s32 batch)
84{
85 s64 count;
86
87 preempt_disable();
88 count = __this_cpu_read(*fbc->counters) + amount;
89 if (count >= batch || count <= -batch) {
90 unsigned long flags;
91 raw_spin_lock_irqsave(&fbc->lock, flags);
92 fbc->count += count;
93 __this_cpu_sub(*fbc->counters, count - amount);
94 raw_spin_unlock_irqrestore(&fbc->lock, flags);
95 } else {
96 this_cpu_add(*fbc->counters, amount);
97 }
98 preempt_enable();
99}
100EXPORT_SYMBOL(percpu_counter_add_batch);
101
102/*
103 * Add up all the per-cpu counts, return the result. This is a more accurate
104 * but much slower version of percpu_counter_read_positive()
105 */
106s64 __percpu_counter_sum(struct percpu_counter *fbc)
107{
108 s64 ret;
109 int cpu;
110 unsigned long flags;
111
112 raw_spin_lock_irqsave(&fbc->lock, flags);
113 ret = fbc->count;
114 for_each_online_cpu(cpu) {
115 s32 *pcount = per_cpu_ptr(fbc->counters, cpu);
116 ret += *pcount;
117 }
118 raw_spin_unlock_irqrestore(&fbc->lock, flags);
119 return ret;
120}
121EXPORT_SYMBOL(__percpu_counter_sum);
122
123int __percpu_counter_init(struct percpu_counter *fbc, s64 amount, gfp_t gfp,
124 struct lock_class_key *key)
125{
126 unsigned long flags __maybe_unused;
127
128 raw_spin_lock_init(&fbc->lock);
129 lockdep_set_class(&fbc->lock, key);
130 fbc->count = amount;
131 fbc->counters = alloc_percpu_gfp(s32, gfp);
132 if (!fbc->counters)
133 return -ENOMEM;
134
135 debug_percpu_counter_activate(fbc);
136
137#ifdef CONFIG_HOTPLUG_CPU
138 INIT_LIST_HEAD(&fbc->list);
139 spin_lock_irqsave(&percpu_counters_lock, flags);
140 list_add(&fbc->list, &percpu_counters);
141 spin_unlock_irqrestore(&percpu_counters_lock, flags);
142#endif
143 return 0;
144}
145EXPORT_SYMBOL(__percpu_counter_init);
146
147void percpu_counter_destroy(struct percpu_counter *fbc)
148{
149 unsigned long flags __maybe_unused;
150
151 if (!fbc->counters)
152 return;
153
154 debug_percpu_counter_deactivate(fbc);
155
156#ifdef CONFIG_HOTPLUG_CPU
157 spin_lock_irqsave(&percpu_counters_lock, flags);
158 list_del(&fbc->list);
159 spin_unlock_irqrestore(&percpu_counters_lock, flags);
160#endif
161 free_percpu(fbc->counters);
162 fbc->counters = NULL;
163}
164EXPORT_SYMBOL(percpu_counter_destroy);
165
/* Batch size; starts at 32 and is recomputed by compute_batch_value(). */
int percpu_counter_batch __read_mostly = 32;
EXPORT_SYMBOL(percpu_counter_batch);
168
169static int compute_batch_value(unsigned int cpu)
170{
171 int nr = num_online_cpus();
172
173 percpu_counter_batch = max(32, nr*2);
174 return 0;
175}
176
/*
 * CPU hotplug callback registered for CPUHP_PERCPU_CNT_DEAD.
 *
 * Recomputes the batch size, then folds the per-cpu slot of @cpu into the
 * shared count of every registered counter and clears the slot.  The list
 * lock is taken with interrupts disabled, so the per-counter lock is taken
 * without saving irq state.  Always returns 0.
 */
static int percpu_counter_cpu_dead(unsigned int cpu)
{
#ifdef CONFIG_HOTPLUG_CPU
	struct percpu_counter *counter;

	compute_batch_value(cpu);

	spin_lock_irq(&percpu_counters_lock);
	list_for_each_entry(counter, &percpu_counters, list) {
		s32 *slot;

		raw_spin_lock(&counter->lock);
		slot = per_cpu_ptr(counter->counters, cpu);
		counter->count += *slot;
		*slot = 0;
		raw_spin_unlock(&counter->lock);
	}
	spin_unlock_irq(&percpu_counters_lock);
#endif
	return 0;
}
198
199/*
200 * Compare counter against given value.
201 * Return 1 if greater, 0 if equal and -1 if less
202 */
203int __percpu_counter_compare(struct percpu_counter *fbc, s64 rhs, s32 batch)
204{
205 s64 count;
206
207 count = percpu_counter_read(fbc);
208 /* Check to see if rough count will be sufficient for comparison */
209 if (abs(count - rhs) > (batch * num_online_cpus())) {
210 if (count > rhs)
211 return 1;
212 else
213 return -1;
214 }
215 /* Need to use precise count */
216 count = percpu_counter_sum(fbc);
217 if (count > rhs)
218 return 1;
219 else if (count < rhs)
220 return -1;
221 else
222 return 0;
223}
224EXPORT_SYMBOL(__percpu_counter_compare);
225
226static int __init percpu_counter_startup(void)
227{
228 int ret;
229
230 ret = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "lib/percpu_cnt:online",
231 compute_batch_value, NULL);
232 WARN_ON(ret < 0);
233 ret = cpuhp_setup_state_nocalls(CPUHP_PERCPU_CNT_DEAD,
234 "lib/percpu_cnt:dead", NULL,
235 percpu_counter_cpu_dead);
236 WARN_ON(ret < 0);
237 return 0;
238}
239module_init(percpu_counter_startup);