Linux Audio

Check our new training course

Loading...
v6.2
  1// SPDX-License-Identifier: GPL-2.0-only
  2/* Copyright (c) 2016 Facebook
  3 */
  4#include <linux/cpumask.h>
  5#include <linux/spinlock.h>
  6#include <linux/percpu.h>
  7
  8#include "bpf_lru_list.h"
  9
/* Number of nodes bpf_lru_list_pop_free_to_local() tries to hand to a
 * CPU-local free list per refill.  The same value is the scan budget
 * (lru->nr_scans) installed by bpf_lru_init() for the common LRU.
 */
#define LOCAL_FREE_TARGET		(128)
#define LOCAL_NR_SCANS			LOCAL_FREE_TARGET

/* Shrink target used by bpf_percpu_lru_pop_free() when a per-CPU free
 * list is empty.  The same value is the scan budget (lru->nr_scans)
 * installed by bpf_lru_init() for a per-CPU LRU.
 */
#define PERCPU_FREE_TARGET		(4)
#define PERCPU_NR_SCANS			PERCPU_FREE_TARGET

/* Helpers to get the local list index.  Local list types start at
 * BPF_LOCAL_LIST_T_OFFSET, so subtracting the offset yields the index
 * into bpf_lru_locallist::lists[].
 */
#define LOCAL_LIST_IDX(t)	((t) - BPF_LOCAL_LIST_T_OFFSET)
#define LOCAL_FREE_LIST_IDX	LOCAL_LIST_IDX(BPF_LRU_LOCAL_LIST_T_FREE)
#define LOCAL_PENDING_LIST_IDX	LOCAL_LIST_IDX(BPF_LRU_LOCAL_LIST_T_PENDING)
/* True for any list type at or above BPF_LOCAL_LIST_T_OFFSET */
#define IS_LOCAL_LIST_TYPE(t)	((t) >= BPF_LOCAL_LIST_T_OFFSET)
 21
 22static int get_next_cpu(int cpu)
 23{
 24	cpu = cpumask_next(cpu, cpu_possible_mask);
 25	if (cpu >= nr_cpu_ids)
 26		cpu = cpumask_first(cpu_possible_mask);
 27	return cpu;
 28}
 29
 30/* Local list helpers */
 31static struct list_head *local_free_list(struct bpf_lru_locallist *loc_l)
 32{
 33	return &loc_l->lists[LOCAL_FREE_LIST_IDX];
 34}
 35
 36static struct list_head *local_pending_list(struct bpf_lru_locallist *loc_l)
 37{
 38	return &loc_l->lists[LOCAL_PENDING_LIST_IDX];
 39}
 40
 41/* bpf_lru_node helpers */
 42static bool bpf_lru_node_is_ref(const struct bpf_lru_node *node)
 43{
 44	return node->ref;
 
 
 
 
 
 45}
 46
 47static void bpf_lru_list_count_inc(struct bpf_lru_list *l,
 48				   enum bpf_lru_list_type type)
 49{
 50	if (type < NR_BPF_LRU_LIST_COUNT)
 51		l->counts[type]++;
 52}
 53
 54static void bpf_lru_list_count_dec(struct bpf_lru_list *l,
 55				   enum bpf_lru_list_type type)
 56{
 57	if (type < NR_BPF_LRU_LIST_COUNT)
 58		l->counts[type]--;
 59}
 60
 61static void __bpf_lru_node_move_to_free(struct bpf_lru_list *l,
 62					struct bpf_lru_node *node,
 63					struct list_head *free_list,
 64					enum bpf_lru_list_type tgt_free_type)
 65{
 66	if (WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(node->type)))
 67		return;
 68
 69	/* If the removing node is the next_inactive_rotation candidate,
 70	 * move the next_inactive_rotation pointer also.
 71	 */
 72	if (&node->list == l->next_inactive_rotation)
 73		l->next_inactive_rotation = l->next_inactive_rotation->prev;
 74
 75	bpf_lru_list_count_dec(l, node->type);
 76
 77	node->type = tgt_free_type;
 78	list_move(&node->list, free_list);
 79}
 80
 81/* Move nodes from local list to the LRU list */
 82static void __bpf_lru_node_move_in(struct bpf_lru_list *l,
 83				   struct bpf_lru_node *node,
 84				   enum bpf_lru_list_type tgt_type)
 85{
 86	if (WARN_ON_ONCE(!IS_LOCAL_LIST_TYPE(node->type)) ||
 87	    WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(tgt_type)))
 88		return;
 89
 90	bpf_lru_list_count_inc(l, tgt_type);
 91	node->type = tgt_type;
 92	node->ref = 0;
 93	list_move(&node->list, &l->lists[tgt_type]);
 94}
 95
 96/* Move nodes between or within active and inactive list (like
 97 * active to inactive, inactive to active or tail of active back to
 98 * the head of active).
 99 */
100static void __bpf_lru_node_move(struct bpf_lru_list *l,
101				struct bpf_lru_node *node,
102				enum bpf_lru_list_type tgt_type)
103{
104	if (WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(node->type)) ||
105	    WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(tgt_type)))
106		return;
107
108	if (node->type != tgt_type) {
109		bpf_lru_list_count_dec(l, node->type);
110		bpf_lru_list_count_inc(l, tgt_type);
111		node->type = tgt_type;
112	}
113	node->ref = 0;
114
115	/* If the moving node is the next_inactive_rotation candidate,
116	 * move the next_inactive_rotation pointer also.
117	 */
118	if (&node->list == l->next_inactive_rotation)
119		l->next_inactive_rotation = l->next_inactive_rotation->prev;
120
121	list_move(&node->list, &l->lists[tgt_type]);
122}
123
124static bool bpf_lru_list_inactive_low(const struct bpf_lru_list *l)
125{
126	return l->counts[BPF_LRU_LIST_T_INACTIVE] <
127		l->counts[BPF_LRU_LIST_T_ACTIVE];
128}
129
130/* Rotate the active list:
131 * 1. Start from tail
132 * 2. If the node has the ref bit set, it will be rotated
133 *    back to the head of active list with the ref bit cleared.
134 *    Give this node one more chance to survive in the active list.
135 * 3. If the ref bit is not set, move it to the head of the
136 *    inactive list.
137 * 4. It will at most scan nr_scans nodes
138 */
139static void __bpf_lru_list_rotate_active(struct bpf_lru *lru,
140					 struct bpf_lru_list *l)
141{
142	struct list_head *active = &l->lists[BPF_LRU_LIST_T_ACTIVE];
143	struct bpf_lru_node *node, *tmp_node, *first_node;
144	unsigned int i = 0;
145
146	first_node = list_first_entry(active, struct bpf_lru_node, list);
147	list_for_each_entry_safe_reverse(node, tmp_node, active, list) {
148		if (bpf_lru_node_is_ref(node))
149			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_ACTIVE);
150		else
151			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_INACTIVE);
152
153		if (++i == lru->nr_scans || node == first_node)
154			break;
155	}
156}
157
158/* Rotate the inactive list.  It starts from the next_inactive_rotation
159 * 1. If the node has ref bit set, it will be moved to the head
160 *    of active list with the ref bit cleared.
161 * 2. If the node does not have ref bit set, it will leave it
162 *    at its current location (i.e. do nothing) so that it can
163 *    be considered during the next inactive_shrink.
164 * 3. It will at most scan nr_scans nodes
165 */
166static void __bpf_lru_list_rotate_inactive(struct bpf_lru *lru,
167					   struct bpf_lru_list *l)
168{
169	struct list_head *inactive = &l->lists[BPF_LRU_LIST_T_INACTIVE];
170	struct list_head *cur, *last, *next = inactive;
171	struct bpf_lru_node *node;
172	unsigned int i = 0;
173
174	if (list_empty(inactive))
175		return;
176
177	last = l->next_inactive_rotation->next;
178	if (last == inactive)
179		last = last->next;
180
181	cur = l->next_inactive_rotation;
182	while (i < lru->nr_scans) {
183		if (cur == inactive) {
184			cur = cur->prev;
185			continue;
186		}
187
188		node = list_entry(cur, struct bpf_lru_node, list);
189		next = cur->prev;
190		if (bpf_lru_node_is_ref(node))
191			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_ACTIVE);
192		if (cur == last)
193			break;
194		cur = next;
195		i++;
196	}
197
198	l->next_inactive_rotation = next;
199}
200
201/* Shrink the inactive list.  It starts from the tail of the
202 * inactive list and only move the nodes without the ref bit
203 * set to the designated free list.
204 */
205static unsigned int
206__bpf_lru_list_shrink_inactive(struct bpf_lru *lru,
207			       struct bpf_lru_list *l,
208			       unsigned int tgt_nshrink,
209			       struct list_head *free_list,
210			       enum bpf_lru_list_type tgt_free_type)
211{
212	struct list_head *inactive = &l->lists[BPF_LRU_LIST_T_INACTIVE];
213	struct bpf_lru_node *node, *tmp_node;
214	unsigned int nshrinked = 0;
215	unsigned int i = 0;
216
217	list_for_each_entry_safe_reverse(node, tmp_node, inactive, list) {
218		if (bpf_lru_node_is_ref(node)) {
219			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_ACTIVE);
220		} else if (lru->del_from_htab(lru->del_arg, node)) {
221			__bpf_lru_node_move_to_free(l, node, free_list,
222						    tgt_free_type);
223			if (++nshrinked == tgt_nshrink)
224				break;
225		}
226
227		if (++i == lru->nr_scans)
228			break;
229	}
230
231	return nshrinked;
232}
233
234/* 1. Rotate the active list (if needed)
235 * 2. Always rotate the inactive list
236 */
237static void __bpf_lru_list_rotate(struct bpf_lru *lru, struct bpf_lru_list *l)
238{
239	if (bpf_lru_list_inactive_low(l))
240		__bpf_lru_list_rotate_active(lru, l);
241
242	__bpf_lru_list_rotate_inactive(lru, l);
243}
244
245/* Calls __bpf_lru_list_shrink_inactive() to shrink some
246 * ref-bit-cleared nodes and move them to the designated
247 * free list.
248 *
249 * If it cannot get a free node after calling
250 * __bpf_lru_list_shrink_inactive().  It will just remove
251 * one node from either inactive or active list without
252 * honoring the ref-bit.  It prefers inactive list to active
253 * list in this situation.
254 */
255static unsigned int __bpf_lru_list_shrink(struct bpf_lru *lru,
256					  struct bpf_lru_list *l,
257					  unsigned int tgt_nshrink,
258					  struct list_head *free_list,
259					  enum bpf_lru_list_type tgt_free_type)
260
261{
262	struct bpf_lru_node *node, *tmp_node;
263	struct list_head *force_shrink_list;
264	unsigned int nshrinked;
265
266	nshrinked = __bpf_lru_list_shrink_inactive(lru, l, tgt_nshrink,
267						   free_list, tgt_free_type);
268	if (nshrinked)
269		return nshrinked;
270
271	/* Do a force shrink by ignoring the reference bit */
272	if (!list_empty(&l->lists[BPF_LRU_LIST_T_INACTIVE]))
273		force_shrink_list = &l->lists[BPF_LRU_LIST_T_INACTIVE];
274	else
275		force_shrink_list = &l->lists[BPF_LRU_LIST_T_ACTIVE];
276
277	list_for_each_entry_safe_reverse(node, tmp_node, force_shrink_list,
278					 list) {
279		if (lru->del_from_htab(lru->del_arg, node)) {
280			__bpf_lru_node_move_to_free(l, node, free_list,
281						    tgt_free_type);
282			return 1;
283		}
284	}
285
286	return 0;
287}
288
289/* Flush the nodes from the local pending list to the LRU list */
290static void __local_list_flush(struct bpf_lru_list *l,
291			       struct bpf_lru_locallist *loc_l)
292{
293	struct bpf_lru_node *node, *tmp_node;
294
295	list_for_each_entry_safe_reverse(node, tmp_node,
296					 local_pending_list(loc_l), list) {
297		if (bpf_lru_node_is_ref(node))
298			__bpf_lru_node_move_in(l, node, BPF_LRU_LIST_T_ACTIVE);
299		else
300			__bpf_lru_node_move_in(l, node,
301					       BPF_LRU_LIST_T_INACTIVE);
302	}
303}
304
305static void bpf_lru_list_push_free(struct bpf_lru_list *l,
306				   struct bpf_lru_node *node)
307{
308	unsigned long flags;
309
310	if (WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(node->type)))
311		return;
312
313	raw_spin_lock_irqsave(&l->lock, flags);
314	__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_FREE);
315	raw_spin_unlock_irqrestore(&l->lock, flags);
316}
317
318static void bpf_lru_list_pop_free_to_local(struct bpf_lru *lru,
319					   struct bpf_lru_locallist *loc_l)
320{
321	struct bpf_lru_list *l = &lru->common_lru.lru_list;
322	struct bpf_lru_node *node, *tmp_node;
323	unsigned int nfree = 0;
324
325	raw_spin_lock(&l->lock);
326
327	__local_list_flush(l, loc_l);
328
329	__bpf_lru_list_rotate(lru, l);
330
331	list_for_each_entry_safe(node, tmp_node, &l->lists[BPF_LRU_LIST_T_FREE],
332				 list) {
333		__bpf_lru_node_move_to_free(l, node, local_free_list(loc_l),
334					    BPF_LRU_LOCAL_LIST_T_FREE);
335		if (++nfree == LOCAL_FREE_TARGET)
336			break;
337	}
338
339	if (nfree < LOCAL_FREE_TARGET)
340		__bpf_lru_list_shrink(lru, l, LOCAL_FREE_TARGET - nfree,
341				      local_free_list(loc_l),
342				      BPF_LRU_LOCAL_LIST_T_FREE);
343
344	raw_spin_unlock(&l->lock);
345}
346
347static void __local_list_add_pending(struct bpf_lru *lru,
348				     struct bpf_lru_locallist *loc_l,
349				     int cpu,
350				     struct bpf_lru_node *node,
351				     u32 hash)
352{
353	*(u32 *)((void *)node + lru->hash_offset) = hash;
354	node->cpu = cpu;
355	node->type = BPF_LRU_LOCAL_LIST_T_PENDING;
356	node->ref = 0;
357	list_add(&node->list, local_pending_list(loc_l));
358}
359
360static struct bpf_lru_node *
361__local_list_pop_free(struct bpf_lru_locallist *loc_l)
362{
363	struct bpf_lru_node *node;
364
365	node = list_first_entry_or_null(local_free_list(loc_l),
366					struct bpf_lru_node,
367					list);
368	if (node)
369		list_del(&node->list);
370
371	return node;
372}
373
374static struct bpf_lru_node *
375__local_list_pop_pending(struct bpf_lru *lru, struct bpf_lru_locallist *loc_l)
376{
377	struct bpf_lru_node *node;
378	bool force = false;
379
380ignore_ref:
381	/* Get from the tail (i.e. older element) of the pending list. */
382	list_for_each_entry_reverse(node, local_pending_list(loc_l),
383				    list) {
384		if ((!bpf_lru_node_is_ref(node) || force) &&
385		    lru->del_from_htab(lru->del_arg, node)) {
386			list_del(&node->list);
387			return node;
388		}
389	}
390
391	if (!force) {
392		force = true;
393		goto ignore_ref;
394	}
395
396	return NULL;
397}
398
399static struct bpf_lru_node *bpf_percpu_lru_pop_free(struct bpf_lru *lru,
400						    u32 hash)
401{
402	struct list_head *free_list;
403	struct bpf_lru_node *node = NULL;
404	struct bpf_lru_list *l;
405	unsigned long flags;
406	int cpu = raw_smp_processor_id();
407
408	l = per_cpu_ptr(lru->percpu_lru, cpu);
409
410	raw_spin_lock_irqsave(&l->lock, flags);
411
412	__bpf_lru_list_rotate(lru, l);
413
414	free_list = &l->lists[BPF_LRU_LIST_T_FREE];
415	if (list_empty(free_list))
416		__bpf_lru_list_shrink(lru, l, PERCPU_FREE_TARGET, free_list,
417				      BPF_LRU_LIST_T_FREE);
418
419	if (!list_empty(free_list)) {
420		node = list_first_entry(free_list, struct bpf_lru_node, list);
421		*(u32 *)((void *)node + lru->hash_offset) = hash;
422		node->ref = 0;
423		__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_INACTIVE);
424	}
425
426	raw_spin_unlock_irqrestore(&l->lock, flags);
427
428	return node;
429}
430
431static struct bpf_lru_node *bpf_common_lru_pop_free(struct bpf_lru *lru,
432						    u32 hash)
433{
434	struct bpf_lru_locallist *loc_l, *steal_loc_l;
435	struct bpf_common_lru *clru = &lru->common_lru;
436	struct bpf_lru_node *node;
437	int steal, first_steal;
438	unsigned long flags;
439	int cpu = raw_smp_processor_id();
440
441	loc_l = per_cpu_ptr(clru->local_list, cpu);
442
443	raw_spin_lock_irqsave(&loc_l->lock, flags);
444
445	node = __local_list_pop_free(loc_l);
446	if (!node) {
447		bpf_lru_list_pop_free_to_local(lru, loc_l);
448		node = __local_list_pop_free(loc_l);
449	}
450
451	if (node)
452		__local_list_add_pending(lru, loc_l, cpu, node, hash);
453
454	raw_spin_unlock_irqrestore(&loc_l->lock, flags);
455
456	if (node)
457		return node;
458
459	/* No free nodes found from the local free list and
460	 * the global LRU list.
461	 *
462	 * Steal from the local free/pending list of the
463	 * current CPU and remote CPU in RR.  It starts
464	 * with the loc_l->next_steal CPU.
465	 */
466
467	first_steal = loc_l->next_steal;
468	steal = first_steal;
469	do {
470		steal_loc_l = per_cpu_ptr(clru->local_list, steal);
471
472		raw_spin_lock_irqsave(&steal_loc_l->lock, flags);
473
474		node = __local_list_pop_free(steal_loc_l);
475		if (!node)
476			node = __local_list_pop_pending(lru, steal_loc_l);
477
478		raw_spin_unlock_irqrestore(&steal_loc_l->lock, flags);
479
480		steal = get_next_cpu(steal);
481	} while (!node && steal != first_steal);
482
483	loc_l->next_steal = steal;
484
485	if (node) {
486		raw_spin_lock_irqsave(&loc_l->lock, flags);
487		__local_list_add_pending(lru, loc_l, cpu, node, hash);
488		raw_spin_unlock_irqrestore(&loc_l->lock, flags);
489	}
490
491	return node;
492}
493
494struct bpf_lru_node *bpf_lru_pop_free(struct bpf_lru *lru, u32 hash)
495{
496	if (lru->percpu)
497		return bpf_percpu_lru_pop_free(lru, hash);
498	else
499		return bpf_common_lru_pop_free(lru, hash);
500}
501
502static void bpf_common_lru_push_free(struct bpf_lru *lru,
503				     struct bpf_lru_node *node)
504{
505	u8 node_type = READ_ONCE(node->type);
506	unsigned long flags;
507
508	if (WARN_ON_ONCE(node_type == BPF_LRU_LIST_T_FREE) ||
509	    WARN_ON_ONCE(node_type == BPF_LRU_LOCAL_LIST_T_FREE))
510		return;
511
512	if (node_type == BPF_LRU_LOCAL_LIST_T_PENDING) {
513		struct bpf_lru_locallist *loc_l;
514
515		loc_l = per_cpu_ptr(lru->common_lru.local_list, node->cpu);
516
517		raw_spin_lock_irqsave(&loc_l->lock, flags);
518
519		if (unlikely(node->type != BPF_LRU_LOCAL_LIST_T_PENDING)) {
520			raw_spin_unlock_irqrestore(&loc_l->lock, flags);
521			goto check_lru_list;
522		}
523
524		node->type = BPF_LRU_LOCAL_LIST_T_FREE;
525		node->ref = 0;
526		list_move(&node->list, local_free_list(loc_l));
527
528		raw_spin_unlock_irqrestore(&loc_l->lock, flags);
529		return;
530	}
531
532check_lru_list:
533	bpf_lru_list_push_free(&lru->common_lru.lru_list, node);
534}
535
536static void bpf_percpu_lru_push_free(struct bpf_lru *lru,
537				     struct bpf_lru_node *node)
538{
539	struct bpf_lru_list *l;
540	unsigned long flags;
541
542	l = per_cpu_ptr(lru->percpu_lru, node->cpu);
543
544	raw_spin_lock_irqsave(&l->lock, flags);
545
546	__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_FREE);
547
548	raw_spin_unlock_irqrestore(&l->lock, flags);
549}
550
551void bpf_lru_push_free(struct bpf_lru *lru, struct bpf_lru_node *node)
552{
553	if (lru->percpu)
554		bpf_percpu_lru_push_free(lru, node);
555	else
556		bpf_common_lru_push_free(lru, node);
557}
558
559static void bpf_common_lru_populate(struct bpf_lru *lru, void *buf,
560				    u32 node_offset, u32 elem_size,
561				    u32 nr_elems)
562{
563	struct bpf_lru_list *l = &lru->common_lru.lru_list;
564	u32 i;
565
566	for (i = 0; i < nr_elems; i++) {
567		struct bpf_lru_node *node;
568
569		node = (struct bpf_lru_node *)(buf + node_offset);
570		node->type = BPF_LRU_LIST_T_FREE;
571		node->ref = 0;
572		list_add(&node->list, &l->lists[BPF_LRU_LIST_T_FREE]);
573		buf += elem_size;
574	}
575}
576
577static void bpf_percpu_lru_populate(struct bpf_lru *lru, void *buf,
578				    u32 node_offset, u32 elem_size,
579				    u32 nr_elems)
580{
581	u32 i, pcpu_entries;
582	int cpu;
583	struct bpf_lru_list *l;
584
585	pcpu_entries = nr_elems / num_possible_cpus();
586
587	i = 0;
588
589	for_each_possible_cpu(cpu) {
590		struct bpf_lru_node *node;
591
592		l = per_cpu_ptr(lru->percpu_lru, cpu);
593again:
594		node = (struct bpf_lru_node *)(buf + node_offset);
595		node->cpu = cpu;
596		node->type = BPF_LRU_LIST_T_FREE;
597		node->ref = 0;
598		list_add(&node->list, &l->lists[BPF_LRU_LIST_T_FREE]);
599		i++;
600		buf += elem_size;
601		if (i == nr_elems)
602			break;
603		if (i % pcpu_entries)
604			goto again;
605	}
606}
607
608void bpf_lru_populate(struct bpf_lru *lru, void *buf, u32 node_offset,
609		      u32 elem_size, u32 nr_elems)
610{
611	if (lru->percpu)
612		bpf_percpu_lru_populate(lru, buf, node_offset, elem_size,
613					nr_elems);
614	else
615		bpf_common_lru_populate(lru, buf, node_offset, elem_size,
616					nr_elems);
617}
618
619static void bpf_lru_locallist_init(struct bpf_lru_locallist *loc_l, int cpu)
620{
621	int i;
622
623	for (i = 0; i < NR_BPF_LRU_LOCAL_LIST_T; i++)
624		INIT_LIST_HEAD(&loc_l->lists[i]);
625
626	loc_l->next_steal = cpu;
627
628	raw_spin_lock_init(&loc_l->lock);
629}
630
631static void bpf_lru_list_init(struct bpf_lru_list *l)
632{
633	int i;
634
635	for (i = 0; i < NR_BPF_LRU_LIST_T; i++)
636		INIT_LIST_HEAD(&l->lists[i]);
637
638	for (i = 0; i < NR_BPF_LRU_LIST_COUNT; i++)
639		l->counts[i] = 0;
640
641	l->next_inactive_rotation = &l->lists[BPF_LRU_LIST_T_INACTIVE];
642
643	raw_spin_lock_init(&l->lock);
644}
645
646int bpf_lru_init(struct bpf_lru *lru, bool percpu, u32 hash_offset,
647		 del_from_htab_func del_from_htab, void *del_arg)
648{
649	int cpu;
650
651	if (percpu) {
652		lru->percpu_lru = alloc_percpu(struct bpf_lru_list);
653		if (!lru->percpu_lru)
654			return -ENOMEM;
655
656		for_each_possible_cpu(cpu) {
657			struct bpf_lru_list *l;
658
659			l = per_cpu_ptr(lru->percpu_lru, cpu);
660			bpf_lru_list_init(l);
661		}
662		lru->nr_scans = PERCPU_NR_SCANS;
663	} else {
664		struct bpf_common_lru *clru = &lru->common_lru;
665
666		clru->local_list = alloc_percpu(struct bpf_lru_locallist);
667		if (!clru->local_list)
668			return -ENOMEM;
669
670		for_each_possible_cpu(cpu) {
671			struct bpf_lru_locallist *loc_l;
672
673			loc_l = per_cpu_ptr(clru->local_list, cpu);
674			bpf_lru_locallist_init(loc_l, cpu);
675		}
676
677		bpf_lru_list_init(&clru->lru_list);
678		lru->nr_scans = LOCAL_NR_SCANS;
679	}
680
681	lru->percpu = percpu;
682	lru->del_from_htab = del_from_htab;
683	lru->del_arg = del_arg;
684	lru->hash_offset = hash_offset;
685
686	return 0;
687}
688
689void bpf_lru_destroy(struct bpf_lru *lru)
690{
691	if (lru->percpu)
692		free_percpu(lru->percpu_lru);
693	else
694		free_percpu(lru->common_lru.local_list);
695}
v6.8
  1// SPDX-License-Identifier: GPL-2.0-only
  2/* Copyright (c) 2016 Facebook
  3 */
  4#include <linux/cpumask.h>
  5#include <linux/spinlock.h>
  6#include <linux/percpu.h>
  7
  8#include "bpf_lru_list.h"
  9
/* Number of nodes bpf_lru_list_pop_free_to_local() tries to hand to a
 * CPU-local free list per refill.  LOCAL_NR_SCANS aliases it
 * (presumably the common-LRU scan budget - confirm at its user).
 */
#define LOCAL_FREE_TARGET		(128)
#define LOCAL_NR_SCANS			LOCAL_FREE_TARGET

/* Shrink target used by bpf_percpu_lru_pop_free() when a per-CPU free
 * list is empty.  PERCPU_NR_SCANS aliases it (presumably the per-CPU
 * scan budget - confirm at its user).
 */
#define PERCPU_FREE_TARGET		(4)
#define PERCPU_NR_SCANS			PERCPU_FREE_TARGET

/* Helpers to get the local list index.  Local list types start at
 * BPF_LOCAL_LIST_T_OFFSET, so subtracting the offset yields the index
 * into bpf_lru_locallist::lists[].
 */
#define LOCAL_LIST_IDX(t)	((t) - BPF_LOCAL_LIST_T_OFFSET)
#define LOCAL_FREE_LIST_IDX	LOCAL_LIST_IDX(BPF_LRU_LOCAL_LIST_T_FREE)
#define LOCAL_PENDING_LIST_IDX	LOCAL_LIST_IDX(BPF_LRU_LOCAL_LIST_T_PENDING)
/* True for any list type at or above BPF_LOCAL_LIST_T_OFFSET */
#define IS_LOCAL_LIST_TYPE(t)	((t) >= BPF_LOCAL_LIST_T_OFFSET)
 21
 22static int get_next_cpu(int cpu)
 23{
 24	cpu = cpumask_next(cpu, cpu_possible_mask);
 25	if (cpu >= nr_cpu_ids)
 26		cpu = cpumask_first(cpu_possible_mask);
 27	return cpu;
 28}
 29
 30/* Local list helpers */
 31static struct list_head *local_free_list(struct bpf_lru_locallist *loc_l)
 32{
 33	return &loc_l->lists[LOCAL_FREE_LIST_IDX];
 34}
 35
 36static struct list_head *local_pending_list(struct bpf_lru_locallist *loc_l)
 37{
 38	return &loc_l->lists[LOCAL_PENDING_LIST_IDX];
 39}
 40
 41/* bpf_lru_node helpers */
 42static bool bpf_lru_node_is_ref(const struct bpf_lru_node *node)
 43{
 44	return READ_ONCE(node->ref);
 45}
 46
/* Clear @node's reference bit with a single marked store (WRITE_ONCE),
 * the counterpart of the READ_ONCE() load in bpf_lru_node_is_ref().
 */
static void bpf_lru_node_clear_ref(struct bpf_lru_node *node)
{
	WRITE_ONCE(node->ref, 0);
}
 51
 52static void bpf_lru_list_count_inc(struct bpf_lru_list *l,
 53				   enum bpf_lru_list_type type)
 54{
 55	if (type < NR_BPF_LRU_LIST_COUNT)
 56		l->counts[type]++;
 57}
 58
 59static void bpf_lru_list_count_dec(struct bpf_lru_list *l,
 60				   enum bpf_lru_list_type type)
 61{
 62	if (type < NR_BPF_LRU_LIST_COUNT)
 63		l->counts[type]--;
 64}
 65
 66static void __bpf_lru_node_move_to_free(struct bpf_lru_list *l,
 67					struct bpf_lru_node *node,
 68					struct list_head *free_list,
 69					enum bpf_lru_list_type tgt_free_type)
 70{
 71	if (WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(node->type)))
 72		return;
 73
 74	/* If the removing node is the next_inactive_rotation candidate,
 75	 * move the next_inactive_rotation pointer also.
 76	 */
 77	if (&node->list == l->next_inactive_rotation)
 78		l->next_inactive_rotation = l->next_inactive_rotation->prev;
 79
 80	bpf_lru_list_count_dec(l, node->type);
 81
 82	node->type = tgt_free_type;
 83	list_move(&node->list, free_list);
 84}
 85
 86/* Move nodes from local list to the LRU list */
 87static void __bpf_lru_node_move_in(struct bpf_lru_list *l,
 88				   struct bpf_lru_node *node,
 89				   enum bpf_lru_list_type tgt_type)
 90{
 91	if (WARN_ON_ONCE(!IS_LOCAL_LIST_TYPE(node->type)) ||
 92	    WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(tgt_type)))
 93		return;
 94
 95	bpf_lru_list_count_inc(l, tgt_type);
 96	node->type = tgt_type;
 97	bpf_lru_node_clear_ref(node);
 98	list_move(&node->list, &l->lists[tgt_type]);
 99}
100
101/* Move nodes between or within active and inactive list (like
102 * active to inactive, inactive to active or tail of active back to
103 * the head of active).
104 */
105static void __bpf_lru_node_move(struct bpf_lru_list *l,
106				struct bpf_lru_node *node,
107				enum bpf_lru_list_type tgt_type)
108{
109	if (WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(node->type)) ||
110	    WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(tgt_type)))
111		return;
112
113	if (node->type != tgt_type) {
114		bpf_lru_list_count_dec(l, node->type);
115		bpf_lru_list_count_inc(l, tgt_type);
116		node->type = tgt_type;
117	}
118	bpf_lru_node_clear_ref(node);
119
120	/* If the moving node is the next_inactive_rotation candidate,
121	 * move the next_inactive_rotation pointer also.
122	 */
123	if (&node->list == l->next_inactive_rotation)
124		l->next_inactive_rotation = l->next_inactive_rotation->prev;
125
126	list_move(&node->list, &l->lists[tgt_type]);
127}
128
129static bool bpf_lru_list_inactive_low(const struct bpf_lru_list *l)
130{
131	return l->counts[BPF_LRU_LIST_T_INACTIVE] <
132		l->counts[BPF_LRU_LIST_T_ACTIVE];
133}
134
135/* Rotate the active list:
136 * 1. Start from tail
137 * 2. If the node has the ref bit set, it will be rotated
138 *    back to the head of active list with the ref bit cleared.
139 *    Give this node one more chance to survive in the active list.
140 * 3. If the ref bit is not set, move it to the head of the
141 *    inactive list.
142 * 4. It will at most scan nr_scans nodes
143 */
144static void __bpf_lru_list_rotate_active(struct bpf_lru *lru,
145					 struct bpf_lru_list *l)
146{
147	struct list_head *active = &l->lists[BPF_LRU_LIST_T_ACTIVE];
148	struct bpf_lru_node *node, *tmp_node, *first_node;
149	unsigned int i = 0;
150
151	first_node = list_first_entry(active, struct bpf_lru_node, list);
152	list_for_each_entry_safe_reverse(node, tmp_node, active, list) {
153		if (bpf_lru_node_is_ref(node))
154			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_ACTIVE);
155		else
156			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_INACTIVE);
157
158		if (++i == lru->nr_scans || node == first_node)
159			break;
160	}
161}
162
163/* Rotate the inactive list.  It starts from the next_inactive_rotation
164 * 1. If the node has ref bit set, it will be moved to the head
165 *    of active list with the ref bit cleared.
166 * 2. If the node does not have ref bit set, it will leave it
167 *    at its current location (i.e. do nothing) so that it can
168 *    be considered during the next inactive_shrink.
169 * 3. It will at most scan nr_scans nodes
170 */
171static void __bpf_lru_list_rotate_inactive(struct bpf_lru *lru,
172					   struct bpf_lru_list *l)
173{
174	struct list_head *inactive = &l->lists[BPF_LRU_LIST_T_INACTIVE];
175	struct list_head *cur, *last, *next = inactive;
176	struct bpf_lru_node *node;
177	unsigned int i = 0;
178
179	if (list_empty(inactive))
180		return;
181
182	last = l->next_inactive_rotation->next;
183	if (last == inactive)
184		last = last->next;
185
186	cur = l->next_inactive_rotation;
187	while (i < lru->nr_scans) {
188		if (cur == inactive) {
189			cur = cur->prev;
190			continue;
191		}
192
193		node = list_entry(cur, struct bpf_lru_node, list);
194		next = cur->prev;
195		if (bpf_lru_node_is_ref(node))
196			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_ACTIVE);
197		if (cur == last)
198			break;
199		cur = next;
200		i++;
201	}
202
203	l->next_inactive_rotation = next;
204}
205
206/* Shrink the inactive list.  It starts from the tail of the
207 * inactive list and only move the nodes without the ref bit
208 * set to the designated free list.
209 */
210static unsigned int
211__bpf_lru_list_shrink_inactive(struct bpf_lru *lru,
212			       struct bpf_lru_list *l,
213			       unsigned int tgt_nshrink,
214			       struct list_head *free_list,
215			       enum bpf_lru_list_type tgt_free_type)
216{
217	struct list_head *inactive = &l->lists[BPF_LRU_LIST_T_INACTIVE];
218	struct bpf_lru_node *node, *tmp_node;
219	unsigned int nshrinked = 0;
220	unsigned int i = 0;
221
222	list_for_each_entry_safe_reverse(node, tmp_node, inactive, list) {
223		if (bpf_lru_node_is_ref(node)) {
224			__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_ACTIVE);
225		} else if (lru->del_from_htab(lru->del_arg, node)) {
226			__bpf_lru_node_move_to_free(l, node, free_list,
227						    tgt_free_type);
228			if (++nshrinked == tgt_nshrink)
229				break;
230		}
231
232		if (++i == lru->nr_scans)
233			break;
234	}
235
236	return nshrinked;
237}
238
239/* 1. Rotate the active list (if needed)
240 * 2. Always rotate the inactive list
241 */
242static void __bpf_lru_list_rotate(struct bpf_lru *lru, struct bpf_lru_list *l)
243{
244	if (bpf_lru_list_inactive_low(l))
245		__bpf_lru_list_rotate_active(lru, l);
246
247	__bpf_lru_list_rotate_inactive(lru, l);
248}
249
250/* Calls __bpf_lru_list_shrink_inactive() to shrink some
251 * ref-bit-cleared nodes and move them to the designated
252 * free list.
253 *
254 * If it cannot get a free node after calling
255 * __bpf_lru_list_shrink_inactive().  It will just remove
256 * one node from either inactive or active list without
257 * honoring the ref-bit.  It prefers inactive list to active
258 * list in this situation.
259 */
260static unsigned int __bpf_lru_list_shrink(struct bpf_lru *lru,
261					  struct bpf_lru_list *l,
262					  unsigned int tgt_nshrink,
263					  struct list_head *free_list,
264					  enum bpf_lru_list_type tgt_free_type)
265
266{
267	struct bpf_lru_node *node, *tmp_node;
268	struct list_head *force_shrink_list;
269	unsigned int nshrinked;
270
271	nshrinked = __bpf_lru_list_shrink_inactive(lru, l, tgt_nshrink,
272						   free_list, tgt_free_type);
273	if (nshrinked)
274		return nshrinked;
275
276	/* Do a force shrink by ignoring the reference bit */
277	if (!list_empty(&l->lists[BPF_LRU_LIST_T_INACTIVE]))
278		force_shrink_list = &l->lists[BPF_LRU_LIST_T_INACTIVE];
279	else
280		force_shrink_list = &l->lists[BPF_LRU_LIST_T_ACTIVE];
281
282	list_for_each_entry_safe_reverse(node, tmp_node, force_shrink_list,
283					 list) {
284		if (lru->del_from_htab(lru->del_arg, node)) {
285			__bpf_lru_node_move_to_free(l, node, free_list,
286						    tgt_free_type);
287			return 1;
288		}
289	}
290
291	return 0;
292}
293
294/* Flush the nodes from the local pending list to the LRU list */
295static void __local_list_flush(struct bpf_lru_list *l,
296			       struct bpf_lru_locallist *loc_l)
297{
298	struct bpf_lru_node *node, *tmp_node;
299
300	list_for_each_entry_safe_reverse(node, tmp_node,
301					 local_pending_list(loc_l), list) {
302		if (bpf_lru_node_is_ref(node))
303			__bpf_lru_node_move_in(l, node, BPF_LRU_LIST_T_ACTIVE);
304		else
305			__bpf_lru_node_move_in(l, node,
306					       BPF_LRU_LIST_T_INACTIVE);
307	}
308}
309
310static void bpf_lru_list_push_free(struct bpf_lru_list *l,
311				   struct bpf_lru_node *node)
312{
313	unsigned long flags;
314
315	if (WARN_ON_ONCE(IS_LOCAL_LIST_TYPE(node->type)))
316		return;
317
318	raw_spin_lock_irqsave(&l->lock, flags);
319	__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_FREE);
320	raw_spin_unlock_irqrestore(&l->lock, flags);
321}
322
323static void bpf_lru_list_pop_free_to_local(struct bpf_lru *lru,
324					   struct bpf_lru_locallist *loc_l)
325{
326	struct bpf_lru_list *l = &lru->common_lru.lru_list;
327	struct bpf_lru_node *node, *tmp_node;
328	unsigned int nfree = 0;
329
330	raw_spin_lock(&l->lock);
331
332	__local_list_flush(l, loc_l);
333
334	__bpf_lru_list_rotate(lru, l);
335
336	list_for_each_entry_safe(node, tmp_node, &l->lists[BPF_LRU_LIST_T_FREE],
337				 list) {
338		__bpf_lru_node_move_to_free(l, node, local_free_list(loc_l),
339					    BPF_LRU_LOCAL_LIST_T_FREE);
340		if (++nfree == LOCAL_FREE_TARGET)
341			break;
342	}
343
344	if (nfree < LOCAL_FREE_TARGET)
345		__bpf_lru_list_shrink(lru, l, LOCAL_FREE_TARGET - nfree,
346				      local_free_list(loc_l),
347				      BPF_LRU_LOCAL_LIST_T_FREE);
348
349	raw_spin_unlock(&l->lock);
350}
351
352static void __local_list_add_pending(struct bpf_lru *lru,
353				     struct bpf_lru_locallist *loc_l,
354				     int cpu,
355				     struct bpf_lru_node *node,
356				     u32 hash)
357{
358	*(u32 *)((void *)node + lru->hash_offset) = hash;
359	node->cpu = cpu;
360	node->type = BPF_LRU_LOCAL_LIST_T_PENDING;
361	bpf_lru_node_clear_ref(node);
362	list_add(&node->list, local_pending_list(loc_l));
363}
364
365static struct bpf_lru_node *
366__local_list_pop_free(struct bpf_lru_locallist *loc_l)
367{
368	struct bpf_lru_node *node;
369
370	node = list_first_entry_or_null(local_free_list(loc_l),
371					struct bpf_lru_node,
372					list);
373	if (node)
374		list_del(&node->list);
375
376	return node;
377}
378
379static struct bpf_lru_node *
380__local_list_pop_pending(struct bpf_lru *lru, struct bpf_lru_locallist *loc_l)
381{
382	struct bpf_lru_node *node;
383	bool force = false;
384
385ignore_ref:
386	/* Get from the tail (i.e. older element) of the pending list. */
387	list_for_each_entry_reverse(node, local_pending_list(loc_l),
388				    list) {
389		if ((!bpf_lru_node_is_ref(node) || force) &&
390		    lru->del_from_htab(lru->del_arg, node)) {
391			list_del(&node->list);
392			return node;
393		}
394	}
395
396	if (!force) {
397		force = true;
398		goto ignore_ref;
399	}
400
401	return NULL;
402}
403
404static struct bpf_lru_node *bpf_percpu_lru_pop_free(struct bpf_lru *lru,
405						    u32 hash)
406{
407	struct list_head *free_list;
408	struct bpf_lru_node *node = NULL;
409	struct bpf_lru_list *l;
410	unsigned long flags;
411	int cpu = raw_smp_processor_id();
412
413	l = per_cpu_ptr(lru->percpu_lru, cpu);
414
415	raw_spin_lock_irqsave(&l->lock, flags);
416
417	__bpf_lru_list_rotate(lru, l);
418
419	free_list = &l->lists[BPF_LRU_LIST_T_FREE];
420	if (list_empty(free_list))
421		__bpf_lru_list_shrink(lru, l, PERCPU_FREE_TARGET, free_list,
422				      BPF_LRU_LIST_T_FREE);
423
424	if (!list_empty(free_list)) {
425		node = list_first_entry(free_list, struct bpf_lru_node, list);
426		*(u32 *)((void *)node + lru->hash_offset) = hash;
427		bpf_lru_node_clear_ref(node);
428		__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_INACTIVE);
429	}
430
431	raw_spin_unlock_irqrestore(&l->lock, flags);
432
433	return node;
434}
435
436static struct bpf_lru_node *bpf_common_lru_pop_free(struct bpf_lru *lru,
437						    u32 hash)
438{
439	struct bpf_lru_locallist *loc_l, *steal_loc_l;
440	struct bpf_common_lru *clru = &lru->common_lru;
441	struct bpf_lru_node *node;
442	int steal, first_steal;
443	unsigned long flags;
444	int cpu = raw_smp_processor_id();
445
446	loc_l = per_cpu_ptr(clru->local_list, cpu);
447
448	raw_spin_lock_irqsave(&loc_l->lock, flags);
449
450	node = __local_list_pop_free(loc_l);
451	if (!node) {
452		bpf_lru_list_pop_free_to_local(lru, loc_l);
453		node = __local_list_pop_free(loc_l);
454	}
455
456	if (node)
457		__local_list_add_pending(lru, loc_l, cpu, node, hash);
458
459	raw_spin_unlock_irqrestore(&loc_l->lock, flags);
460
461	if (node)
462		return node;
463
464	/* No free nodes found from the local free list and
465	 * the global LRU list.
466	 *
467	 * Steal from the local free/pending list of the
468	 * current CPU and remote CPU in RR.  It starts
469	 * with the loc_l->next_steal CPU.
470	 */
471
472	first_steal = loc_l->next_steal;
473	steal = first_steal;
474	do {
475		steal_loc_l = per_cpu_ptr(clru->local_list, steal);
476
477		raw_spin_lock_irqsave(&steal_loc_l->lock, flags);
478
479		node = __local_list_pop_free(steal_loc_l);
480		if (!node)
481			node = __local_list_pop_pending(lru, steal_loc_l);
482
483		raw_spin_unlock_irqrestore(&steal_loc_l->lock, flags);
484
485		steal = get_next_cpu(steal);
486	} while (!node && steal != first_steal);
487
488	loc_l->next_steal = steal;
489
490	if (node) {
491		raw_spin_lock_irqsave(&loc_l->lock, flags);
492		__local_list_add_pending(lru, loc_l, cpu, node, hash);
493		raw_spin_unlock_irqrestore(&loc_l->lock, flags);
494	}
495
496	return node;
497}
498
499struct bpf_lru_node *bpf_lru_pop_free(struct bpf_lru *lru, u32 hash)
500{
501	if (lru->percpu)
502		return bpf_percpu_lru_pop_free(lru, hash);
503	else
504		return bpf_common_lru_pop_free(lru, hash);
505}
506
507static void bpf_common_lru_push_free(struct bpf_lru *lru,
508				     struct bpf_lru_node *node)
509{
510	u8 node_type = READ_ONCE(node->type);
511	unsigned long flags;
512
513	if (WARN_ON_ONCE(node_type == BPF_LRU_LIST_T_FREE) ||
514	    WARN_ON_ONCE(node_type == BPF_LRU_LOCAL_LIST_T_FREE))
515		return;
516
517	if (node_type == BPF_LRU_LOCAL_LIST_T_PENDING) {
518		struct bpf_lru_locallist *loc_l;
519
520		loc_l = per_cpu_ptr(lru->common_lru.local_list, node->cpu);
521
522		raw_spin_lock_irqsave(&loc_l->lock, flags);
523
524		if (unlikely(node->type != BPF_LRU_LOCAL_LIST_T_PENDING)) {
525			raw_spin_unlock_irqrestore(&loc_l->lock, flags);
526			goto check_lru_list;
527		}
528
529		node->type = BPF_LRU_LOCAL_LIST_T_FREE;
530		bpf_lru_node_clear_ref(node);
531		list_move(&node->list, local_free_list(loc_l));
532
533		raw_spin_unlock_irqrestore(&loc_l->lock, flags);
534		return;
535	}
536
537check_lru_list:
538	bpf_lru_list_push_free(&lru->common_lru.lru_list, node);
539}
540
541static void bpf_percpu_lru_push_free(struct bpf_lru *lru,
542				     struct bpf_lru_node *node)
543{
544	struct bpf_lru_list *l;
545	unsigned long flags;
546
547	l = per_cpu_ptr(lru->percpu_lru, node->cpu);
548
549	raw_spin_lock_irqsave(&l->lock, flags);
550
551	__bpf_lru_node_move(l, node, BPF_LRU_LIST_T_FREE);
552
553	raw_spin_unlock_irqrestore(&l->lock, flags);
554}
555
556void bpf_lru_push_free(struct bpf_lru *lru, struct bpf_lru_node *node)
557{
558	if (lru->percpu)
559		bpf_percpu_lru_push_free(lru, node);
560	else
561		bpf_common_lru_push_free(lru, node);
562}
563
564static void bpf_common_lru_populate(struct bpf_lru *lru, void *buf,
565				    u32 node_offset, u32 elem_size,
566				    u32 nr_elems)
567{
568	struct bpf_lru_list *l = &lru->common_lru.lru_list;
569	u32 i;
570
571	for (i = 0; i < nr_elems; i++) {
572		struct bpf_lru_node *node;
573
574		node = (struct bpf_lru_node *)(buf + node_offset);
575		node->type = BPF_LRU_LIST_T_FREE;
576		bpf_lru_node_clear_ref(node);
577		list_add(&node->list, &l->lists[BPF_LRU_LIST_T_FREE]);
578		buf += elem_size;
579	}
580}
581
582static void bpf_percpu_lru_populate(struct bpf_lru *lru, void *buf,
583				    u32 node_offset, u32 elem_size,
584				    u32 nr_elems)
585{
586	u32 i, pcpu_entries;
587	int cpu;
588	struct bpf_lru_list *l;
589
590	pcpu_entries = nr_elems / num_possible_cpus();
591
592	i = 0;
593
594	for_each_possible_cpu(cpu) {
595		struct bpf_lru_node *node;
596
597		l = per_cpu_ptr(lru->percpu_lru, cpu);
598again:
599		node = (struct bpf_lru_node *)(buf + node_offset);
600		node->cpu = cpu;
601		node->type = BPF_LRU_LIST_T_FREE;
602		bpf_lru_node_clear_ref(node);
603		list_add(&node->list, &l->lists[BPF_LRU_LIST_T_FREE]);
604		i++;
605		buf += elem_size;
606		if (i == nr_elems)
607			break;
608		if (i % pcpu_entries)
609			goto again;
610	}
611}
612
613void bpf_lru_populate(struct bpf_lru *lru, void *buf, u32 node_offset,
614		      u32 elem_size, u32 nr_elems)
615{
616	if (lru->percpu)
617		bpf_percpu_lru_populate(lru, buf, node_offset, elem_size,
618					nr_elems);
619	else
620		bpf_common_lru_populate(lru, buf, node_offset, elem_size,
621					nr_elems);
622}
623
624static void bpf_lru_locallist_init(struct bpf_lru_locallist *loc_l, int cpu)
625{
626	int i;
627
628	for (i = 0; i < NR_BPF_LRU_LOCAL_LIST_T; i++)
629		INIT_LIST_HEAD(&loc_l->lists[i]);
630
631	loc_l->next_steal = cpu;
632
633	raw_spin_lock_init(&loc_l->lock);
634}
635
636static void bpf_lru_list_init(struct bpf_lru_list *l)
637{
638	int i;
639
640	for (i = 0; i < NR_BPF_LRU_LIST_T; i++)
641		INIT_LIST_HEAD(&l->lists[i]);
642
643	for (i = 0; i < NR_BPF_LRU_LIST_COUNT; i++)
644		l->counts[i] = 0;
645
646	l->next_inactive_rotation = &l->lists[BPF_LRU_LIST_T_INACTIVE];
647
648	raw_spin_lock_init(&l->lock);
649}
650
651int bpf_lru_init(struct bpf_lru *lru, bool percpu, u32 hash_offset,
652		 del_from_htab_func del_from_htab, void *del_arg)
653{
654	int cpu;
655
656	if (percpu) {
657		lru->percpu_lru = alloc_percpu(struct bpf_lru_list);
658		if (!lru->percpu_lru)
659			return -ENOMEM;
660
661		for_each_possible_cpu(cpu) {
662			struct bpf_lru_list *l;
663
664			l = per_cpu_ptr(lru->percpu_lru, cpu);
665			bpf_lru_list_init(l);
666		}
667		lru->nr_scans = PERCPU_NR_SCANS;
668	} else {
669		struct bpf_common_lru *clru = &lru->common_lru;
670
671		clru->local_list = alloc_percpu(struct bpf_lru_locallist);
672		if (!clru->local_list)
673			return -ENOMEM;
674
675		for_each_possible_cpu(cpu) {
676			struct bpf_lru_locallist *loc_l;
677
678			loc_l = per_cpu_ptr(clru->local_list, cpu);
679			bpf_lru_locallist_init(loc_l, cpu);
680		}
681
682		bpf_lru_list_init(&clru->lru_list);
683		lru->nr_scans = LOCAL_NR_SCANS;
684	}
685
686	lru->percpu = percpu;
687	lru->del_from_htab = del_from_htab;
688	lru->del_arg = del_arg;
689	lru->hash_offset = hash_offset;
690
691	return 0;
692}
693
694void bpf_lru_destroy(struct bpf_lru *lru)
695{
696	if (lru->percpu)
697		free_percpu(lru->percpu_lru);
698	else
699		free_percpu(lru->common_lru.local_list);
700}