3 * Copyright (c) 2017 Jesper Dangaard Brouer, Red Hat Inc.
4 * Released under terms in GPL version 2. See COPYING.
6 #include <linux/types.h>
8 #include <linux/slab.h>
10 #include <linux/rhashtable.h>
11 #include <net/page_pool.h>
/* Values kept in xdp_rxq_info->reg_state. The register/unregister/unused
 * helpers in this file compare against and assign these values.
 * REG_STATE_NEW is 0, i.e. the state of a zero-filled xdp_rxq_info.
 */
15 #define REG_STATE_NEW 0x0
16 #define REG_STATE_REGISTERED 0x1
17 #define REG_STATE_UNREGISTERED 0x2
18 #define REG_STATE_UNUSED 0x3
/* Bookkeeping for memory-model IDs.
 *
 * mem_id_pool - IDA that IDs are taken from and returned to.
 * mem_id_lock - held in this file around table setup, ID allocation and
 *               hash-table insert/remove.
 * MEM_ID_MAX  - upper bound handed to the IDA and used as the table max_size.
 * mem_id_next - where the next ID search starts (advanced after each
 *               successful allocation).
 * mem_id_init - checked before setting up the hash table.
 * mem_id_ht   - rhashtable used to find an xdp_mem_allocator by ID.
 *
 * NOTE(review): MEM_ID_MIN is used below but its definition is not visible
 * in this excerpt - confirm it is defined before this point.
 */
20 static DEFINE_IDA(mem_id_pool);
21 static DEFINE_MUTEX(mem_id_lock);
22 #define MEM_ID_MAX 0xFFFE
24 static int mem_id_next = MEM_ID_MIN;
26 static bool mem_id_init; /* false */
27 static struct rhashtable *mem_id_ht;
/* Entry stored in mem_id_ht: ties a memory-model ID (mem.id, the hash key)
 * to the allocator object registered for it; 'node' links the entry into the
 * rhashtable.
 *
 * NOTE(review): other code in this file accesses ->allocator and ->rcu, and
 * the closing brace of this struct is missing from this excerpt - the
 * definition shown here is incomplete.
 */
29 struct xdp_mem_allocator {
30 struct xdp_mem_info mem;
33 struct page_pool *page_pool;
35 struct rhash_head node;
/* Hash callback installed as .hashfn in mem_id_rht_params.
 *
 * Returns 'key' shifted left by RHT_HASH_RESERVED_SPACE; per the comment
 * below, the cyclic ID itself serves as the hash value. In the visible lines
 * neither @len nor @seed is used.
 *
 * NOTE(review): the declaration of 'key' and the remainder of the
 * BUILD_BUG_ON() expression are not visible in this excerpt; presumably
 * 'key' is the u32 that @data points to - confirm.
 */
39 static u32 xdp_mem_id_hashfn(const void *data, u32 len, u32 seed)
44 BUILD_BUG_ON(FIELD_SIZEOF(struct xdp_mem_allocator, mem.id)
47 /* Use cyclic increasing ID as direct hash key, see rht_bucket_index */
48 return key << RHT_HASH_RESERVED_SPACE;
/* Compare callback installed as .obj_cmpfn in mem_id_rht_params.
 *
 * Reads the u32 lookup key from arg->key and compares it with the entry's
 * mem.id. Returns 0 when they are equal and non-zero when they differ.
 *
 * NOTE(review): the second parameter (the 'ptr' used below) is on a line
 * that is missing from this excerpt.
 */
51 static int xdp_mem_id_cmp(struct rhashtable_compare_arg *arg,
54 const struct xdp_mem_allocator *xa = ptr;
55 u32 mem_id = *(u32 *)arg->key;
57 return xa->mem.id != mem_id;
/* rhashtable configuration for mem_id_ht: entries are struct
 * xdp_mem_allocator, linked through 'node' and keyed by 'mem.id'. The table
 * is capped at MEM_ID_MAX entries, shrinks automatically, and uses the
 * custom hash/compare callbacks defined above.
 *
 * NOTE(review): at least one initializer line and the closing brace are not
 * visible in this excerpt.
 */
60 static const struct rhashtable_params mem_id_rht_params = {
62 .head_offset = offsetof(struct xdp_mem_allocator, node),
63 .key_offset = offsetof(struct xdp_mem_allocator, mem.id),
64 .key_len = FIELD_SIZEOF(struct xdp_mem_allocator, mem.id),
65 .max_size = MEM_ID_MAX,
67 .automatic_shrinking = true,
68 .hashfn = xdp_mem_id_hashfn,
69 .obj_cmpfn = xdp_mem_id_cmp,
/* RCU callback; __xdp_rxq_info_unreg_mem_model() schedules it with
 * call_rcu() after removing the entry from mem_id_ht.
 *
 * Recovers the xdp_mem_allocator from its embedded rcu head, hands the
 * entry's ID back to mem_id_pool, and overwrites mem.type and allocator with
 * recognisable poison values (0xF0F0 / 0xDEAD9001).
 *
 * NOTE(review): the release of 'xa' itself, and the end of the "Notice"
 * comment below, are not visible in this excerpt - confirm against the full
 * file.
 */
72 static void __xdp_mem_allocator_rcu_free(struct rcu_head *rcu)
74 struct xdp_mem_allocator *xa;
76 xa = container_of(rcu, struct xdp_mem_allocator, rcu);
78 /* Allow this ID to be reused */
79 ida_simple_remove(&mem_id_pool, xa->mem.id);
81 /* Notice, driver is expected to free the *allocator,
82 * e.g. page_pool, and MUST also use RCU free.
87 xa->mem.type = 0xF0F0;
88 xa->allocator = (void *)0xDEAD9001;
/* Drop the allocator entry registered under xdp_rxq->mem.id.
 *
 * With mem_id_lock held, looks the entry up in mem_id_ht, removes it from
 * the table and schedules __xdp_mem_allocator_rcu_free() via call_rcu().
 *
 * NOTE(review): the declaration of 'err', any early return on an unset ID,
 * and the handling of the lookup/remove results are on lines missing from
 * this excerpt.
 */
93 static void __xdp_rxq_info_unreg_mem_model(struct xdp_rxq_info *xdp_rxq)
95 struct xdp_mem_allocator *xa;
96 int id = xdp_rxq->mem.id;
102 mutex_lock(&mem_id_lock);
104 xa = rhashtable_lookup(mem_id_ht, &id, mem_id_rht_params);
/* NOTE(review): this unlock looks like an early-exit path (presumably taken
 * when the lookup finds nothing); its condition is not visible here.
 */
106 mutex_unlock(&mem_id_lock);
110 err = rhashtable_remove_fast(mem_id_ht, &xa->node, mem_id_rht_params);
/* Defer the final teardown of the entry to an RCU callback. */
113 call_rcu(&xa->rcu, __xdp_mem_allocator_rcu_free);
115 mutex_unlock(&mem_id_lock);
/* Unregister @xdp_rxq.
 *
 * A queue marked REG_STATE_UNUSED is special-cased first. Otherwise the
 * function warns ("Driver BUG") if the queue is not currently registered,
 * tears down its memory-model entry, marks it REG_STATE_UNREGISTERED and
 * resets mem.type to 0.
 *
 * NOTE(review): the statement executed for the UNUSED case (presumably a
 * plain return) and any further mem resets are not visible in this excerpt.
 */
118 void xdp_rxq_info_unreg(struct xdp_rxq_info *xdp_rxq)
120 /* Simplify driver cleanup code paths, allow unreg "unused" */
121 if (xdp_rxq->reg_state == REG_STATE_UNUSED)
124 WARN(!(xdp_rxq->reg_state == REG_STATE_REGISTERED), "Driver BUG");
126 __xdp_rxq_info_unreg_mem_model(xdp_rxq);
128 xdp_rxq->reg_state = REG_STATE_UNREGISTERED;
131 /* Reset mem info to defaults */
133 xdp_rxq->mem.type = 0;
135 EXPORT_SYMBOL_GPL(xdp_rxq_info_unreg);
/* Zero-fill @xdp_rxq. Since REG_STATE_NEW is 0x0, this also leaves
 * reg_state at REG_STATE_NEW.
 */
137 static void xdp_rxq_info_init(struct xdp_rxq_info *xdp_rxq)
139 memset(xdp_rxq, 0, sizeof(*xdp_rxq));
/* Register @xdp_rxq for receive queue @queue_index.
 *
 * Visible behaviour: warns when called on a queue marked REG_STATE_UNUSED;
 * when the queue is still registered it warns and unregisters it first; then
 * the structure is zeroed, queue_index is stored and the state becomes
 * REG_STATE_REGISTERED.
 *
 * NOTE(review): the return statements, the condition guarding the
 * "Missing net_device" warning (presumably a NULL @dev check) and the store
 * of @dev are on lines missing from this excerpt.
 */
142 /* Returns 0 on success, negative on failure */
143 int xdp_rxq_info_reg(struct xdp_rxq_info *xdp_rxq,
144 struct net_device *dev, u32 queue_index)
146 if (xdp_rxq->reg_state == REG_STATE_UNUSED) {
147 WARN(1, "Driver promised not to register this");
151 if (xdp_rxq->reg_state == REG_STATE_REGISTERED) {
152 WARN(1, "Missing unregister, handled but fix driver");
153 xdp_rxq_info_unreg(xdp_rxq);
157 WARN(1, "Missing net_device from driver");
161 /* State either UNREGISTERED or NEW */
162 xdp_rxq_info_init(xdp_rxq);
164 xdp_rxq->queue_index = queue_index;
166 xdp_rxq->reg_state = REG_STATE_REGISTERED;
169 EXPORT_SYMBOL_GPL(xdp_rxq_info_reg);
/* Mark @xdp_rxq as REG_STATE_UNUSED. xdp_rxq_info_reg() warns if it is later
 * called on such a queue, and xdp_rxq_info_unreg() special-cases this state.
 */
171 void xdp_rxq_info_unused(struct xdp_rxq_info *xdp_rxq)
173 xdp_rxq->reg_state = REG_STATE_UNUSED;
175 EXPORT_SYMBOL_GPL(xdp_rxq_info_unused);
/* Returns true only when @xdp_rxq is in REG_STATE_REGISTERED. */
177 bool xdp_rxq_info_is_reg(struct xdp_rxq_info *xdp_rxq)
179 return (xdp_rxq->reg_state == REG_STATE_REGISTERED);
181 EXPORT_SYMBOL_GPL(xdp_rxq_info_is_reg);
/* One-time setup of the ID hash table; xdp_rxq_info_reg_mem_model() calls
 * this with mem_id_lock held.
 *
 * Visible steps: test mem_id_init, allocate a zeroed struct rhashtable with
 * GFP_KERNEL, initialise it with mem_id_rht_params, then issue smp_mb().
 *
 * NOTE(review): the action taken when mem_id_init is already set, the error
 * handling for kzalloc()/rhashtable_init(), and the stores that publish the
 * table (mem_id_ht / mem_id_init) are on lines missing from this excerpt.
 */
183 static int __mem_id_init_hash_table(void)
185 struct rhashtable *rht;
188 if (unlikely(mem_id_init))
191 rht = kzalloc(sizeof(*rht), GFP_KERNEL);
195 ret = rhashtable_init(rht, &mem_id_rht_params);
201 smp_mb(); /* mutex lock should provide enough pairing */
207 /* Allocate a cyclic ID that maps to allocator pointer.
208 * See: https://www.kernel.org/doc/html/latest/core-api/idr.html
210 * Caller must lock mem_id_lock.
212 static int __mem_id_cyclic_get(gfp_t gfp)
/* Ask the IDA for an ID, searching from mem_id_next and bounded by
 * MEM_ID_MAX.
 */
218 id = ida_simple_get(&mem_id_pool, mem_id_next, MEM_ID_MAX, gfp);
221 /* Cyclic allocator, reset next id */
/* NOTE(review): the condition guarding this reset (presumably the IDA
 * reporting that the range is exhausted) and any retry logic are not
 * visible in this excerpt.
 */
223 mem_id_next = MEM_ID_MIN;
227 return id; /* errno */
/* Start the next search just above the ID handed out now, so a freshly
 * released ID is not picked again right away.
 */
229 mem_id_next = id + 1;
/* Tell whether memory model @type may be registered.
 *
 * MEM_TYPE_PAGE_POOL is supported only if is_page_pool_compiled_in() says
 * so; values at or above MEM_TYPE_MAX take a separate branch.
 *
 * NOTE(review): the results returned for the MEM_TYPE_MAX branch and for the
 * fall-through case are not visible in this excerpt (presumably false and
 * true respectively) - confirm.
 */
234 static bool __is_supported_mem_type(enum xdp_mem_type type)
236 if (type == MEM_TYPE_PAGE_POOL)
237 return is_page_pool_compiled_in();
239 if (type >= MEM_TYPE_MAX)
/* Attach memory model @type, together with the @allocator pointer, to an
 * already registered @xdp_rxq.
 *
 * Visible steps: warn when the queue is not in REG_STATE_REGISTERED, check
 * @type with __is_supported_mem_type(), store @type in xdp_rxq->mem.type,
 * set up the ID hash table on first use, allocate an xdp_mem_allocator
 * entry, obtain an ID from __mem_id_cyclic_get() and insert the entry into
 * mem_id_ht.
 *
 * NOTE(review): declarations, several conditions, the return statements and
 * the error label are on lines missing from this excerpt, so the exact
 * return values cannot be confirmed from here.
 */
245 int xdp_rxq_info_reg_mem_model(struct xdp_rxq_info *xdp_rxq,
246 enum xdp_mem_type type, void *allocator)
248 struct xdp_mem_allocator *xdp_alloc;
249 gfp_t gfp = GFP_KERNEL;
253 if (xdp_rxq->reg_state != REG_STATE_REGISTERED) {
254 WARN(1, "Missing register, driver bug");
258 if (!__is_supported_mem_type(type))
/* mem.type is written before the remaining checks below.
 * NOTE(review): confirm callers cope with mem.type already being set when a
 * later step fails.
 */
261 xdp_rxq->mem.type = type;
/* NOTE(review): the condition enclosing this -EINVAL is not visible;
 * presumably it covers a missing @allocator - confirm.
 */
264 if (type == MEM_TYPE_PAGE_POOL)
265 return -EINVAL; /* Setup time check page_pool req */
269 /* Delay init of rhashtable to save memory if feature isn't used */
271 mutex_lock(&mem_id_lock);
272 ret = __mem_id_init_hash_table();
273 mutex_unlock(&mem_id_lock);
280 xdp_alloc = kzalloc(sizeof(*xdp_alloc), gfp);
/* ID allocation and table insert happen under mem_id_lock. */
284 mutex_lock(&mem_id_lock);
285 id = __mem_id_cyclic_get(gfp);
/* Store the new ID in the rxq first, so the copy placed in the table entry
 * carries it too.
 */
290 xdp_rxq->mem.id = id;
291 xdp_alloc->mem = xdp_rxq->mem;
292 xdp_alloc->allocator = allocator;
294 /* Insert allocator into ID lookup table */
295 ptr = rhashtable_insert_slow(mem_id_ht, &id, &xdp_alloc->node);
/* NOTE(review): the failure path is only partly visible. Verify that it
 * returns the ID obtained above to mem_id_pool and frees xdp_alloc;
 * otherwise both would leak when the insert fails.
 */
297 errno = PTR_ERR(ptr);
301 mutex_unlock(&mem_id_lock);
305 mutex_unlock(&mem_id_lock);
309 EXPORT_SYMBOL_GPL(xdp_rxq_info_reg_mem_model);
311 /* XDP RX runs under NAPI protection, and in different delivery error
312 * scenarios (e.g. queue full), it is possible to return the xdp_frame
313 * while still leveraging this protection. The @napi_direct boolean
314 * is used for those call sites. Thus, allowing for faster recycling
315 * of xdp_frames/pages in those cases.
317 static void __xdp_return(void *data, struct xdp_mem_info *mem, bool napi_direct)
319 struct xdp_mem_allocator *xa;
/* Page-pool memory: find the allocator registered under mem->id and hand
 * the head page of @data back to its page_pool, forwarding @napi_direct.
 */
323 case MEM_TYPE_PAGE_POOL:
325 /* mem->id is valid, checked in xdp_rxq_info_reg_mem_model() */
326 xa = rhashtable_lookup(mem_id_ht, &mem->id, mem_id_rht_params);
327 page = virt_to_head_page(data);
/* NOTE(review): 'xa' is dereferenced here. A NULL check on the lookup
 * result and an RCU read-side section around the lookup are not visible in
 * this excerpt - confirm both exist in the full file.
 */
329 page_pool_put_page(xa->page_pool, page, napi_direct);
/* Shared pages are released through page_frag_free(). */
334 case MEM_TYPE_PAGE_SHARED:
335 page_frag_free(data);
337 case MEM_TYPE_PAGE_ORDER0:
338 page = virt_to_page(data); /* Assumes order0 page*/
342 /* Not possible, checked in xdp_rxq_info_reg_mem_model() */
/* Return the memory behind @xdpf using the memory model recorded in
 * xdpf->mem. Calls __xdp_return() with napi_direct = false.
 */
347 void xdp_return_frame(struct xdp_frame *xdpf)
349 __xdp_return(xdpf->data, &xdpf->mem, false);
351 EXPORT_SYMBOL_GPL(xdp_return_frame);
/* Same as xdp_return_frame(), but calls __xdp_return() with
 * napi_direct = true.
 */
353 void xdp_return_frame_rx_napi(struct xdp_frame *xdpf)
355 __xdp_return(xdpf->data, &xdpf->mem, true);
357 EXPORT_SYMBOL_GPL(xdp_return_frame_rx_napi);
/* Return the memory behind @xdp using the memory model of its receive queue
 * (xdp->rxq->mem). Calls __xdp_return() with napi_direct = true.
 */
359 void xdp_return_buff(struct xdp_buff *xdp)
361 __xdp_return(xdp->data, &xdp->rxq->mem, true);
363 EXPORT_SYMBOL_GPL(xdp_return_buff);