1 // SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
3 * Copyright 2015-2021 Amazon.com, Inc. or its affiliates. All rights reserved.
/* Check the TX buffer entry selected by req_id for an attached XDP frame.
 *
 * Looks up tx_ring->tx_buffer_info[req_id] and tests its xdpf pointer.
 * The last visible statement hands the id to handle_invalid_req_id() and
 * returns that function's result.
 * NOTE(review): the statement executed when xdpf is set is not visible in
 * this excerpt - presumably a success return; confirm against the full file.
 */
8 static int validate_xdp_req_id(struct ena_ring *tx_ring, u16 req_id)
10 struct ena_tx_buffer *tx_info;
12 tx_info = &tx_ring->tx_buffer_info[req_id];
13 if (likely(tx_info->xdpf))
16 return handle_invalid_req_id(tx_ring, req_id, tx_info, true);
/* Prepare the TX context for sending one XDP frame.
 *
 * Fills ena_tx_ctx from the frame attached to tx_info: an optional pushed
 * header when the ring's tx_mem_queue_type is
 * ENA_ADMIN_PLACEMENT_POLICY_DEV, and a single DMA-mapped buffer described
 * by tx_info->bufs.
 * On DMA mapping failure the dma_mapping_err statistic is incremented and a
 * warning is logged.
 * NOTE(review): data and length are read through tx_info->xdpf, not the
 * xdpf parameter; the assignment that links the two is not visible in this
 * excerpt - confirm it happens before these reads.
 */
19 static int ena_xdp_tx_map_frame(struct ena_ring *tx_ring,
20 struct ena_tx_buffer *tx_info,
21 struct xdp_frame *xdpf,
22 struct ena_com_tx_ctx *ena_tx_ctx)
24 struct ena_adapter *adapter = tx_ring->adapter;
25 struct ena_com_buf *ena_buf;
32 data = tx_info->xdpf->data;
33 size = tx_info->xdpf->len;
35 if (tx_ring->tx_mem_queue_type == ENA_ADMIN_PLACEMENT_POLICY_DEV) {
36 /* Designate part of the packet for LLQ */
/* The pushed part is capped at the ring's maximum header size */
37 push_len = min_t(u32, size, tx_ring->tx_max_header_size);
39 ena_tx_ctx->push_header = data;
45 ena_tx_ctx->header_len = push_len;
48 dma = dma_map_single(tx_ring->dev,
52 if (unlikely(dma_mapping_error(tx_ring->dev, dma)))
53 goto error_report_dma_error;
55 tx_info->map_linear_data = 0;
57 ena_buf = tx_info->bufs;
/* Exactly one buffer descriptor is handed to the device for the frame */
61 ena_tx_ctx->ena_bufs = ena_buf;
62 ena_tx_ctx->num_bufs = tx_info->num_of_bufs = 1;
67 error_report_dma_error:
68 ena_increase_stat(&tx_ring->tx_stats.dma_mapping_err, 1,
70 netif_warn(adapter, tx_queued, adapter->netdev, "Failed to map xdp buff\n");
/* Queue a single XDP frame on tx_ring.
 *
 * Takes the request id stored at free_ids[next_to_use], maps the frame via
 * ena_xdp_tx_map_frame(), submits it with ena_xmit_common() and rings the
 * TX doorbell when XDP_XMIT_FLUSH is set in flags.
 * The error path visible at the end unmaps the TX buffer and clears
 * tx_info->xdpf.
 * NOTE(review): the flags parameter declaration, the rc checks and the
 * return statements are not visible in this excerpt.
 */
75 int ena_xdp_xmit_frame(struct ena_ring *tx_ring,
76 struct ena_adapter *adapter,
77 struct xdp_frame *xdpf,
80 struct ena_com_tx_ctx ena_tx_ctx = {};
81 struct ena_tx_buffer *tx_info;
82 u16 next_to_use, req_id;
85 next_to_use = tx_ring->next_to_use;
86 req_id = tx_ring->free_ids[next_to_use];
87 tx_info = &tx_ring->tx_buffer_info[req_id];
/* Reset the buffer count before mapping; the map helper sets it to 1 */
88 tx_info->num_of_bufs = 0;
90 rc = ena_xdp_tx_map_frame(tx_ring, tx_info, xdpf, &ena_tx_ctx);
94 ena_tx_ctx.req_id = req_id;
96 rc = ena_xmit_common(adapter,
103 goto error_unmap_dma;
105 /* trigger the dma engine. ena_ring_tx_doorbell()
106 * calls a memory barrier inside it.
108 if (flags & XDP_XMIT_FLUSH)
109 ena_ring_tx_doorbell(tx_ring);
114 ena_unmap_tx_buff(tx_ring, tx_info);
115 tx_info->xdpf = NULL;
/* Transmit a batch of n XDP frames on one of the device's XDP TX rings.
 *
 * The ring is chosen from the current CPU id, modulo the number of XDP
 * queues, offset by xdp_first_ring. The batch is sent under the ring's
 * xdp_tx_lock. Bails out early when flags contains bits outside
 * XDP_XMIT_FLAGS_MASK, when ENA_FLAG_DEV_UP is not set, or when the first
 * RX ring has no XDP program.
 * NOTE(review): the return statements and the loop body after a failed
 * ena_xdp_xmit_frame() call are not visible in this excerpt.
 */
119 int ena_xdp_xmit(struct net_device *dev, int n,
120 struct xdp_frame **frames, u32 flags)
122 struct ena_adapter *adapter = netdev_priv(dev);
123 struct ena_ring *tx_ring;
124 int qid, i, nxmit = 0;
126 if (unlikely(flags & ~XDP_XMIT_FLAGS_MASK))
129 if (!test_bit(ENA_FLAG_DEV_UP, &adapter->flags))
132 /* We assume that all rings have the same XDP program */
133 if (!READ_ONCE(adapter->rx_ring->xdp_bpf_prog))
136 qid = smp_processor_id() % adapter->xdp_num_queues;
137 qid += adapter->xdp_first_ring;
138 tx_ring = &adapter->tx_ring[qid];
140 /* Other CPU ids might try to send through this queue */
141 spin_lock(&tx_ring->xdp_tx_lock);
/* Per-frame flags are 0: the doorbell is rung once after the loop */
143 for (i = 0; i < n; i++) {
144 if (ena_xdp_xmit_frame(tx_ring, adapter, frames[i], 0))
149 /* Ring doorbell to make device aware of the packets */
150 if (flags & XDP_XMIT_FLUSH)
151 ena_ring_tx_doorbell(tx_ring);
153 spin_unlock(&tx_ring->xdp_tx_lock);
155 /* Return number of packets sent */
/* Record the XDP ring range in the adapter and initialise those rings.
 *
 * The XDP rings start at index num_io_queues and there are num_io_queues of
 * them; that range is passed to ena_init_io_rings().
 */
159 static void ena_init_all_xdp_queues(struct ena_adapter *adapter)
161 adapter->xdp_first_ring = adapter->num_io_queues;
162 adapter->xdp_num_queues = adapter->num_io_queues;
164 ena_init_io_rings(adapter,
165 adapter->xdp_first_ring,
166 adapter->xdp_num_queues);
/* Set up TX resources and create the IO TX queues for the XDP ring range.
 *
 * The range is [xdp_first_ring, xdp_first_ring + xdp_num_queues) as stored
 * in the adapter. ena_free_all_io_tx_resources_in_range() is called on the
 * same range.
 * NOTE(review): the rc checks and labels are not visible in this excerpt -
 * presumably the free call is the unwind path for a failed queue creation;
 * confirm against the full file.
 */
169 int ena_setup_and_create_all_xdp_queues(struct ena_adapter *adapter)
171 u32 xdp_first_ring = adapter->xdp_first_ring;
172 u32 xdp_num_queues = adapter->xdp_num_queues;
175 rc = ena_setup_tx_resources_in_range(adapter, xdp_first_ring, xdp_num_queues);
179 rc = ena_create_io_tx_queues_in_range(adapter, xdp_first_ring, xdp_num_queues);
186 ena_free_all_io_tx_resources_in_range(adapter, xdp_first_ring, xdp_num_queues);
/* Register rx_ring->xdp_rxq with the XDP core in two steps:
 * xdp_rxq_info_reg() for the queue itself, then
 * xdp_rxq_info_reg_mem_model() with MEM_TYPE_PAGE_SHARED. Failures of
 * either step are logged with netif_err(), and xdp_rxq_info_unreg() is
 * called on the memory-model failure path.
 * NOTE(review): the rc checks and the return statement are not visible in
 * this excerpt. The debug message "Registering RX info for queue %d" has
 * no trailing newline.
 */
191 /* Provides a way for both kernel and bpf-prog to know
192 * more about the RX-queue a given XDP frame arrived on.
194 int ena_xdp_register_rxq_info(struct ena_ring *rx_ring)
198 rc = xdp_rxq_info_reg(&rx_ring->xdp_rxq, rx_ring->netdev, rx_ring->qid, 0);
200 netif_dbg(rx_ring->adapter, ifup, rx_ring->netdev, "Registering RX info for queue %d",
203 netif_err(rx_ring->adapter, ifup, rx_ring->netdev,
204 "Failed to register xdp rx queue info. RX queue num %d rc: %d\n",
209 rc = xdp_rxq_info_reg_mem_model(&rx_ring->xdp_rxq, MEM_TYPE_PAGE_SHARED, NULL);
212 netif_err(rx_ring->adapter, ifup, rx_ring->netdev,
213 "Failed to register xdp rx queue info memory model. RX queue num %d rc: %d\n",
215 xdp_rxq_info_unreg(&rx_ring->xdp_rxq);
/* Undo ena_xdp_register_rxq_info() for rx_ring: the memory model is
 * unregistered first, then the rxq info itself (reverse of registration
 * order).
 * NOTE(review): the debug message has no trailing newline.
 */
222 void ena_xdp_unregister_rxq_info(struct ena_ring *rx_ring)
224 netif_dbg(rx_ring->adapter, ifdown, rx_ring->netdev,
225 "Unregistering RX info for queue %d",
227 xdp_rxq_info_unreg_mem_model(&rx_ring->xdp_rxq);
228 xdp_rxq_info_unreg(&rx_ring->xdp_rxq);
/* Install prog on a range of RX rings and adjust their headroom.
 *
 * Each ring's xdp_bpf_prog is swapped with xchg(). When a ring goes from no
 * program to a program its rx_headroom becomes XDP_PACKET_HEADROOM; when it
 * goes from a program to none it becomes NET_SKB_PAD. Otherwise the
 * headroom is left unchanged.
 *
 * NOTE(review): the loop runs for first <= i < count, so count acts as an
 * exclusive end index rather than a number of rings. Callers outside this
 * excerpt may rely on that - verify before changing it.
 */
231 void ena_xdp_exchange_program_rx_in_range(struct ena_adapter *adapter,
232 struct bpf_prog *prog,
233 int first, int count)
235 struct bpf_prog *old_bpf_prog;
236 struct ena_ring *rx_ring;
239 for (i = first; i < count; i++) {
240 rx_ring = &adapter->rx_ring[i];
241 old_bpf_prog = xchg(&rx_ring->xdp_bpf_prog, prog);
243 if (!old_bpf_prog && prog) {
244 rx_ring->rx_headroom = XDP_PACKET_HEADROOM;
245 } else if (old_bpf_prog && !prog) {
246 rx_ring->rx_headroom = NET_SKB_PAD;
/* Replace the adapter-wide XDP program with prog.
 *
 * Swaps adapter->xdp_bpf_prog with xchg(), propagates prog to the RX rings
 * through ena_xdp_exchange_program_rx_in_range(), and drops a reference on
 * the previous program with bpf_prog_put().
 * NOTE(review): any guard around bpf_prog_put() and the remaining range
 * arguments are not visible in this excerpt.
 */
251 static void ena_xdp_exchange_program(struct ena_adapter *adapter,
252 struct bpf_prog *prog)
254 struct bpf_prog *old_bpf_prog = xchg(&adapter->xdp_bpf_prog, prog);
256 ena_xdp_exchange_program_rx_in_range(adapter,
259 adapter->num_io_queues);
262 bpf_prog_put(old_bpf_prog);
/* Tear down XDP state on the adapter.
 *
 * Samples ENA_FLAG_DEV_UP into was_up, resets the XDP ring range to empty
 * (xdp_first_ring and xdp_num_queues both 0), removes the XDP program by
 * exchanging it with NULL, and calls ena_up().
 * NOTE(review): the statements between the was_up read and the range reset,
 * and the condition guarding ena_up(), are not visible in this excerpt -
 * presumably the device is brought down first and only brought back up if
 * it was up before; confirm against the full file.
 */
265 static int ena_destroy_and_free_all_xdp_queues(struct ena_adapter *adapter)
270 was_up = test_bit(ENA_FLAG_DEV_UP, &adapter->flags);
275 adapter->xdp_first_ring = 0;
276 adapter->xdp_num_queues = 0;
277 ena_xdp_exchange_program(adapter, NULL);
279 rc = ena_up(adapter);
/* Attach or detach an XDP program (bpf->prog) on netdev.
 *
 * The result of ena_xdp_allowed() selects the path:
 *  - ENA_XDP_ALLOWED: the XDP queues are initialised and the program is
 *    exchanged; when a previous program existed and none is being set, the
 *    redirect-target feature is cleared and the XDP queues are destroyed.
 *    netdev->max_mtu is then set to ENA_XDP_MAX_MTU when a program is
 *    present and to adapter->max_mtu otherwise.
 *  - ENA_XDP_CURRENT_MTU_TOO_LARGE / ENA_XDP_NO_ENOUGH_QUEUES: the failure
 *    is logged and reported through bpf->extack.
 * NOTE(review): several conditions, the declarations of rc/is_up/prev_mtu
 * and all return statements are not visible in this excerpt. The messages
 * "XDP program is set, ..." and "... while xdp is on" have no trailing
 * newline.
 */
286 static int ena_xdp_set(struct net_device *netdev, struct netdev_bpf *bpf)
288 struct ena_adapter *adapter = netdev_priv(netdev);
289 struct bpf_prog *prog = bpf->prog;
290 struct bpf_prog *old_bpf_prog;
294 is_up = test_bit(ENA_FLAG_DEV_UP, &adapter->flags);
295 rc = ena_xdp_allowed(adapter);
296 if (rc == ENA_XDP_ALLOWED) {
/* Remember the current program before it is exchanged below */
297 old_bpf_prog = adapter->xdp_bpf_prog;
300 ena_init_all_xdp_queues(adapter);
301 } else if (!old_bpf_prog) {
303 ena_init_all_xdp_queues(adapter);
305 ena_xdp_exchange_program(adapter, prog);
307 netif_dbg(adapter, drv, adapter->netdev, "Set a new XDP program\n");
/* Device was up and had no program before: bring it up again */
309 if (is_up && !old_bpf_prog) {
310 rc = ena_up(adapter);
314 xdp_features_set_redirect_target(netdev, false);
315 } else if (old_bpf_prog) {
316 xdp_features_clear_redirect_target(netdev);
317 netif_dbg(adapter, drv, adapter->netdev, "Removing XDP program\n");
319 rc = ena_destroy_and_free_all_xdp_queues(adapter);
/* max_mtu depends on whether an XDP program is now attached */
324 prev_mtu = netdev->max_mtu;
325 netdev->max_mtu = prog ? ENA_XDP_MAX_MTU : adapter->max_mtu;
328 netif_info(adapter, drv, adapter->netdev,
329 "XDP program is set, changing the max_mtu from %d to %d",
330 prev_mtu, netdev->max_mtu);
332 } else if (rc == ENA_XDP_CURRENT_MTU_TOO_LARGE) {
333 netif_err(adapter, drv, adapter->netdev,
334 "Failed to set xdp program, the current MTU (%d) is larger than the maximum allowed MTU (%lu) while xdp is on",
335 netdev->mtu, ENA_XDP_MAX_MTU);
336 NL_SET_ERR_MSG_MOD(bpf->extack,
337 "Failed to set xdp program, the current MTU is larger than the maximum allowed MTU. Check the dmesg for more info");
339 } else if (rc == ENA_XDP_NO_ENOUGH_QUEUES) {
340 netif_err(adapter, drv, adapter->netdev,
341 "Failed to set xdp program, the Rx/Tx channel count should be at most half of the maximum allowed channel count. The current queue count (%d), the maximal queue count (%d)\n",
342 adapter->num_io_queues, adapter->max_num_io_queues);
343 NL_SET_ERR_MSG_MOD(bpf->extack,
344 "Failed to set xdp program, there is no enough space for allocating XDP queues, Check the dmesg for more info");
/* Dispatches on bpf->command; the one visible case forwards to
 * ena_xdp_set() and returns its result.
 * NOTE(review): the case labels and any default branch are not visible in
 * this excerpt.
 */
351 /* This is the main xdp callback, it's used by the kernel to set/unset the xdp
352 * program as well as to query the current xdp program id.
354 int ena_xdp(struct net_device *netdev, struct netdev_bpf *bpf)
356 switch (bpf->command) {
358 return ena_xdp_set(netdev, bpf);
/* Reclaim completed XDP TX descriptors on tx_ring, up to budget packets.
 *
 * For each completed request id fetched from the completion queue the
 * matching TX buffer is validated, unmapped, its xdp_frame returned with
 * xdp_return_frame(), and the id placed back into free_ids[]. After the
 * loop next_to_clean is stored and the accumulated descriptor count is
 * acknowledged with ena_com_comp_ack().
 * NOTE(review): the local declarations, the loop exits after the rc checks,
 * the tx_pkts increment and the return statement are not visible in this
 * excerpt.
 */
365 static int ena_clean_xdp_irq(struct ena_ring *tx_ring, u32 budget)
373 if (unlikely(!tx_ring))
375 next_to_clean = tx_ring->next_to_clean;
377 while (tx_pkts < budget) {
378 struct ena_tx_buffer *tx_info;
379 struct xdp_frame *xdpf;
381 rc = ena_com_tx_comp_req_id_get(tx_ring->ena_com_io_cq,
/* -EINVAL is reported as an invalid request id with no tx_info */
384 if (unlikely(rc == -EINVAL))
385 handle_invalid_req_id(tx_ring, req_id, NULL, true);
389 /* validate that the request id points to a valid xdp_frame */
390 rc = validate_xdp_req_id(tx_ring, req_id);
394 tx_info = &tx_ring->tx_buffer_info[req_id];
396 tx_info->last_jiffies = 0;
/* Detach the frame from the buffer entry before unmapping and returning it */
398 xdpf = tx_info->xdpf;
399 tx_info->xdpf = NULL;
400 ena_unmap_tx_buff(tx_ring, tx_info);
401 xdp_return_frame(xdpf);
404 total_done += tx_info->tx_descs;
/* Recycle the request id into the free list at the cleaned slot */
405 tx_ring->free_ids[next_to_clean] = req_id;
406 next_to_clean = ENA_TX_RING_IDX_NEXT(next_to_clean,
409 netif_dbg(tx_ring->adapter, tx_done, tx_ring->netdev,
410 "tx_poll: q %d pkt #%d req_id %d\n", tx_ring->qid, tx_pkts, req_id);
413 tx_ring->next_to_clean = next_to_clean;
414 ena_com_comp_ack(tx_ring->ena_com_io_sq, total_done);
416 netif_dbg(tx_ring->adapter, tx_done, tx_ring->netdev,
417 "tx_poll: q %d done. total pkts: %d\n",
418 tx_ring->qid, tx_pkts);
/* Poll handler for XDP TX rings.
 *
 * Completes NAPI with 0 work straight away when ENA_FLAG_DEV_UP is clear or
 * ENA_FLAG_TRIGGER_RESET is set. Otherwise it cleans completed TX
 * descriptors through ena_clean_xdp_irq() with the given budget. If the
 * device went down meanwhile, NAPI is completed with 0 work. If less than
 * the full budget was used, the napi_comp statistic is incremented and the
 * interrupt is unmasked when napi_complete_done() returns true.
 * ena_update_ring_numa_node() is also called on the ring. The tx_poll
 * counter is updated inside the syncp update section and last_napi_jiffies
 * is refreshed.
 * NOTE(review): the return statements and the branch taken when the whole
 * budget was consumed are not visible in this excerpt.
 */
423 /* This is the XDP napi callback. XDP queues use a separate napi callback
426 int ena_xdp_io_poll(struct napi_struct *napi, int budget)
428 struct ena_napi *ena_napi = container_of(napi, struct ena_napi, napi);
429 struct ena_ring *tx_ring;
433 tx_ring = ena_napi->tx_ring;
435 if (!test_bit(ENA_FLAG_DEV_UP, &tx_ring->adapter->flags) ||
436 test_bit(ENA_FLAG_TRIGGER_RESET, &tx_ring->adapter->flags)) {
437 napi_complete_done(napi, 0);
441 work_done = ena_clean_xdp_irq(tx_ring, budget);
443 /* If the device is about to reset or down, avoid unmask
444 * the interrupt and return 0 so NAPI won't reschedule
446 if (unlikely(!test_bit(ENA_FLAG_DEV_UP, &tx_ring->adapter->flags))) {
447 napi_complete_done(napi, 0);
449 } else if (budget > work_done) {
450 ena_increase_stat(&tx_ring->tx_stats.napi_comp, 1,
452 if (napi_complete_done(napi, work_done))
453 ena_unmask_interrupt(tx_ring, NULL);
455 ena_update_ring_numa_node(tx_ring, NULL);
461 u64_stats_update_begin(&tx_ring->syncp);
462 tx_ring->tx_stats.tx_poll++;
463 u64_stats_update_end(&tx_ring->syncp);
464 tx_ring->tx_stats.last_napi_jiffies = jiffies;