3fc2333933
Add support for XSK zero-copy to RX path. The setup of the XSK pool can be done at runtime. If the netdev is running, then the queue must be disabled and enabled during reconfiguration. This can be done easily with functions introduced in previous commits. A more important property is that, if the netdev is running, then the setup of the XSK pool shall not stop the netdev in case of errors. A broken netdev after a failed XSK pool setup is bad behavior. Therefore, the allocation and setup of resources during XSK pool setup is done only before any queue is disabled. Additionally, freeing and later allocation of resources is eliminated in some cases. Page pool entries are kept for later use. Two memory models are registered in parallel. As a result, the XSK pool setup cannot fail during queue reconfiguration. In contrast to other drivers, XSK pool setup and XDP BPF program setup are separate actions. XSK pool setup can be done without any XDP BPF program. The XDP BPF program can be added, removed or changed without any reconfiguration of the XSK pool. Test results with A53 1.2GHz: xdpsock rxdrop copy mode, 64 byte frames: pps pkts 1.00 rx 856,054 10,625,775 Two CPUs with both 100% utilization. xdpsock rxdrop zero-copy mode, 64 byte frames: pps pkts 1.00 rx 889,388 4,615,284 Two CPUs with 100% and 20% utilization. Packet rate increases and CPU utilization is reduced. 100% CPU load seems to the base load. This load is consumed by ksoftirqd just for dropping the generated packets without xdpsock running. Using batch API reduced CPU utilization slightly, but measurements are not stable enough to provide meaningful numbers. Signed-off-by: Gerhard Engleder <gerhard@engleder-embedded.com> Reviewed-by: Maciej Fijalkowski <maciej.fijalkowski@intel.com> Signed-off-by: Jakub Kicinski <kuba@kernel.org>
86 lines
1.9 KiB
C
86 lines
1.9 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/* Copyright (C) 2022 Gerhard Engleder <gerhard@engleder-embedded.com> */
|
|
|
|
#include <linux/if_vlan.h>
|
|
#include <net/xdp_sock_drv.h>
|
|
|
|
#include "tsnep.h"
|
|
|
|
int tsnep_xdp_setup_prog(struct tsnep_adapter *adapter, struct bpf_prog *prog,
|
|
struct netlink_ext_ack *extack)
|
|
{
|
|
struct bpf_prog *old_prog;
|
|
|
|
old_prog = xchg(&adapter->xdp_prog, prog);
|
|
if (old_prog)
|
|
bpf_prog_put(old_prog);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int tsnep_xdp_enable_pool(struct tsnep_adapter *adapter,
|
|
struct xsk_buff_pool *pool, u16 queue_id)
|
|
{
|
|
struct tsnep_queue *queue;
|
|
int retval;
|
|
|
|
if (queue_id >= adapter->num_rx_queues ||
|
|
queue_id >= adapter->num_tx_queues)
|
|
return -EINVAL;
|
|
|
|
queue = &adapter->queue[queue_id];
|
|
if (queue->rx->queue_index != queue_id ||
|
|
queue->tx->queue_index != queue_id) {
|
|
netdev_err(adapter->netdev,
|
|
"XSK support only for TX/RX queue pairs\n");
|
|
|
|
return -EOPNOTSUPP;
|
|
}
|
|
|
|
retval = xsk_pool_dma_map(pool, adapter->dmadev,
|
|
DMA_ATTR_SKIP_CPU_SYNC);
|
|
if (retval) {
|
|
netdev_err(adapter->netdev, "failed to map XSK pool\n");
|
|
|
|
return retval;
|
|
}
|
|
|
|
retval = tsnep_enable_xsk(queue, pool);
|
|
if (retval) {
|
|
xsk_pool_dma_unmap(pool, DMA_ATTR_SKIP_CPU_SYNC);
|
|
|
|
return retval;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int tsnep_xdp_disable_pool(struct tsnep_adapter *adapter, u16 queue_id)
|
|
{
|
|
struct xsk_buff_pool *pool;
|
|
struct tsnep_queue *queue;
|
|
|
|
if (queue_id >= adapter->num_rx_queues ||
|
|
queue_id >= adapter->num_tx_queues)
|
|
return -EINVAL;
|
|
|
|
pool = xsk_get_pool_from_qid(adapter->netdev, queue_id);
|
|
if (!pool)
|
|
return -EINVAL;
|
|
|
|
queue = &adapter->queue[queue_id];
|
|
|
|
tsnep_disable_xsk(queue);
|
|
|
|
xsk_pool_dma_unmap(pool, DMA_ATTR_SKIP_CPU_SYNC);
|
|
|
|
return 0;
|
|
}
|
|
|
|
int tsnep_xdp_setup_pool(struct tsnep_adapter *adapter,
|
|
struct xsk_buff_pool *pool, u16 queue_id)
|
|
{
|
|
return pool ? tsnep_xdp_enable_pool(adapter, pool, queue_id) :
|
|
tsnep_xdp_disable_pool(adapter, queue_id);
|
|
}
|