cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

xdpxceiver.c (44029B)


      1// SPDX-License-Identifier: GPL-2.0
      2/* Copyright(c) 2020 Intel Corporation. */
      3
      4/*
      5 * Some functions in this program are taken from
      6 * Linux kernel samples/bpf/xdpsock* and modified
      7 * for use.
      8 *
      9 * See test_xsk.sh for detailed information on test topology
     10 * and prerequisite network setup.
     11 *
     12 * This test program contains two threads, each thread is single socket with
     13 * a unique UMEM. It validates in-order packet delivery and packet content
     14 * by sending packets to each other.
     15 *
     16 * Tests Information:
     17 * ------------------
     18 * These selftests test AF_XDP SKB and Native/DRV modes using veth
     19 * Virtual Ethernet interfaces.
     20 *
     21 * For each mode, the following tests are run:
     22 *    a. nopoll - soft-irq processing in run-to-completion mode
     23 *    b. poll - using poll() syscall
     24 *    c. Socket Teardown
     25 *       Create a Tx and a Rx socket, Tx from one socket, Rx on another. Destroy
     26 *       both sockets, then repeat multiple times. Only nopoll mode is used
     27 *    d. Bi-directional sockets
     28 *       Configure sockets as bi-directional tx/rx sockets, sets up fill and
     29 *       completion rings on each socket, tx/rx in both directions. Only nopoll
     30 *       mode is used
     31 *    e. Statistics
     32 *       Trigger some error conditions and ensure that the appropriate statistics
     33 *       are incremented. Within this test, the following statistics are tested:
     34 *       i.   rx dropped
     35 *            Increase the UMEM frame headroom to a value which results in
     36 *            insufficient space in the rx buffer for both the packet and the headroom.
     37 *       ii.  tx invalid
     38 *            Set the 'len' field of tx descriptors to an invalid value (umem frame
     39 *            size + 1).
     40 *       iii. rx ring full
     41 *            Reduce the size of the RX ring to a fraction of the fill ring size.
     42 *       iv.  fill queue empty
     43 *            Do not populate the fill queue and then try to receive pkts.
     44 *    f. bpf_link resource persistence
     45 *       Configure sockets at indexes 0 and 1, run traffic on queue id 0,
     46 *       then remove xsk sockets from queue 0 on both veth interfaces and
     47 *       finally run traffic on queue id 1
     48 *    g. unaligned mode
     49 *    h. tests for invalid and corner case Tx descriptors so that the correct ones
     50 *       are discarded and let through, respectively.
     51 *    i. 2K frame size tests
     52 *
     53 * Total tests: 12
     54 *
     55 * Flow:
     56 * -----
     57 * - Single process spawns two threads: Tx and Rx
     58 * - Each of these two threads attach to a veth interface within their assigned
     59 *   namespaces
     60 * - Each thread Creates one AF_XDP socket connected to a unique umem for each
     61 *   veth interface
     62 * - Tx thread Transmits 10k packets from veth<xxxx> to veth<yyyy>
     63 * - Rx thread verifies if all 10k packets were received and delivered in-order,
     64 *   and have the right content
     65 *
     66 * Enable/disable packet dump mode:
     67 * --------------------------
     68 * To enable L2 - L4 headers and payload dump of each packet on STDOUT, add
     69 * parameter -D to params array in test_xsk.sh, i.e. params=("-S" "-D")
     70 */
     71
     72#define _GNU_SOURCE
     73#include <fcntl.h>
     74#include <errno.h>
     75#include <getopt.h>
     76#include <asm/barrier.h>
     77#include <linux/if_link.h>
     78#include <linux/if_ether.h>
     79#include <linux/ip.h>
     80#include <linux/udp.h>
     81#include <arpa/inet.h>
     82#include <net/if.h>
     83#include <locale.h>
     84#include <poll.h>
     85#include <pthread.h>
     86#include <signal.h>
     87#include <stdbool.h>
     88#include <stdio.h>
     89#include <stdlib.h>
     90#include <string.h>
     91#include <stddef.h>
     92#include <sys/mman.h>
     93#include <sys/socket.h>
     94#include <sys/time.h>
     95#include <sys/types.h>
     96#include <sys/queue.h>
     97#include <time.h>
     98#include <unistd.h>
     99#include <stdatomic.h>
    100#include <bpf/xsk.h>
    101#include "xdpxceiver.h"
    102#include "../kselftest.h"
    103
    104/* AF_XDP APIs were moved into libxdp and marked as deprecated in libbpf.
    105 * Until xdpxceiver is either moved or rewritten into libxdp, suppress
    106 * deprecation warnings in this file
    107 */
    108#pragma GCC diagnostic ignored "-Wdeprecated-declarations"
    109
/*
 * Fixed L2/L3/L4 identities (MAC address, IPv4 address, UDP port) for two
 * endpoints. NOTE(review): presumably assigned to the Tx and Rx interface
 * objects elsewhere in this file - the assignment is not visible here.
 * The MAC strings are raw 6-byte values, not printable text.
 */
static const char *MAC1 = "\x00\x0A\x56\x9E\xEE\x62";
static const char *MAC2 = "\x00\x0A\x56\x9E\xEE\x61";
static const char *IP1 = "192.168.100.162";
static const char *IP2 = "192.168.100.161";
static const u16 UDP_PORT1 = 2020;
static const u16 UDP_PORT2 = 2121;
    116
    117static void __exit_with_error(int error, const char *file, const char *func, int line)
    118{
    119	ksft_test_result_fail("[%s:%s:%i]: ERROR: %d/\"%s\"\n", file, func, line, error,
    120			      strerror(error));
    121	ksft_exit_xfail();
    122}
    123
    124#define exit_with_error(error) __exit_with_error(error, __FILE__, __func__, __LINE__)
    125
    126#define mode_string(test) (test)->ifobj_tx->xdp_flags & XDP_FLAGS_SKB_MODE ? "SKB" : "DRV"
    127#define busy_poll_string(test) (test)->ifobj_tx->busy_poll ? "BUSY-POLL " : ""
    128
    129static void report_failure(struct test_spec *test)
    130{
    131	if (test->fail)
    132		return;
    133
    134	ksft_test_result_fail("FAIL: %s %s%s\n", mode_string(test), busy_poll_string(test),
    135			      test->name);
    136	test->fail = true;
    137}
    138
    139static void memset32_htonl(void *dest, u32 val, u32 size)
    140{
    141	u32 *ptr = (u32 *)dest;
    142	int i;
    143
    144	val = htonl(val);
    145
    146	for (i = 0; i < (size & (~0x3)); i += 4)
    147		ptr[i >> 2] = val;
    148}
    149
    150/*
    151 * Fold a partial checksum
    152 * This function code has been taken from
    153 * Linux kernel include/asm-generic/checksum.h
    154 */
    155static __u16 csum_fold(__u32 csum)
    156{
    157	u32 sum = (__force u32)csum;
    158
    159	sum = (sum & 0xffff) + (sum >> 16);
    160	sum = (sum & 0xffff) + (sum >> 16);
    161	return (__force __u16)~sum;
    162}
    163
    164/*
    165 * This function code has been taken from
    166 * Linux kernel lib/checksum.c
    167 */
    168static u32 from64to32(u64 x)
    169{
    170	/* add up 32-bit and 32-bit for 32+c bit */
    171	x = (x & 0xffffffff) + (x >> 32);
    172	/* add up carry.. */
    173	x = (x & 0xffffffff) + (x >> 32);
    174	return (u32)x;
    175}
    176
    177/*
    178 * This function code has been taken from
    179 * Linux kernel lib/checksum.c
    180 */
    181static __u32 csum_tcpudp_nofold(__be32 saddr, __be32 daddr, __u32 len, __u8 proto, __u32 sum)
    182{
    183	unsigned long long s = (__force u32)sum;
    184
    185	s += (__force u32)saddr;
    186	s += (__force u32)daddr;
    187#ifdef __BIG_ENDIAN__
    188	s += proto + len;
    189#else
    190	s += (proto + len) << 8;
    191#endif
    192	return (__force __u32)from64to32(s);
    193}
    194
    195/*
    196 * This function has been taken from
    197 * Linux kernel include/asm-generic/checksum.h
    198 */
    199static __u16 csum_tcpudp_magic(__be32 saddr, __be32 daddr, __u32 len, __u8 proto, __u32 sum)
    200{
    201	return csum_fold(csum_tcpudp_nofold(saddr, daddr, len, proto, sum));
    202}
    203
    204static u16 udp_csum(u32 saddr, u32 daddr, u32 len, u8 proto, u16 *udp_pkt)
    205{
    206	u32 csum = 0;
    207	u32 cnt = 0;
    208
    209	/* udp hdr and data */
    210	for (; cnt < len; cnt += 2)
    211		csum += udp_pkt[cnt >> 1];
    212
    213	return csum_tcpudp_magic(saddr, daddr, len, proto, csum);
    214}
    215
    216static void gen_eth_hdr(struct ifobject *ifobject, struct ethhdr *eth_hdr)
    217{
    218	memcpy(eth_hdr->h_dest, ifobject->dst_mac, ETH_ALEN);
    219	memcpy(eth_hdr->h_source, ifobject->src_mac, ETH_ALEN);
    220	eth_hdr->h_proto = htons(ETH_P_IP);
    221}
    222
    223static void gen_ip_hdr(struct ifobject *ifobject, struct iphdr *ip_hdr)
    224{
    225	ip_hdr->version = IP_PKT_VER;
    226	ip_hdr->ihl = 0x5;
    227	ip_hdr->tos = IP_PKT_TOS;
    228	ip_hdr->tot_len = htons(IP_PKT_SIZE);
    229	ip_hdr->id = 0;
    230	ip_hdr->frag_off = 0;
    231	ip_hdr->ttl = IPDEFTTL;
    232	ip_hdr->protocol = IPPROTO_UDP;
    233	ip_hdr->saddr = ifobject->src_ip;
    234	ip_hdr->daddr = ifobject->dst_ip;
    235	ip_hdr->check = 0;
    236}
    237
    238static void gen_udp_hdr(u32 payload, void *pkt, struct ifobject *ifobject,
    239			struct udphdr *udp_hdr)
    240{
    241	udp_hdr->source = htons(ifobject->src_port);
    242	udp_hdr->dest = htons(ifobject->dst_port);
    243	udp_hdr->len = htons(UDP_PKT_SIZE);
    244	memset32_htonl(pkt + PKT_HDR_SIZE, payload, UDP_PKT_DATA_SIZE);
    245}
    246
    247static void gen_udp_csum(struct udphdr *udp_hdr, struct iphdr *ip_hdr)
    248{
    249	udp_hdr->check = 0;
    250	udp_hdr->check =
    251	    udp_csum(ip_hdr->saddr, ip_hdr->daddr, UDP_PKT_SIZE, IPPROTO_UDP, (u16 *)udp_hdr);
    252}
    253
    254static int xsk_configure_umem(struct xsk_umem_info *umem, void *buffer, u64 size)
    255{
    256	struct xsk_umem_config cfg = {
    257		.fill_size = XSK_RING_PROD__DEFAULT_NUM_DESCS,
    258		.comp_size = XSK_RING_CONS__DEFAULT_NUM_DESCS,
    259		.frame_size = umem->frame_size,
    260		.frame_headroom = umem->frame_headroom,
    261		.flags = XSK_UMEM__DEFAULT_FLAGS
    262	};
    263	int ret;
    264
    265	if (umem->unaligned_mode)
    266		cfg.flags |= XDP_UMEM_UNALIGNED_CHUNK_FLAG;
    267
    268	ret = xsk_umem__create(&umem->umem, buffer, size,
    269			       &umem->fq, &umem->cq, &cfg);
    270	if (ret)
    271		return ret;
    272
    273	umem->buffer = buffer;
    274	return 0;
    275}
    276
    277static void enable_busy_poll(struct xsk_socket_info *xsk)
    278{
    279	int sock_opt;
    280
    281	sock_opt = 1;
    282	if (setsockopt(xsk_socket__fd(xsk->xsk), SOL_SOCKET, SO_PREFER_BUSY_POLL,
    283		       (void *)&sock_opt, sizeof(sock_opt)) < 0)
    284		exit_with_error(errno);
    285
    286	sock_opt = 20;
    287	if (setsockopt(xsk_socket__fd(xsk->xsk), SOL_SOCKET, SO_BUSY_POLL,
    288		       (void *)&sock_opt, sizeof(sock_opt)) < 0)
    289		exit_with_error(errno);
    290
    291	sock_opt = BATCH_SIZE;
    292	if (setsockopt(xsk_socket__fd(xsk->xsk), SOL_SOCKET, SO_BUSY_POLL_BUDGET,
    293		       (void *)&sock_opt, sizeof(sock_opt)) < 0)
    294		exit_with_error(errno);
    295}
    296
    297static int xsk_configure_socket(struct xsk_socket_info *xsk, struct xsk_umem_info *umem,
    298				struct ifobject *ifobject, bool shared)
    299{
    300	struct xsk_socket_config cfg = {};
    301	struct xsk_ring_cons *rxr;
    302	struct xsk_ring_prod *txr;
    303
    304	xsk->umem = umem;
    305	cfg.rx_size = xsk->rxqsize;
    306	cfg.tx_size = XSK_RING_PROD__DEFAULT_NUM_DESCS;
    307	cfg.libbpf_flags = XSK_LIBBPF_FLAGS__INHIBIT_PROG_LOAD;
    308	cfg.xdp_flags = ifobject->xdp_flags;
    309	cfg.bind_flags = ifobject->bind_flags;
    310	if (shared)
    311		cfg.bind_flags |= XDP_SHARED_UMEM;
    312
    313	txr = ifobject->tx_on ? &xsk->tx : NULL;
    314	rxr = ifobject->rx_on ? &xsk->rx : NULL;
    315	return xsk_socket__create(&xsk->xsk, ifobject->ifname, 0, umem->umem, rxr, txr, &cfg);
    316}
    317
    318static struct option long_options[] = {
    319	{"interface", required_argument, 0, 'i'},
    320	{"busy-poll", no_argument, 0, 'b'},
    321	{"dump-pkts", no_argument, 0, 'D'},
    322	{"verbose", no_argument, 0, 'v'},
    323	{0, 0, 0, 0}
    324};
    325
    326static void usage(const char *prog)
    327{
    328	const char *str =
    329		"  Usage: %s [OPTIONS]\n"
    330		"  Options:\n"
    331		"  -i, --interface      Use interface\n"
    332		"  -D, --dump-pkts      Dump packets L2 - L5\n"
    333		"  -v, --verbose        Verbose output\n"
    334		"  -b, --busy-poll      Enable busy poll\n";
    335
    336	ksft_print_msg(str, prog);
    337}
    338
    339static int switch_namespace(const char *nsname)
    340{
    341	char fqns[26] = "/var/run/netns/";
    342	int nsfd;
    343
    344	if (!nsname || strlen(nsname) == 0)
    345		return -1;
    346
    347	strncat(fqns, nsname, sizeof(fqns) - strlen(fqns) - 1);
    348	nsfd = open(fqns, O_RDONLY);
    349
    350	if (nsfd == -1)
    351		exit_with_error(errno);
    352
    353	if (setns(nsfd, 0) == -1)
    354		exit_with_error(errno);
    355
    356	print_verbose("NS switched: %s\n", nsname);
    357
    358	return nsfd;
    359}
    360
    361static bool validate_interface(struct ifobject *ifobj)
    362{
    363	if (!strcmp(ifobj->ifname, ""))
    364		return false;
    365	return true;
    366}
    367
    368static void parse_command_line(struct ifobject *ifobj_tx, struct ifobject *ifobj_rx, int argc,
    369			       char **argv)
    370{
    371	struct ifobject *ifobj;
    372	u32 interface_nb = 0;
    373	int option_index, c;
    374
    375	opterr = 0;
    376
    377	for (;;) {
    378		char *sptr, *token;
    379
    380		c = getopt_long(argc, argv, "i:Dvb", long_options, &option_index);
    381		if (c == -1)
    382			break;
    383
    384		switch (c) {
    385		case 'i':
    386			if (interface_nb == 0)
    387				ifobj = ifobj_tx;
    388			else if (interface_nb == 1)
    389				ifobj = ifobj_rx;
    390			else
    391				break;
    392
    393			sptr = strndupa(optarg, strlen(optarg));
    394			memcpy(ifobj->ifname, strsep(&sptr, ","), MAX_INTERFACE_NAME_CHARS);
    395			token = strsep(&sptr, ",");
    396			if (token)
    397				memcpy(ifobj->nsname, token, MAX_INTERFACES_NAMESPACE_CHARS);
    398			interface_nb++;
    399			break;
    400		case 'D':
    401			opt_pkt_dump = true;
    402			break;
    403		case 'v':
    404			opt_verbose = true;
    405			break;
    406		case 'b':
    407			ifobj_tx->busy_poll = true;
    408			ifobj_rx->busy_poll = true;
    409			break;
    410		default:
    411			usage(basename(argv[0]));
    412			ksft_exit_xfail();
    413		}
    414	}
    415}
    416
    417static void __test_spec_init(struct test_spec *test, struct ifobject *ifobj_tx,
    418			     struct ifobject *ifobj_rx)
    419{
    420	u32 i, j;
    421
    422	for (i = 0; i < MAX_INTERFACES; i++) {
    423		struct ifobject *ifobj = i ? ifobj_rx : ifobj_tx;
    424
    425		ifobj->xsk = &ifobj->xsk_arr[0];
    426		ifobj->use_poll = false;
    427		ifobj->use_fill_ring = true;
    428		ifobj->release_rx = true;
    429		ifobj->pkt_stream = test->pkt_stream_default;
    430		ifobj->validation_func = NULL;
    431
    432		if (i == 0) {
    433			ifobj->rx_on = false;
    434			ifobj->tx_on = true;
    435		} else {
    436			ifobj->rx_on = true;
    437			ifobj->tx_on = false;
    438		}
    439
    440		memset(ifobj->umem, 0, sizeof(*ifobj->umem));
    441		ifobj->umem->num_frames = DEFAULT_UMEM_BUFFERS;
    442		ifobj->umem->frame_size = XSK_UMEM__DEFAULT_FRAME_SIZE;
    443
    444		for (j = 0; j < MAX_SOCKETS; j++) {
    445			memset(&ifobj->xsk_arr[j], 0, sizeof(ifobj->xsk_arr[j]));
    446			ifobj->xsk_arr[j].rxqsize = XSK_RING_CONS__DEFAULT_NUM_DESCS;
    447		}
    448	}
    449
    450	test->ifobj_tx = ifobj_tx;
    451	test->ifobj_rx = ifobj_rx;
    452	test->current_step = 0;
    453	test->total_steps = 1;
    454	test->nb_sockets = 1;
    455	test->fail = false;
    456}
    457
    458static void test_spec_init(struct test_spec *test, struct ifobject *ifobj_tx,
    459			   struct ifobject *ifobj_rx, enum test_mode mode)
    460{
    461	struct pkt_stream *pkt_stream;
    462	u32 i;
    463
    464	pkt_stream = test->pkt_stream_default;
    465	memset(test, 0, sizeof(*test));
    466	test->pkt_stream_default = pkt_stream;
    467
    468	for (i = 0; i < MAX_INTERFACES; i++) {
    469		struct ifobject *ifobj = i ? ifobj_rx : ifobj_tx;
    470
    471		ifobj->xdp_flags = XDP_FLAGS_UPDATE_IF_NOEXIST;
    472		if (mode == TEST_MODE_SKB)
    473			ifobj->xdp_flags |= XDP_FLAGS_SKB_MODE;
    474		else
    475			ifobj->xdp_flags |= XDP_FLAGS_DRV_MODE;
    476
    477		ifobj->bind_flags = XDP_USE_NEED_WAKEUP | XDP_COPY;
    478	}
    479
    480	__test_spec_init(test, ifobj_tx, ifobj_rx);
    481}
    482
    483static void test_spec_reset(struct test_spec *test)
    484{
    485	__test_spec_init(test, test->ifobj_tx, test->ifobj_rx);
    486}
    487
    488static void test_spec_set_name(struct test_spec *test, const char *name)
    489{
    490	strncpy(test->name, name, MAX_TEST_NAME_SIZE);
    491}
    492
    493static void pkt_stream_reset(struct pkt_stream *pkt_stream)
    494{
    495	if (pkt_stream)
    496		pkt_stream->rx_pkt_nb = 0;
    497}
    498
    499static struct pkt *pkt_stream_get_pkt(struct pkt_stream *pkt_stream, u32 pkt_nb)
    500{
    501	if (pkt_nb >= pkt_stream->nb_pkts)
    502		return NULL;
    503
    504	return &pkt_stream->pkts[pkt_nb];
    505}
    506
    507static struct pkt *pkt_stream_get_next_rx_pkt(struct pkt_stream *pkt_stream, u32 *pkts_sent)
    508{
    509	while (pkt_stream->rx_pkt_nb < pkt_stream->nb_pkts) {
    510		(*pkts_sent)++;
    511		if (pkt_stream->pkts[pkt_stream->rx_pkt_nb].valid)
    512			return &pkt_stream->pkts[pkt_stream->rx_pkt_nb++];
    513		pkt_stream->rx_pkt_nb++;
    514	}
    515	return NULL;
    516}
    517
    518static void pkt_stream_delete(struct pkt_stream *pkt_stream)
    519{
    520	free(pkt_stream->pkts);
    521	free(pkt_stream);
    522}
    523
    524static void pkt_stream_restore_default(struct test_spec *test)
    525{
    526	struct pkt_stream *tx_pkt_stream = test->ifobj_tx->pkt_stream;
    527
    528	if (tx_pkt_stream != test->pkt_stream_default) {
    529		pkt_stream_delete(test->ifobj_tx->pkt_stream);
    530		test->ifobj_tx->pkt_stream = test->pkt_stream_default;
    531	}
    532
    533	if (test->ifobj_rx->pkt_stream != test->pkt_stream_default &&
    534	    test->ifobj_rx->pkt_stream != tx_pkt_stream)
    535		pkt_stream_delete(test->ifobj_rx->pkt_stream);
    536	test->ifobj_rx->pkt_stream = test->pkt_stream_default;
    537}
    538
    539static struct pkt_stream *__pkt_stream_alloc(u32 nb_pkts)
    540{
    541	struct pkt_stream *pkt_stream;
    542
    543	pkt_stream = calloc(1, sizeof(*pkt_stream));
    544	if (!pkt_stream)
    545		return NULL;
    546
    547	pkt_stream->pkts = calloc(nb_pkts, sizeof(*pkt_stream->pkts));
    548	if (!pkt_stream->pkts) {
    549		free(pkt_stream);
    550		return NULL;
    551	}
    552
    553	pkt_stream->nb_pkts = nb_pkts;
    554	return pkt_stream;
    555}
    556
    557static void pkt_set(struct xsk_umem_info *umem, struct pkt *pkt, u64 addr, u32 len)
    558{
    559	pkt->addr = addr;
    560	pkt->len = len;
    561	if (len > umem->frame_size - XDP_PACKET_HEADROOM - MIN_PKT_SIZE * 2 - umem->frame_headroom)
    562		pkt->valid = false;
    563	else
    564		pkt->valid = true;
    565}
    566
    567static struct pkt_stream *pkt_stream_generate(struct xsk_umem_info *umem, u32 nb_pkts, u32 pkt_len)
    568{
    569	struct pkt_stream *pkt_stream;
    570	u32 i;
    571
    572	pkt_stream = __pkt_stream_alloc(nb_pkts);
    573	if (!pkt_stream)
    574		exit_with_error(ENOMEM);
    575
    576	pkt_stream->nb_pkts = nb_pkts;
    577	for (i = 0; i < nb_pkts; i++) {
    578		pkt_set(umem, &pkt_stream->pkts[i], (i % umem->num_frames) * umem->frame_size,
    579			pkt_len);
    580		pkt_stream->pkts[i].payload = i;
    581	}
    582
    583	return pkt_stream;
    584}
    585
    586static struct pkt_stream *pkt_stream_clone(struct xsk_umem_info *umem,
    587					   struct pkt_stream *pkt_stream)
    588{
    589	return pkt_stream_generate(umem, pkt_stream->nb_pkts, pkt_stream->pkts[0].len);
    590}
    591
    592static void pkt_stream_replace(struct test_spec *test, u32 nb_pkts, u32 pkt_len)
    593{
    594	struct pkt_stream *pkt_stream;
    595
    596	pkt_stream = pkt_stream_generate(test->ifobj_tx->umem, nb_pkts, pkt_len);
    597	test->ifobj_tx->pkt_stream = pkt_stream;
    598	test->ifobj_rx->pkt_stream = pkt_stream;
    599}
    600
    601static void pkt_stream_replace_half(struct test_spec *test, u32 pkt_len, int offset)
    602{
    603	struct xsk_umem_info *umem = test->ifobj_tx->umem;
    604	struct pkt_stream *pkt_stream;
    605	u32 i;
    606
    607	pkt_stream = pkt_stream_clone(umem, test->pkt_stream_default);
    608	for (i = 1; i < test->pkt_stream_default->nb_pkts; i += 2)
    609		pkt_set(umem, &pkt_stream->pkts[i],
    610			(i % umem->num_frames) * umem->frame_size + offset, pkt_len);
    611
    612	test->ifobj_tx->pkt_stream = pkt_stream;
    613	test->ifobj_rx->pkt_stream = pkt_stream;
    614}
    615
    616static void pkt_stream_receive_half(struct test_spec *test)
    617{
    618	struct xsk_umem_info *umem = test->ifobj_rx->umem;
    619	struct pkt_stream *pkt_stream = test->ifobj_tx->pkt_stream;
    620	u32 i;
    621
    622	test->ifobj_rx->pkt_stream = pkt_stream_generate(umem, pkt_stream->nb_pkts,
    623							 pkt_stream->pkts[0].len);
    624	pkt_stream = test->ifobj_rx->pkt_stream;
    625	for (i = 1; i < pkt_stream->nb_pkts; i += 2)
    626		pkt_stream->pkts[i].valid = false;
    627}
    628
    629static struct pkt *pkt_generate(struct ifobject *ifobject, u32 pkt_nb)
    630{
    631	struct pkt *pkt = pkt_stream_get_pkt(ifobject->pkt_stream, pkt_nb);
    632	struct udphdr *udp_hdr;
    633	struct ethhdr *eth_hdr;
    634	struct iphdr *ip_hdr;
    635	void *data;
    636
    637	if (!pkt)
    638		return NULL;
    639	if (!pkt->valid || pkt->len < MIN_PKT_SIZE)
    640		return pkt;
    641
    642	data = xsk_umem__get_data(ifobject->umem->buffer, pkt->addr);
    643	udp_hdr = (struct udphdr *)(data + sizeof(struct ethhdr) + sizeof(struct iphdr));
    644	ip_hdr = (struct iphdr *)(data + sizeof(struct ethhdr));
    645	eth_hdr = (struct ethhdr *)data;
    646
    647	gen_udp_hdr(pkt_nb, data, ifobject, udp_hdr);
    648	gen_ip_hdr(ifobject, ip_hdr);
    649	gen_udp_csum(udp_hdr, ip_hdr);
    650	gen_eth_hdr(ifobject, eth_hdr);
    651
    652	return pkt;
    653}
    654
    655static void pkt_stream_generate_custom(struct test_spec *test, struct pkt *pkts, u32 nb_pkts)
    656{
    657	struct pkt_stream *pkt_stream;
    658	u32 i;
    659
    660	pkt_stream = __pkt_stream_alloc(nb_pkts);
    661	if (!pkt_stream)
    662		exit_with_error(ENOMEM);
    663
    664	test->ifobj_tx->pkt_stream = pkt_stream;
    665	test->ifobj_rx->pkt_stream = pkt_stream;
    666
    667	for (i = 0; i < nb_pkts; i++) {
    668		pkt_stream->pkts[i].addr = pkts[i].addr;
    669		pkt_stream->pkts[i].len = pkts[i].len;
    670		pkt_stream->pkts[i].payload = i;
    671		pkt_stream->pkts[i].valid = pkts[i].valid;
    672	}
    673}
    674
    675static void pkt_dump(void *pkt, u32 len)
    676{
    677	char s[INET_ADDRSTRLEN];
    678	struct ethhdr *ethhdr;
    679	struct udphdr *udphdr;
    680	struct iphdr *iphdr;
    681	int payload, i;
    682
    683	ethhdr = pkt;
    684	iphdr = pkt + sizeof(*ethhdr);
    685	udphdr = pkt + sizeof(*ethhdr) + sizeof(*iphdr);
    686
    687	/*extract L2 frame */
    688	fprintf(stdout, "DEBUG>> L2: dst mac: ");
    689	for (i = 0; i < ETH_ALEN; i++)
    690		fprintf(stdout, "%02X", ethhdr->h_dest[i]);
    691
    692	fprintf(stdout, "\nDEBUG>> L2: src mac: ");
    693	for (i = 0; i < ETH_ALEN; i++)
    694		fprintf(stdout, "%02X", ethhdr->h_source[i]);
    695
    696	/*extract L3 frame */
    697	fprintf(stdout, "\nDEBUG>> L3: ip_hdr->ihl: %02X\n", iphdr->ihl);
    698	fprintf(stdout, "DEBUG>> L3: ip_hdr->saddr: %s\n",
    699		inet_ntop(AF_INET, &iphdr->saddr, s, sizeof(s)));
    700	fprintf(stdout, "DEBUG>> L3: ip_hdr->daddr: %s\n",
    701		inet_ntop(AF_INET, &iphdr->daddr, s, sizeof(s)));
    702	/*extract L4 frame */
    703	fprintf(stdout, "DEBUG>> L4: udp_hdr->src: %d\n", ntohs(udphdr->source));
    704	fprintf(stdout, "DEBUG>> L4: udp_hdr->dst: %d\n", ntohs(udphdr->dest));
    705	/*extract L5 frame */
    706	payload = *((uint32_t *)(pkt + PKT_HDR_SIZE));
    707
    708	fprintf(stdout, "DEBUG>> L5: payload: %d\n", payload);
    709	fprintf(stdout, "---------------------------------------\n");
    710}
    711
    712static bool is_offset_correct(struct xsk_umem_info *umem, struct pkt_stream *pkt_stream, u64 addr,
    713			      u64 pkt_stream_addr)
    714{
    715	u32 headroom = umem->unaligned_mode ? 0 : umem->frame_headroom;
    716	u32 offset = addr % umem->frame_size, expected_offset = 0;
    717
    718	if (!pkt_stream->use_addr_for_fill)
    719		pkt_stream_addr = 0;
    720
    721	expected_offset += (pkt_stream_addr + headroom + XDP_PACKET_HEADROOM) % umem->frame_size;
    722
    723	if (offset == expected_offset)
    724		return true;
    725
    726	ksft_print_msg("[%s] expected [%u], got [%u]\n", __func__, expected_offset, offset);
    727	return false;
    728}
    729
    730static bool is_pkt_valid(struct pkt *pkt, void *buffer, u64 addr, u32 len)
    731{
    732	void *data = xsk_umem__get_data(buffer, addr);
    733	struct iphdr *iphdr = (struct iphdr *)(data + sizeof(struct ethhdr));
    734
    735	if (!pkt) {
    736		ksft_print_msg("[%s] too many packets received\n", __func__);
    737		return false;
    738	}
    739
    740	if (len < MIN_PKT_SIZE || pkt->len < MIN_PKT_SIZE) {
    741		/* Do not try to verify packets that are smaller than minimum size. */
    742		return true;
    743	}
    744
    745	if (pkt->len != len) {
    746		ksft_print_msg("[%s] expected length [%d], got length [%d]\n",
    747			       __func__, pkt->len, len);
    748		return false;
    749	}
    750
    751	if (iphdr->version == IP_PKT_VER && iphdr->tos == IP_PKT_TOS) {
    752		u32 seqnum = ntohl(*((u32 *)(data + PKT_HDR_SIZE)));
    753
    754		if (opt_pkt_dump)
    755			pkt_dump(data, PKT_SIZE);
    756
    757		if (pkt->payload != seqnum) {
    758			ksft_print_msg("[%s] expected seqnum [%d], got seqnum [%d]\n",
    759				       __func__, pkt->payload, seqnum);
    760			return false;
    761		}
    762	} else {
    763		ksft_print_msg("Invalid frame received: ");
    764		ksft_print_msg("[IP_PKT_VER: %02X], [IP_PKT_TOS: %02X]\n", iphdr->version,
    765			       iphdr->tos);
    766		return false;
    767	}
    768
    769	return true;
    770}
    771
    772static void kick_tx(struct xsk_socket_info *xsk)
    773{
    774	int ret;
    775
    776	ret = sendto(xsk_socket__fd(xsk->xsk), NULL, 0, MSG_DONTWAIT, NULL, 0);
    777	if (ret >= 0)
    778		return;
    779	if (errno == ENOBUFS || errno == EAGAIN || errno == EBUSY || errno == ENETDOWN) {
    780		usleep(100);
    781		return;
    782	}
    783	exit_with_error(errno);
    784}
    785
    786static void kick_rx(struct xsk_socket_info *xsk)
    787{
    788	int ret;
    789
    790	ret = recvfrom(xsk_socket__fd(xsk->xsk), NULL, 0, MSG_DONTWAIT, NULL, NULL);
    791	if (ret < 0)
    792		exit_with_error(errno);
    793}
    794
    795static int complete_pkts(struct xsk_socket_info *xsk, int batch_size)
    796{
    797	unsigned int rcvd;
    798	u32 idx;
    799
    800	if (xsk_ring_prod__needs_wakeup(&xsk->tx))
    801		kick_tx(xsk);
    802
    803	rcvd = xsk_ring_cons__peek(&xsk->umem->cq, batch_size, &idx);
    804	if (rcvd) {
    805		if (rcvd > xsk->outstanding_tx) {
    806			u64 addr = *xsk_ring_cons__comp_addr(&xsk->umem->cq, idx + rcvd - 1);
    807
    808			ksft_print_msg("[%s] Too many packets completed\n", __func__);
    809			ksft_print_msg("Last completion address: %llx\n", addr);
    810			return TEST_FAILURE;
    811		}
    812
    813		xsk_ring_cons__release(&xsk->umem->cq, rcvd);
    814		xsk->outstanding_tx -= rcvd;
    815	}
    816
    817	return TEST_PASS;
    818}
    819
    820static int receive_pkts(struct ifobject *ifobj, struct pollfd *fds)
    821{
    822	struct timeval tv_end, tv_now, tv_timeout = {RECV_TMOUT, 0};
    823	u32 idx_rx = 0, idx_fq = 0, rcvd, i, pkts_sent = 0;
    824	struct pkt_stream *pkt_stream = ifobj->pkt_stream;
    825	struct xsk_socket_info *xsk = ifobj->xsk;
    826	struct xsk_umem_info *umem = xsk->umem;
    827	struct pkt *pkt;
    828	int ret;
    829
    830	ret = gettimeofday(&tv_now, NULL);
    831	if (ret)
    832		exit_with_error(errno);
    833	timeradd(&tv_now, &tv_timeout, &tv_end);
    834
    835	pkt = pkt_stream_get_next_rx_pkt(pkt_stream, &pkts_sent);
    836	while (pkt) {
    837		ret = gettimeofday(&tv_now, NULL);
    838		if (ret)
    839			exit_with_error(errno);
    840		if (timercmp(&tv_now, &tv_end, >)) {
    841			ksft_print_msg("ERROR: [%s] Receive loop timed out\n", __func__);
    842			return TEST_FAILURE;
    843		}
    844
    845		kick_rx(xsk);
    846
    847		rcvd = xsk_ring_cons__peek(&xsk->rx, BATCH_SIZE, &idx_rx);
    848		if (!rcvd) {
    849			if (xsk_ring_prod__needs_wakeup(&umem->fq)) {
    850				ret = poll(fds, 1, POLL_TMOUT);
    851				if (ret < 0)
    852					exit_with_error(-ret);
    853			}
    854			continue;
    855		}
    856
    857		if (ifobj->use_fill_ring) {
    858			ret = xsk_ring_prod__reserve(&umem->fq, rcvd, &idx_fq);
    859			while (ret != rcvd) {
    860				if (ret < 0)
    861					exit_with_error(-ret);
    862				if (xsk_ring_prod__needs_wakeup(&umem->fq)) {
    863					ret = poll(fds, 1, POLL_TMOUT);
    864					if (ret < 0)
    865						exit_with_error(-ret);
    866				}
    867				ret = xsk_ring_prod__reserve(&umem->fq, rcvd, &idx_fq);
    868			}
    869		}
    870
    871		for (i = 0; i < rcvd; i++) {
    872			const struct xdp_desc *desc = xsk_ring_cons__rx_desc(&xsk->rx, idx_rx++);
    873			u64 addr = desc->addr, orig;
    874
    875			orig = xsk_umem__extract_addr(addr);
    876			addr = xsk_umem__add_offset_to_addr(addr);
    877
    878			if (!is_pkt_valid(pkt, umem->buffer, addr, desc->len) ||
    879			    !is_offset_correct(umem, pkt_stream, addr, pkt->addr))
    880				return TEST_FAILURE;
    881
    882			if (ifobj->use_fill_ring)
    883				*xsk_ring_prod__fill_addr(&umem->fq, idx_fq++) = orig;
    884			pkt = pkt_stream_get_next_rx_pkt(pkt_stream, &pkts_sent);
    885		}
    886
    887		if (ifobj->use_fill_ring)
    888			xsk_ring_prod__submit(&umem->fq, rcvd);
    889		if (ifobj->release_rx)
    890			xsk_ring_cons__release(&xsk->rx, rcvd);
    891
    892		pthread_mutex_lock(&pacing_mutex);
    893		pkts_in_flight -= pkts_sent;
    894		if (pkts_in_flight < umem->num_frames)
    895			pthread_cond_signal(&pacing_cond);
    896		pthread_mutex_unlock(&pacing_mutex);
    897		pkts_sent = 0;
    898	}
    899
    900	return TEST_PASS;
    901}
    902
    903static int __send_pkts(struct ifobject *ifobject, u32 *pkt_nb)
    904{
    905	struct xsk_socket_info *xsk = ifobject->xsk;
    906	u32 i, idx, valid_pkts = 0;
    907
    908	while (xsk_ring_prod__reserve(&xsk->tx, BATCH_SIZE, &idx) < BATCH_SIZE)
    909		complete_pkts(xsk, BATCH_SIZE);
    910
    911	for (i = 0; i < BATCH_SIZE; i++) {
    912		struct xdp_desc *tx_desc = xsk_ring_prod__tx_desc(&xsk->tx, idx + i);
    913		struct pkt *pkt = pkt_generate(ifobject, *pkt_nb);
    914
    915		if (!pkt)
    916			break;
    917
    918		tx_desc->addr = pkt->addr;
    919		tx_desc->len = pkt->len;
    920		(*pkt_nb)++;
    921		if (pkt->valid)
    922			valid_pkts++;
    923	}
    924
    925	pthread_mutex_lock(&pacing_mutex);
    926	pkts_in_flight += valid_pkts;
    927	/* pkts_in_flight might be negative if many invalid packets are sent */
    928	if (pkts_in_flight >= (int)(ifobject->umem->num_frames - BATCH_SIZE)) {
    929		kick_tx(xsk);
    930		pthread_cond_wait(&pacing_cond, &pacing_mutex);
    931	}
    932	pthread_mutex_unlock(&pacing_mutex);
    933
    934	xsk_ring_prod__submit(&xsk->tx, i);
    935	xsk->outstanding_tx += valid_pkts;
    936	if (complete_pkts(xsk, i))
    937		return TEST_FAILURE;
    938
    939	usleep(10);
    940	return TEST_PASS;
    941}
    942
    943static void wait_for_tx_completion(struct xsk_socket_info *xsk)
    944{
    945	while (xsk->outstanding_tx)
    946		complete_pkts(xsk, BATCH_SIZE);
    947}
    948
    949static int send_pkts(struct test_spec *test, struct ifobject *ifobject)
    950{
    951	struct pollfd fds = { };
    952	u32 pkt_cnt = 0;
    953
    954	fds.fd = xsk_socket__fd(ifobject->xsk->xsk);
    955	fds.events = POLLOUT;
    956
    957	while (pkt_cnt < ifobject->pkt_stream->nb_pkts) {
    958		int err;
    959
    960		if (ifobject->use_poll) {
    961			int ret;
    962
    963			ret = poll(&fds, 1, POLL_TMOUT);
    964			if (ret <= 0)
    965				continue;
    966
    967			if (!(fds.revents & POLLOUT))
    968				continue;
    969		}
    970
    971		err = __send_pkts(ifobject, &pkt_cnt);
    972		if (err || test->fail)
    973			return TEST_FAILURE;
    974	}
    975
    976	wait_for_tx_completion(ifobject->xsk);
    977	return TEST_PASS;
    978}
    979
    980static int get_xsk_stats(struct xsk_socket *xsk, struct xdp_statistics *stats)
    981{
    982	int fd = xsk_socket__fd(xsk), err;
    983	socklen_t optlen, expected_len;
    984
    985	optlen = sizeof(*stats);
    986	err = getsockopt(fd, SOL_XDP, XDP_STATISTICS, stats, &optlen);
    987	if (err) {
    988		ksft_print_msg("[%s] getsockopt(XDP_STATISTICS) error %u %s\n",
    989			       __func__, -err, strerror(-err));
    990		return TEST_FAILURE;
    991	}
    992
    993	expected_len = sizeof(struct xdp_statistics);
    994	if (optlen != expected_len) {
    995		ksft_print_msg("[%s] getsockopt optlen error. Expected: %u got: %u\n",
    996			       __func__, expected_len, optlen);
    997		return TEST_FAILURE;
    998	}
    999
   1000	return TEST_PASS;
   1001}
   1002
   1003static int validate_rx_dropped(struct ifobject *ifobject)
   1004{
   1005	struct xsk_socket *xsk = ifobject->xsk->xsk;
   1006	struct xdp_statistics stats;
   1007	int err;
   1008
   1009	kick_rx(ifobject->xsk);
   1010
   1011	err = get_xsk_stats(xsk, &stats);
   1012	if (err)
   1013		return TEST_FAILURE;
   1014
   1015	if (stats.rx_dropped == ifobject->pkt_stream->nb_pkts / 2)
   1016		return TEST_PASS;
   1017
   1018	return TEST_FAILURE;
   1019}
   1020
   1021static int validate_rx_full(struct ifobject *ifobject)
   1022{
   1023	struct xsk_socket *xsk = ifobject->xsk->xsk;
   1024	struct xdp_statistics stats;
   1025	int err;
   1026
   1027	usleep(1000);
   1028	kick_rx(ifobject->xsk);
   1029
   1030	err = get_xsk_stats(xsk, &stats);
   1031	if (err)
   1032		return TEST_FAILURE;
   1033
   1034	if (stats.rx_ring_full)
   1035		return TEST_PASS;
   1036
   1037	return TEST_FAILURE;
   1038}
   1039
   1040static int validate_fill_empty(struct ifobject *ifobject)
   1041{
   1042	struct xsk_socket *xsk = ifobject->xsk->xsk;
   1043	struct xdp_statistics stats;
   1044	int err;
   1045
   1046	usleep(1000);
   1047	kick_rx(ifobject->xsk);
   1048
   1049	err = get_xsk_stats(xsk, &stats);
   1050	if (err)
   1051		return TEST_FAILURE;
   1052
   1053	if (stats.rx_fill_ring_empty_descs)
   1054		return TEST_PASS;
   1055
   1056	return TEST_FAILURE;
   1057}
   1058
   1059static int validate_tx_invalid_descs(struct ifobject *ifobject)
   1060{
   1061	struct xsk_socket *xsk = ifobject->xsk->xsk;
   1062	int fd = xsk_socket__fd(xsk);
   1063	struct xdp_statistics stats;
   1064	socklen_t optlen;
   1065	int err;
   1066
   1067	optlen = sizeof(stats);
   1068	err = getsockopt(fd, SOL_XDP, XDP_STATISTICS, &stats, &optlen);
   1069	if (err) {
   1070		ksft_print_msg("[%s] getsockopt(XDP_STATISTICS) error %u %s\n",
   1071			       __func__, -err, strerror(-err));
   1072		return TEST_FAILURE;
   1073	}
   1074
   1075	if (stats.tx_invalid_descs != ifobject->pkt_stream->nb_pkts / 2) {
   1076		ksft_print_msg("[%s] tx_invalid_descs incorrect. Got [%u] expected [%u]\n",
   1077			       __func__, stats.tx_invalid_descs, ifobject->pkt_stream->nb_pkts);
   1078		return TEST_FAILURE;
   1079	}
   1080
   1081	return TEST_PASS;
   1082}
   1083
   1084static void thread_common_ops(struct test_spec *test, struct ifobject *ifobject)
   1085{
   1086	u64 umem_sz = ifobject->umem->num_frames * ifobject->umem->frame_size;
   1087	int mmap_flags = MAP_PRIVATE | MAP_ANONYMOUS | MAP_NORESERVE;
   1088	int ret, ifindex;
   1089	void *bufs;
   1090	u32 i;
   1091
   1092	ifobject->ns_fd = switch_namespace(ifobject->nsname);
   1093
   1094	if (ifobject->umem->unaligned_mode)
   1095		mmap_flags |= MAP_HUGETLB;
   1096
   1097	bufs = mmap(NULL, umem_sz, PROT_READ | PROT_WRITE, mmap_flags, -1, 0);
   1098	if (bufs == MAP_FAILED)
   1099		exit_with_error(errno);
   1100
   1101	ret = xsk_configure_umem(ifobject->umem, bufs, umem_sz);
   1102	if (ret)
   1103		exit_with_error(-ret);
   1104
   1105	for (i = 0; i < test->nb_sockets; i++) {
   1106		u32 ctr = 0;
   1107
   1108		while (ctr++ < SOCK_RECONF_CTR) {
   1109			ret = xsk_configure_socket(&ifobject->xsk_arr[i], ifobject->umem,
   1110						   ifobject, !!i);
   1111			if (!ret)
   1112				break;
   1113
   1114			/* Retry if it fails as xsk_socket__create() is asynchronous */
   1115			if (ctr >= SOCK_RECONF_CTR)
   1116				exit_with_error(-ret);
   1117			usleep(USLEEP_MAX);
   1118		}
   1119
   1120		if (ifobject->busy_poll)
   1121			enable_busy_poll(&ifobject->xsk_arr[i]);
   1122	}
   1123
   1124	ifobject->xsk = &ifobject->xsk_arr[0];
   1125
   1126	if (!ifobject->rx_on)
   1127		return;
   1128
   1129	ifindex = if_nametoindex(ifobject->ifname);
   1130	if (!ifindex)
   1131		exit_with_error(errno);
   1132
   1133	ret = xsk_setup_xdp_prog(ifindex, &ifobject->xsk_map_fd);
   1134	if (ret)
   1135		exit_with_error(-ret);
   1136
   1137	ret = xsk_socket__update_xskmap(ifobject->xsk->xsk, ifobject->xsk_map_fd);
   1138	if (ret)
   1139		exit_with_error(-ret);
   1140}
   1141
   1142static void testapp_cleanup_xsk_res(struct ifobject *ifobj)
   1143{
   1144	print_verbose("Destroying socket\n");
   1145	xsk_socket__delete(ifobj->xsk->xsk);
   1146	munmap(ifobj->umem->buffer, ifobj->umem->num_frames * ifobj->umem->frame_size);
   1147	xsk_umem__delete(ifobj->umem->umem);
   1148}
   1149
   1150static void *worker_testapp_validate_tx(void *arg)
   1151{
   1152	struct test_spec *test = (struct test_spec *)arg;
   1153	struct ifobject *ifobject = test->ifobj_tx;
   1154	int err;
   1155
   1156	if (test->current_step == 1)
   1157		thread_common_ops(test, ifobject);
   1158
   1159	print_verbose("Sending %d packets on interface %s\n", ifobject->pkt_stream->nb_pkts,
   1160		      ifobject->ifname);
   1161	err = send_pkts(test, ifobject);
   1162
   1163	if (!err && ifobject->validation_func)
   1164		err = ifobject->validation_func(ifobject);
   1165	if (err)
   1166		report_failure(test);
   1167
   1168	if (test->total_steps == test->current_step || err)
   1169		testapp_cleanup_xsk_res(ifobject);
   1170	pthread_exit(NULL);
   1171}
   1172
   1173static void xsk_populate_fill_ring(struct xsk_umem_info *umem, struct pkt_stream *pkt_stream)
   1174{
   1175	u32 idx = 0, i, buffers_to_fill;
   1176	int ret;
   1177
   1178	if (umem->num_frames < XSK_RING_PROD__DEFAULT_NUM_DESCS)
   1179		buffers_to_fill = umem->num_frames;
   1180	else
   1181		buffers_to_fill = XSK_RING_PROD__DEFAULT_NUM_DESCS;
   1182
   1183	ret = xsk_ring_prod__reserve(&umem->fq, buffers_to_fill, &idx);
   1184	if (ret != buffers_to_fill)
   1185		exit_with_error(ENOSPC);
   1186	for (i = 0; i < buffers_to_fill; i++) {
   1187		u64 addr;
   1188
   1189		if (pkt_stream->use_addr_for_fill) {
   1190			struct pkt *pkt = pkt_stream_get_pkt(pkt_stream, i);
   1191
   1192			if (!pkt)
   1193				break;
   1194			addr = pkt->addr;
   1195		} else {
   1196			addr = i * umem->frame_size;
   1197		}
   1198
   1199		*xsk_ring_prod__fill_addr(&umem->fq, idx++) = addr;
   1200	}
   1201	xsk_ring_prod__submit(&umem->fq, buffers_to_fill);
   1202}
   1203
   1204static void *worker_testapp_validate_rx(void *arg)
   1205{
   1206	struct test_spec *test = (struct test_spec *)arg;
   1207	struct ifobject *ifobject = test->ifobj_rx;
   1208	struct pollfd fds = { };
   1209	int err;
   1210
   1211	if (test->current_step == 1)
   1212		thread_common_ops(test, ifobject);
   1213
   1214	xsk_populate_fill_ring(ifobject->umem, ifobject->pkt_stream);
   1215
   1216	fds.fd = xsk_socket__fd(ifobject->xsk->xsk);
   1217	fds.events = POLLIN;
   1218
   1219	pthread_barrier_wait(&barr);
   1220
   1221	err = receive_pkts(ifobject, &fds);
   1222
   1223	if (!err && ifobject->validation_func)
   1224		err = ifobject->validation_func(ifobject);
   1225	if (err) {
   1226		report_failure(test);
   1227		pthread_mutex_lock(&pacing_mutex);
   1228		pthread_cond_signal(&pacing_cond);
   1229		pthread_mutex_unlock(&pacing_mutex);
   1230	}
   1231
   1232	if (test->total_steps == test->current_step || err)
   1233		testapp_cleanup_xsk_res(ifobject);
   1234	pthread_exit(NULL);
   1235}
   1236
   1237static int testapp_validate_traffic(struct test_spec *test)
   1238{
   1239	struct ifobject *ifobj_tx = test->ifobj_tx;
   1240	struct ifobject *ifobj_rx = test->ifobj_rx;
   1241	pthread_t t0, t1;
   1242
   1243	if (pthread_barrier_init(&barr, NULL, 2))
   1244		exit_with_error(errno);
   1245
   1246	test->current_step++;
   1247	pkt_stream_reset(ifobj_rx->pkt_stream);
   1248	pkts_in_flight = 0;
   1249
   1250	/*Spawn RX thread */
   1251	pthread_create(&t0, NULL, ifobj_rx->func_ptr, test);
   1252
   1253	pthread_barrier_wait(&barr);
   1254	if (pthread_barrier_destroy(&barr))
   1255		exit_with_error(errno);
   1256
   1257	/*Spawn TX thread */
   1258	pthread_create(&t1, NULL, ifobj_tx->func_ptr, test);
   1259
   1260	pthread_join(t1, NULL);
   1261	pthread_join(t0, NULL);
   1262
   1263	return !!test->fail;
   1264}
   1265
   1266static void testapp_teardown(struct test_spec *test)
   1267{
   1268	int i;
   1269
   1270	test_spec_set_name(test, "TEARDOWN");
   1271	for (i = 0; i < MAX_TEARDOWN_ITER; i++) {
   1272		if (testapp_validate_traffic(test))
   1273			return;
   1274		test_spec_reset(test);
   1275	}
   1276}
   1277
   1278static void swap_directions(struct ifobject **ifobj1, struct ifobject **ifobj2)
   1279{
   1280	thread_func_t tmp_func_ptr = (*ifobj1)->func_ptr;
   1281	struct ifobject *tmp_ifobj = (*ifobj1);
   1282
   1283	(*ifobj1)->func_ptr = (*ifobj2)->func_ptr;
   1284	(*ifobj2)->func_ptr = tmp_func_ptr;
   1285
   1286	*ifobj1 = *ifobj2;
   1287	*ifobj2 = tmp_ifobj;
   1288}
   1289
   1290static void testapp_bidi(struct test_spec *test)
   1291{
   1292	test_spec_set_name(test, "BIDIRECTIONAL");
   1293	test->ifobj_tx->rx_on = true;
   1294	test->ifobj_rx->tx_on = true;
   1295	test->total_steps = 2;
   1296	if (testapp_validate_traffic(test))
   1297		return;
   1298
   1299	print_verbose("Switching Tx/Rx vectors\n");
   1300	swap_directions(&test->ifobj_rx, &test->ifobj_tx);
   1301	testapp_validate_traffic(test);
   1302
   1303	swap_directions(&test->ifobj_rx, &test->ifobj_tx);
   1304}
   1305
   1306static void swap_xsk_resources(struct ifobject *ifobj_tx, struct ifobject *ifobj_rx)
   1307{
   1308	int ret;
   1309
   1310	xsk_socket__delete(ifobj_tx->xsk->xsk);
   1311	xsk_socket__delete(ifobj_rx->xsk->xsk);
   1312	ifobj_tx->xsk = &ifobj_tx->xsk_arr[1];
   1313	ifobj_rx->xsk = &ifobj_rx->xsk_arr[1];
   1314
   1315	ret = xsk_socket__update_xskmap(ifobj_rx->xsk->xsk, ifobj_rx->xsk_map_fd);
   1316	if (ret)
   1317		exit_with_error(-ret);
   1318}
   1319
   1320static void testapp_bpf_res(struct test_spec *test)
   1321{
   1322	test_spec_set_name(test, "BPF_RES");
   1323	test->total_steps = 2;
   1324	test->nb_sockets = 2;
   1325	if (testapp_validate_traffic(test))
   1326		return;
   1327
   1328	swap_xsk_resources(test->ifobj_tx, test->ifobj_rx);
   1329	testapp_validate_traffic(test);
   1330}
   1331
   1332static void testapp_headroom(struct test_spec *test)
   1333{
   1334	test_spec_set_name(test, "UMEM_HEADROOM");
   1335	test->ifobj_rx->umem->frame_headroom = UMEM_HEADROOM_TEST_SIZE;
   1336	testapp_validate_traffic(test);
   1337}
   1338
   1339static void testapp_stats_rx_dropped(struct test_spec *test)
   1340{
   1341	test_spec_set_name(test, "STAT_RX_DROPPED");
   1342	test->ifobj_rx->umem->frame_headroom = test->ifobj_rx->umem->frame_size -
   1343		XDP_PACKET_HEADROOM - MIN_PKT_SIZE * 3;
   1344	pkt_stream_replace_half(test, MIN_PKT_SIZE * 4, 0);
   1345	pkt_stream_receive_half(test);
   1346	test->ifobj_rx->validation_func = validate_rx_dropped;
   1347	testapp_validate_traffic(test);
   1348}
   1349
   1350static void testapp_stats_tx_invalid_descs(struct test_spec *test)
   1351{
   1352	test_spec_set_name(test, "STAT_TX_INVALID");
   1353	pkt_stream_replace_half(test, XSK_UMEM__INVALID_FRAME_SIZE, 0);
   1354	test->ifobj_tx->validation_func = validate_tx_invalid_descs;
   1355	testapp_validate_traffic(test);
   1356
   1357	pkt_stream_restore_default(test);
   1358}
   1359
   1360static void testapp_stats_rx_full(struct test_spec *test)
   1361{
   1362	test_spec_set_name(test, "STAT_RX_FULL");
   1363	pkt_stream_replace(test, DEFAULT_UMEM_BUFFERS + DEFAULT_UMEM_BUFFERS / 2, PKT_SIZE);
   1364	test->ifobj_rx->pkt_stream = pkt_stream_generate(test->ifobj_rx->umem,
   1365							 DEFAULT_UMEM_BUFFERS, PKT_SIZE);
   1366	if (!test->ifobj_rx->pkt_stream)
   1367		exit_with_error(ENOMEM);
   1368
   1369	test->ifobj_rx->xsk->rxqsize = DEFAULT_UMEM_BUFFERS;
   1370	test->ifobj_rx->release_rx = false;
   1371	test->ifobj_rx->validation_func = validate_rx_full;
   1372	testapp_validate_traffic(test);
   1373
   1374	pkt_stream_restore_default(test);
   1375}
   1376
   1377static void testapp_stats_fill_empty(struct test_spec *test)
   1378{
   1379	test_spec_set_name(test, "STAT_RX_FILL_EMPTY");
   1380	pkt_stream_replace(test, DEFAULT_UMEM_BUFFERS + DEFAULT_UMEM_BUFFERS / 2, PKT_SIZE);
   1381	test->ifobj_rx->pkt_stream = pkt_stream_generate(test->ifobj_rx->umem,
   1382							 DEFAULT_UMEM_BUFFERS, PKT_SIZE);
   1383	if (!test->ifobj_rx->pkt_stream)
   1384		exit_with_error(ENOMEM);
   1385
   1386	test->ifobj_rx->use_fill_ring = false;
   1387	test->ifobj_rx->validation_func = validate_fill_empty;
   1388	testapp_validate_traffic(test);
   1389
   1390	pkt_stream_restore_default(test);
   1391}
   1392
   1393/* Simple test */
   1394static bool hugepages_present(struct ifobject *ifobject)
   1395{
   1396	const size_t mmap_sz = 2 * ifobject->umem->num_frames * ifobject->umem->frame_size;
   1397	void *bufs;
   1398
   1399	bufs = mmap(NULL, mmap_sz, PROT_READ | PROT_WRITE,
   1400		    MAP_PRIVATE | MAP_ANONYMOUS | MAP_HUGETLB, -1, 0);
   1401	if (bufs == MAP_FAILED)
   1402		return false;
   1403
   1404	munmap(bufs, mmap_sz);
   1405	return true;
   1406}
   1407
   1408static bool testapp_unaligned(struct test_spec *test)
   1409{
   1410	if (!hugepages_present(test->ifobj_tx)) {
   1411		ksft_test_result_skip("No 2M huge pages present.\n");
   1412		return false;
   1413	}
   1414
   1415	test_spec_set_name(test, "UNALIGNED_MODE");
   1416	test->ifobj_tx->umem->unaligned_mode = true;
   1417	test->ifobj_rx->umem->unaligned_mode = true;
   1418	/* Let half of the packets straddle a buffer boundrary */
   1419	pkt_stream_replace_half(test, PKT_SIZE, -PKT_SIZE / 2);
   1420	test->ifobj_rx->pkt_stream->use_addr_for_fill = true;
   1421	testapp_validate_traffic(test);
   1422
   1423	pkt_stream_restore_default(test);
   1424	return true;
   1425}
   1426
   1427static void testapp_single_pkt(struct test_spec *test)
   1428{
   1429	struct pkt pkts[] = {{0x1000, PKT_SIZE, 0, true}};
   1430
   1431	pkt_stream_generate_custom(test, pkts, ARRAY_SIZE(pkts));
   1432	testapp_validate_traffic(test);
   1433	pkt_stream_restore_default(test);
   1434}
   1435
   1436static void testapp_invalid_desc(struct test_spec *test)
   1437{
   1438	struct pkt pkts[] = {
   1439		/* Zero packet address allowed */
   1440		{0, PKT_SIZE, 0, true},
   1441		/* Allowed packet */
   1442		{0x1000, PKT_SIZE, 0, true},
   1443		/* Straddling the start of umem */
   1444		{-2, PKT_SIZE, 0, false},
   1445		/* Packet too large */
   1446		{0x2000, XSK_UMEM__INVALID_FRAME_SIZE, 0, false},
   1447		/* After umem ends */
   1448		{UMEM_SIZE, PKT_SIZE, 0, false},
   1449		/* Straddle the end of umem */
   1450		{UMEM_SIZE - PKT_SIZE / 2, PKT_SIZE, 0, false},
   1451		/* Straddle a page boundrary */
   1452		{0x3000 - PKT_SIZE / 2, PKT_SIZE, 0, false},
   1453		/* Straddle a 2K boundrary */
   1454		{0x3800 - PKT_SIZE / 2, PKT_SIZE, 0, true},
   1455		/* Valid packet for synch so that something is received */
   1456		{0x4000, PKT_SIZE, 0, true}};
   1457
   1458	if (test->ifobj_tx->umem->unaligned_mode) {
   1459		/* Crossing a page boundrary allowed */
   1460		pkts[6].valid = true;
   1461	}
   1462	if (test->ifobj_tx->umem->frame_size == XSK_UMEM__DEFAULT_FRAME_SIZE / 2) {
   1463		/* Crossing a 2K frame size boundrary not allowed */
   1464		pkts[7].valid = false;
   1465	}
   1466
   1467	pkt_stream_generate_custom(test, pkts, ARRAY_SIZE(pkts));
   1468	testapp_validate_traffic(test);
   1469	pkt_stream_restore_default(test);
   1470}
   1471
   1472static void init_iface(struct ifobject *ifobj, const char *dst_mac, const char *src_mac,
   1473		       const char *dst_ip, const char *src_ip, const u16 dst_port,
   1474		       const u16 src_port, thread_func_t func_ptr)
   1475{
   1476	struct in_addr ip;
   1477
   1478	memcpy(ifobj->dst_mac, dst_mac, ETH_ALEN);
   1479	memcpy(ifobj->src_mac, src_mac, ETH_ALEN);
   1480
   1481	inet_aton(dst_ip, &ip);
   1482	ifobj->dst_ip = ip.s_addr;
   1483
   1484	inet_aton(src_ip, &ip);
   1485	ifobj->src_ip = ip.s_addr;
   1486
   1487	ifobj->dst_port = dst_port;
   1488	ifobj->src_port = src_port;
   1489
   1490	ifobj->func_ptr = func_ptr;
   1491}
   1492
   1493static void run_pkt_test(struct test_spec *test, enum test_mode mode, enum test_type type)
   1494{
   1495	switch (type) {
   1496	case TEST_TYPE_STATS_RX_DROPPED:
   1497		testapp_stats_rx_dropped(test);
   1498		break;
   1499	case TEST_TYPE_STATS_TX_INVALID_DESCS:
   1500		testapp_stats_tx_invalid_descs(test);
   1501		break;
   1502	case TEST_TYPE_STATS_RX_FULL:
   1503		testapp_stats_rx_full(test);
   1504		break;
   1505	case TEST_TYPE_STATS_FILL_EMPTY:
   1506		testapp_stats_fill_empty(test);
   1507		break;
   1508	case TEST_TYPE_TEARDOWN:
   1509		testapp_teardown(test);
   1510		break;
   1511	case TEST_TYPE_BIDI:
   1512		testapp_bidi(test);
   1513		break;
   1514	case TEST_TYPE_BPF_RES:
   1515		testapp_bpf_res(test);
   1516		break;
   1517	case TEST_TYPE_RUN_TO_COMPLETION:
   1518		test_spec_set_name(test, "RUN_TO_COMPLETION");
   1519		testapp_validate_traffic(test);
   1520		break;
   1521	case TEST_TYPE_RUN_TO_COMPLETION_SINGLE_PKT:
   1522		test_spec_set_name(test, "RUN_TO_COMPLETION_SINGLE_PKT");
   1523		testapp_single_pkt(test);
   1524		break;
   1525	case TEST_TYPE_RUN_TO_COMPLETION_2K_FRAME:
   1526		test_spec_set_name(test, "RUN_TO_COMPLETION_2K_FRAME_SIZE");
   1527		test->ifobj_tx->umem->frame_size = 2048;
   1528		test->ifobj_rx->umem->frame_size = 2048;
   1529		pkt_stream_replace(test, DEFAULT_PKT_CNT, PKT_SIZE);
   1530		testapp_validate_traffic(test);
   1531
   1532		pkt_stream_restore_default(test);
   1533		break;
   1534	case TEST_TYPE_POLL:
   1535		test->ifobj_tx->use_poll = true;
   1536		test->ifobj_rx->use_poll = true;
   1537		test_spec_set_name(test, "POLL");
   1538		testapp_validate_traffic(test);
   1539		break;
   1540	case TEST_TYPE_ALIGNED_INV_DESC:
   1541		test_spec_set_name(test, "ALIGNED_INV_DESC");
   1542		testapp_invalid_desc(test);
   1543		break;
   1544	case TEST_TYPE_ALIGNED_INV_DESC_2K_FRAME:
   1545		test_spec_set_name(test, "ALIGNED_INV_DESC_2K_FRAME_SIZE");
   1546		test->ifobj_tx->umem->frame_size = 2048;
   1547		test->ifobj_rx->umem->frame_size = 2048;
   1548		testapp_invalid_desc(test);
   1549		break;
   1550	case TEST_TYPE_UNALIGNED_INV_DESC:
   1551		if (!hugepages_present(test->ifobj_tx)) {
   1552			ksft_test_result_skip("No 2M huge pages present.\n");
   1553			return;
   1554		}
   1555		test_spec_set_name(test, "UNALIGNED_INV_DESC");
   1556		test->ifobj_tx->umem->unaligned_mode = true;
   1557		test->ifobj_rx->umem->unaligned_mode = true;
   1558		testapp_invalid_desc(test);
   1559		break;
   1560	case TEST_TYPE_UNALIGNED:
   1561		if (!testapp_unaligned(test))
   1562			return;
   1563		break;
   1564	case TEST_TYPE_HEADROOM:
   1565		testapp_headroom(test);
   1566		break;
   1567	default:
   1568		break;
   1569	}
   1570
   1571	if (!test->fail)
   1572		ksft_test_result_pass("PASS: %s %s%s\n", mode_string(test), busy_poll_string(test),
   1573				      test->name);
   1574}
   1575
   1576static struct ifobject *ifobject_create(void)
   1577{
   1578	struct ifobject *ifobj;
   1579
   1580	ifobj = calloc(1, sizeof(struct ifobject));
   1581	if (!ifobj)
   1582		return NULL;
   1583
   1584	ifobj->xsk_arr = calloc(MAX_SOCKETS, sizeof(*ifobj->xsk_arr));
   1585	if (!ifobj->xsk_arr)
   1586		goto out_xsk_arr;
   1587
   1588	ifobj->umem = calloc(1, sizeof(*ifobj->umem));
   1589	if (!ifobj->umem)
   1590		goto out_umem;
   1591
   1592	return ifobj;
   1593
   1594out_umem:
   1595	free(ifobj->xsk_arr);
   1596out_xsk_arr:
   1597	free(ifobj);
   1598	return NULL;
   1599}
   1600
   1601static void ifobject_delete(struct ifobject *ifobj)
   1602{
   1603	free(ifobj->umem);
   1604	free(ifobj->xsk_arr);
   1605	free(ifobj);
   1606}
   1607
   1608int main(int argc, char **argv)
   1609{
   1610	struct pkt_stream *pkt_stream_default;
   1611	struct ifobject *ifobj_tx, *ifobj_rx;
   1612	u32 i, j, failed_tests = 0;
   1613	struct test_spec test;
   1614
   1615	/* Use libbpf 1.0 API mode */
   1616	libbpf_set_strict_mode(LIBBPF_STRICT_ALL);
   1617
   1618	ifobj_tx = ifobject_create();
   1619	if (!ifobj_tx)
   1620		exit_with_error(ENOMEM);
   1621	ifobj_rx = ifobject_create();
   1622	if (!ifobj_rx)
   1623		exit_with_error(ENOMEM);
   1624
   1625	setlocale(LC_ALL, "");
   1626
   1627	parse_command_line(ifobj_tx, ifobj_rx, argc, argv);
   1628
   1629	if (!validate_interface(ifobj_tx) || !validate_interface(ifobj_rx)) {
   1630		usage(basename(argv[0]));
   1631		ksft_exit_xfail();
   1632	}
   1633
   1634	init_iface(ifobj_tx, MAC1, MAC2, IP1, IP2, UDP_PORT1, UDP_PORT2,
   1635		   worker_testapp_validate_tx);
   1636	init_iface(ifobj_rx, MAC2, MAC1, IP2, IP1, UDP_PORT2, UDP_PORT1,
   1637		   worker_testapp_validate_rx);
   1638
   1639	test_spec_init(&test, ifobj_tx, ifobj_rx, 0);
   1640	pkt_stream_default = pkt_stream_generate(ifobj_tx->umem, DEFAULT_PKT_CNT, PKT_SIZE);
   1641	if (!pkt_stream_default)
   1642		exit_with_error(ENOMEM);
   1643	test.pkt_stream_default = pkt_stream_default;
   1644
   1645	ksft_set_plan(TEST_MODE_MAX * TEST_TYPE_MAX);
   1646
   1647	for (i = 0; i < TEST_MODE_MAX; i++)
   1648		for (j = 0; j < TEST_TYPE_MAX; j++) {
   1649			test_spec_init(&test, ifobj_tx, ifobj_rx, i);
   1650			run_pkt_test(&test, i, j);
   1651			usleep(USLEEP_MAX);
   1652
   1653			if (test.fail)
   1654				failed_tests++;
   1655		}
   1656
   1657	pkt_stream_delete(pkt_stream_default);
   1658	ifobject_delete(ifobj_tx);
   1659	ifobject_delete(ifobj_rx);
   1660
   1661	if (failed_tests)
   1662		ksft_exit_fail();
   1663	else
   1664		ksft_exit_pass();
   1665}