#include <stdint.h>
#include <stdlib.h>
#include <inttypes.h>
#include <unistd.h>
#include <signal.h>
#include <getopt.h>
#define RX_RING_SIZE 1024
#define TX_RING_SIZE 1024
#define NUM_MBUFS ((64*1024)-1)
#define MBUF_CACHE_SIZE 128
#define BURST_SIZE 64
#define SCHED_RX_RING_SZ 8192
#define SCHED_TX_RING_SZ 65536
#define BURST_SIZE_TX 32
#define RTE_LOGTYPE_DISTRAPP RTE_LOGTYPE_USER1
#define ANSI_COLOR_RED "\x1b[31m"
#define ANSI_COLOR_RESET "\x1b[0m"
static uint32_t enabled_port_mask;
volatile uint8_t quit_signal;
volatile uint8_t quit_signal_rx;
volatile uint8_t quit_signal_dist;
volatile uint8_t quit_signal_work;
unsigned int power_lib_initialised;
bool enable_lcore_rx_distributor;
unsigned int num_workers;
static volatile struct app_stats {
alignas(RTE_CACHE_LINE_SIZE) struct {
uint64_t rx_pkts;
uint64_t returned_pkts;
uint64_t enqueued_pkts;
uint64_t enqdrop_pkts;
} rx;
alignas(RTE_CACHE_LINE_SIZE) int pad1;
alignas(RTE_CACHE_LINE_SIZE) struct {
uint64_t in_pkts;
uint64_t ret_pkts;
uint64_t sent_pkts;
uint64_t enqdrop_pkts;
} dist;
alignas(RTE_CACHE_LINE_SIZE) int pad2;
alignas(RTE_CACHE_LINE_SIZE) struct {
uint64_t dequeue_pkts;
uint64_t tx_pkts;
uint64_t enqdrop_pkts;
} tx;
alignas(RTE_CACHE_LINE_SIZE) int pad3;
alignas(RTE_CACHE_LINE_SIZE) uint64_t worker_pkts[64];
alignas(RTE_CACHE_LINE_SIZE) int pad4;
alignas(RTE_CACHE_LINE_SIZE) uint64_t worker_bursts[64][8];
alignas(RTE_CACHE_LINE_SIZE) int pad5;
alignas(RTE_CACHE_LINE_SIZE) uint64_t port_rx_pkts[64];
alignas(RTE_CACHE_LINE_SIZE) uint64_t port_tx_pkts[64];
} app_stats;
struct app_stats prev_app_stats;
},
.txmode = {
},
.rx_adv_conf = {
.rss_conf = {
.rss_hf = RTE_ETH_RSS_IP | RTE_ETH_RSS_UDP |
RTE_ETH_RSS_TCP | RTE_ETH_RSS_SCTP,
}
},
};
struct output_buffer {
unsigned count;
};
static void print_stats(void);
static inline int
{
const uint16_t rxRings = 1, txRings = 1;
int retval;
uint16_t q;
uint16_t nb_rxd = RX_RING_SIZE;
uint16_t nb_txd = TX_RING_SIZE;
return -1;
if (retval != 0) {
printf("Error during getting device (port %u) info: %s\n",
port, strerror(-retval));
return retval;
}
printf("Port %u modified RSS hash function based on hardware support,"
"requested:%#"PRIx64" configured:%#"PRIx64"\n",
port,
}
if (retval != 0)
return retval;
if (retval != 0)
return retval;
for (q = 0; q < rxRings; q++) {
NULL, mbuf_pool);
if (retval < 0)
return retval;
}
for (q = 0; q < txRings; q++) {
&txconf);
if (retval < 0)
return retval;
}
if (retval < 0)
return retval;
do {
if (retval < 0) {
printf("Failed link get (port %u): %s\n",
return retval;
break;
printf("Waiting for Link up on port %"PRIu16"\n", port);
sleep(1);
printf("Link down on port %"PRIu16"\n", port);
return 0;
}
struct rte_ether_addr addr;
if (retval < 0) {
printf("Failed to get MAC address (port %u): %s\n",
return retval;
}
printf("Port %u MAC: %02"PRIx8" %02"PRIx8" %02"PRIx8
" %02"PRIx8" %02"PRIx8" %02"PRIx8"\n",
if (retval != 0)
return retval;
return 0;
}
struct lcore_params {
unsigned worker_id;
struct rte_distributor *d;
};
static int
lcore_rx(struct lcore_params *p)
{
uint16_t port;
if ((enabled_port_mask & (1 << port)) == 0)
continue;
printf("WARNING, port %u is on remote NUMA node to "
"RX thread.\n\tPerformance will not "
"be optimal.\n", port);
}
port = 0;
while (!quit_signal_rx) {
if ((enabled_port_mask & (1 << port)) == 0) {
if (++port == nb_ports)
port = 0;
continue;
}
BURST_SIZE);
if (++port == nb_ports)
port = 0;
continue;
}
app_stats.rx.rx_pkts += nb_rx;
struct rte_ring *out_ring = p->rx_dist_ring;
(void *)bufs, nb_rx, NULL);
app_stats.rx.enqueued_pkts += sent;
app_stats.rx.enqdrop_pkts += nb_rx - sent;
"%s:Packet loss due to full ring\n", __func__);
while (sent < nb_rx)
}
if (++port == nb_ports)
port = 0;
}
if (power_lib_initialised)
quit_signal_dist = 1;
return 0;
}
static int
lcore_rx_and_distributor(struct lcore_params *p)
{
struct rte_distributor *d = p->d;
uint16_t port;
if ((enabled_port_mask & (1 << port)) == 0)
continue;
printf("WARNING, port %u is on remote NUMA node to "
"RX thread.\n\tPerformance will not "
"be optimal.\n", port);
}
printf(
"\nCore %u doing packet RX and Distributor.\n",
rte_lcore_id());
port = 0;
while (!quit_signal_rx) {
if ((enabled_port_mask & (1 << port)) == 0) {
if (++port == nb_ports)
port = 0;
continue;
}
BURST_SIZE);
if (++port == nb_ports)
port = 0;
continue;
}
app_stats.rx.rx_pkts += nb_rx;
bufs, BURST_SIZE*2);
app_stats.rx.returned_pkts += nb_ret;
if (++port == nb_ports)
port = 0;
continue;
}
struct rte_ring *tx_ring = p->dist_tx_ring;
(void *)bufs, nb_ret, NULL);
app_stats.rx.enqueued_pkts += sent;
app_stats.rx.enqdrop_pkts += nb_ret - sent;
"%s:Packet loss due to full ring\n", __func__);
while (sent < nb_ret)
}
if (++port == nb_ports)
port = 0;
}
if (power_lib_initialised)
quit_signal = 1;
quit_signal_work = 1;
return 0;
}
static inline void
flush_one_port(struct output_buffer *outbuf, uint8_t outp)
{
outbuf->mbufs, outbuf->count);
app_stats.tx.tx_pkts += outbuf->count;
app_stats.tx.enqdrop_pkts += outbuf->count - nb_tx;
do {
} while (++nb_tx < outbuf->count);
}
outbuf->count = 0;
}
static inline void
flush_all_ports(struct output_buffer *tx_buffers)
{
uint16_t outp;
if ((enabled_port_mask & (1 << outp)) == 0)
continue;
if (tx_buffers[outp].count == 0)
continue;
flush_one_port(&tx_buffers[outp], outp);
}
}
static int
lcore_distributor(struct lcore_params *p)
{
struct rte_ring *in_r = p->rx_dist_ring;
struct rte_ring *out_r = p->dist_tx_ring;
struct rte_distributor *d = p->d;
printf(
"\nCore %u acting as distributor core.\n",
rte_lcore_id());
while (!quit_signal_dist) {
(void *)bufs, BURST_SIZE*1, NULL);
if (nb_rx) {
app_stats.dist.in_pkts += nb_rx;
const uint16_t nb_ret =
bufs, BURST_SIZE*2);
continue;
app_stats.dist.ret_pkts += nb_ret;
(void *)bufs, nb_ret, NULL);
app_stats.dist.sent_pkts += sent;
app_stats.dist.enqdrop_pkts += nb_ret - sent;
"%s:Packet loss due to full out ring\n",
__func__);
while (sent < nb_ret)
}
}
}
if (power_lib_initialised)
printf(
"\nCore %u exiting distributor task.\n",
rte_lcore_id());
quit_signal = 1;
quit_signal_work = 1;
return 0;
}
static int
{
static struct output_buffer tx_buffers[RTE_MAX_ETHPORTS];
uint16_t port;
if ((enabled_port_mask & (1 << port)) == 0)
continue;
printf("WARNING, port %u is on remote NUMA node to "
"TX thread.\n\tPerformance will not "
"be optimal.\n", port);
}
while (!quit_signal) {
if ((enabled_port_mask & (1 << port)) == 0)
continue;
(void *)bufs, BURST_SIZE_TX, NULL);
app_stats.tx.dequeue_pkts += nb_rx;
flush_all_ports(tx_buffers);
continue;
}
uint16_t i;
for (i = 0; i < nb_rx; i++) {
struct output_buffer *outbuf;
uint8_t outp;
outp = bufs[i]->port;
if ((enabled_port_mask & (1 << outp)) == 0)
continue;
outbuf = &tx_buffers[outp];
outbuf->mbufs[outbuf->count++] = bufs[i];
if (outbuf->count == BURST_SIZE_TX)
flush_one_port(outbuf, outp);
}
}
}
if (power_lib_initialised)
return 0;
}
static void
int_handler(int sig_num)
{
printf("Exiting on signal %d\n", sig_num);
quit_signal_rx = 1;
}
static void
print_stats(void)
{
unsigned int i, j;
app_stats.port_rx_pkts[i] = eth_stats.
ipackets;
app_stats.port_tx_pkts[i] = eth_stats.
opackets;
}
printf("\n\nRX Thread:\n");
printf("Port %u Pktsin : %5.2f\n", i,
(app_stats.port_rx_pkts[i] -
prev_app_stats.port_rx_pkts[i])/1000000.0);
prev_app_stats.port_rx_pkts[i] = app_stats.port_rx_pkts[i];
}
printf(" - Received: %5.2f\n",
(app_stats.rx.rx_pkts -
prev_app_stats.rx.rx_pkts)/1000000.0);
printf(" - Returned: %5.2f\n",
(app_stats.rx.returned_pkts -
prev_app_stats.rx.returned_pkts)/1000000.0);
printf(" - Enqueued: %5.2f\n",
(app_stats.rx.enqueued_pkts -
prev_app_stats.rx.enqueued_pkts)/1000000.0);
printf(" - Dropped: %s%5.2f%s\n", ANSI_COLOR_RED,
(app_stats.rx.enqdrop_pkts -
prev_app_stats.rx.enqdrop_pkts)/1000000.0,
ANSI_COLOR_RESET);
if (!enable_lcore_rx_distributor) {
printf("Distributor thread:\n");
printf(" - In: %5.2f\n",
(app_stats.dist.in_pkts -
prev_app_stats.dist.in_pkts)/1000000.0);
printf(" - Returned: %5.2f\n",
(app_stats.dist.ret_pkts -
prev_app_stats.dist.ret_pkts)/1000000.0);
printf(" - Sent: %5.2f\n",
(app_stats.dist.sent_pkts -
prev_app_stats.dist.sent_pkts)/1000000.0);
printf(" - Dropped %s%5.2f%s\n", ANSI_COLOR_RED,
(app_stats.dist.enqdrop_pkts -
prev_app_stats.dist.enqdrop_pkts)/1000000.0,
ANSI_COLOR_RESET);
}
printf("TX thread:\n");
printf(" - Dequeued: %5.2f\n",
(app_stats.tx.dequeue_pkts -
prev_app_stats.tx.dequeue_pkts)/1000000.0);
printf("Port %u Pktsout: %5.2f\n",
i, (app_stats.port_tx_pkts[i] -
prev_app_stats.port_tx_pkts[i])/1000000.0);
prev_app_stats.port_tx_pkts[i] = app_stats.port_tx_pkts[i];
}
printf(" - Transmitted: %5.2f\n",
(app_stats.tx.tx_pkts -
prev_app_stats.tx.tx_pkts)/1000000.0);
printf(" - Dropped: %s%5.2f%s\n", ANSI_COLOR_RED,
(app_stats.tx.enqdrop_pkts -
prev_app_stats.tx.enqdrop_pkts)/1000000.0,
ANSI_COLOR_RESET);
prev_app_stats.rx.rx_pkts = app_stats.rx.rx_pkts;
prev_app_stats.rx.returned_pkts = app_stats.rx.returned_pkts;
prev_app_stats.rx.enqueued_pkts = app_stats.rx.enqueued_pkts;
prev_app_stats.rx.enqdrop_pkts = app_stats.rx.enqdrop_pkts;
prev_app_stats.dist.in_pkts = app_stats.dist.in_pkts;
prev_app_stats.dist.ret_pkts = app_stats.dist.ret_pkts;
prev_app_stats.dist.sent_pkts = app_stats.dist.sent_pkts;
prev_app_stats.dist.enqdrop_pkts = app_stats.dist.enqdrop_pkts;
prev_app_stats.tx.dequeue_pkts = app_stats.tx.dequeue_pkts;
prev_app_stats.tx.tx_pkts = app_stats.tx.tx_pkts;
prev_app_stats.tx.enqdrop_pkts = app_stats.tx.enqdrop_pkts;
for (i = 0; i < num_workers; i++) {
printf("Worker %02u Pkts: %5.2f. Bursts(1-8): ", i,
(app_stats.worker_pkts[i] -
prev_app_stats.worker_pkts[i])/1000000.0);
for (j = 0; j < 8; j++) {
printf("%"PRIu64" ", app_stats.worker_bursts[i][j]);
app_stats.worker_bursts[i][j] = 0;
}
printf("\n");
prev_app_stats.worker_pkts[i] = app_stats.worker_pkts[i];
}
}
static int
lcore_worker(struct lcore_params *p)
{
struct rte_distributor *d = p->d;
const unsigned id = p->worker_id;
unsigned int num = 0;
unsigned int i;
alignas(RTE_CACHE_LINE_SIZE)
struct rte_mbuf *buf[8];
for (i = 0; i < 8; i++)
buf[i] = NULL;
app_stats.worker_pkts[p->worker_id] = 1;
printf(
"\nCore %u acting as worker core.\n",
rte_lcore_id());
while (!quit_signal_work) {
for (i = 0; i < num; i++) {
uint64_t t = rte_rdtsc()+100;
while (rte_rdtsc() < t)
buf[i]->port ^= xor_val;
}
app_stats.worker_pkts[p->worker_id] += num;
if (num > 0)
app_stats.worker_bursts[p->worker_id][num-1]++;
}
if (power_lib_initialised)
return 0;
}
static int
init_power_library(void)
{
int ret = 0, lcore_id;
if (ret) {
fprintf(stderr,
"Library initialization failed on core %u\n",
lcore_id);
return ret;
}
}
return ret;
}
static void
print_usage(const char *prgname)
{
printf("%s [EAL options] -- -p PORTMASK [-c]\n"
" -p PORTMASK: hexadecimal bitmask of ports to configure\n"
" -c: Combines the RX core with the distribution core\n",
prgname);
}
static int
parse_portmask(const char *portmask)
{
char *end = NULL;
unsigned long pm;
pm = strtoul(portmask, &end, 16);
if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0'))
return 0;
return pm;
}
static int
parse_args(int argc, char **argv)
{
int opt;
char **argvopt;
int option_index;
char *prgname = argv[0];
static struct option lgopts[] = {
{NULL, 0, 0, 0}
};
argvopt = argv;
enable_lcore_rx_distributor = false;
while ((opt = getopt_long(argc, argvopt, "cp:",
lgopts, &option_index)) != EOF) {
switch (opt) {
case 'p':
enabled_port_mask = parse_portmask(optarg);
if (enabled_port_mask == 0) {
printf("invalid portmask\n");
print_usage(prgname);
return -1;
}
break;
case 'c':
enable_lcore_rx_distributor = true;
break;
default:
print_usage(prgname);
return -1;
}
}
if (optind <= 1) {
print_usage(prgname);
return -1;
}
argv[optind-1] = prgname;
optind = 1;
return 0;
}
int
main(int argc, char *argv[])
{
struct rte_distributor *d;
unsigned int lcore_id, worker_id = 0;
int distr_core_id = -1, rx_core_id = -1, tx_core_id = -1;
unsigned nb_ports;
unsigned int min_cores;
uint16_t portid;
uint16_t nb_ports_available;
uint64_t t, freq;
signal(SIGINT, int_handler);
if (ret < 0)
rte_exit(EXIT_FAILURE,
"Error with EAL initialization\n");
argc -= ret;
argv += ret;
ret = parse_args(argc, argv);
if (ret < 0)
rte_exit(EXIT_FAILURE,
"Invalid distributor parameters\n");
if (enable_lcore_rx_distributor) {
min_cores = 4;
} else {
min_cores = 5;
}
rte_exit(EXIT_FAILURE,
"Error, This application needs at " "least 4 logical cores to run:\n"
"1 lcore for stats (can be core 0)\n"
"1 or 2 lcore for packet RX and distribution\n"
"1 lcore for packet TX\n"
"and at least 1 lcore for worker threads\n");
if (init_power_library() == 0)
power_lib_initialised = 1;
if (nb_ports == 0)
rte_exit(EXIT_FAILURE,
"Error: no ethernet ports detected\n");
if (nb_ports != 1 && (nb_ports & 1))
rte_exit(EXIT_FAILURE,
"Error: number of ports must be even, except " "when using a single port\n");
NUM_MBUFS * nb_ports, MBUF_CACHE_SIZE, 0,
if (mbuf_pool == NULL)
rte_exit(EXIT_FAILURE,
"Cannot create mbuf pool\n");
nb_ports_available = nb_ports;
if ((enabled_port_mask & (1 << portid)) == 0) {
printf("\nSkipping disabled port %d\n", portid);
nb_ports_available--;
continue;
}
printf("Initializing port %u... done\n", portid);
if (port_init(portid, mbuf_pool) != 0)
rte_exit(EXIT_FAILURE,
"Cannot initialize port %u\n",
portid);
}
if (!nb_ports_available) {
"All available ports are disabled. Please set portmask.\n");
}
num_workers,
RTE_DIST_ALG_BURST);
if (d == NULL)
rte_exit(EXIT_FAILURE,
"Cannot create distributor\n");
if (dist_tx_ring == NULL)
rte_exit(EXIT_FAILURE,
"Cannot create output ring\n");
if (rx_dist_ring == NULL)
rte_exit(EXIT_FAILURE,
"Cannot create output ring\n");
if (power_lib_initialised) {
rte_power_get_capabilities(lcore_id, &lcore_cap);
continue;
if (distr_core_id < 0 && !enable_lcore_rx_distributor) {
distr_core_id = lcore_id;
printf("Distributor on priority core %d\n",
lcore_id);
continue;
}
if (rx_core_id < 0) {
rx_core_id = lcore_id;
printf("Rx on priority core %d\n",
lcore_id);
continue;
}
if (tx_core_id < 0) {
tx_core_id = lcore_id;
printf("Tx on priority core %d\n",
lcore_id);
continue;
}
}
}
if (lcore_id == (unsigned int)distr_core_id ||
lcore_id == (unsigned int)rx_core_id ||
lcore_id == (unsigned int)tx_core_id)
continue;
if (distr_core_id < 0 && !enable_lcore_rx_distributor) {
distr_core_id = lcore_id;
printf("Distributor on core %d\n", lcore_id);
continue;
}
if (rx_core_id < 0) {
rx_core_id = lcore_id;
printf("Rx on core %d\n", lcore_id);
continue;
}
if (tx_core_id < 0) {
tx_core_id = lcore_id;
printf("Tx on core %d\n", lcore_id);
continue;
}
}
if (enable_lcore_rx_distributor)
printf(" tx id %d, rx id %d\n",
tx_core_id,
rx_core_id);
else
printf(" tx id %d, dist id %d, rx id %d\n",
tx_core_id,
distr_core_id,
rx_core_id);
if (lcore_id == (unsigned int)distr_core_id ||
lcore_id == (unsigned int)rx_core_id ||
lcore_id == (unsigned int)tx_core_id)
continue;
printf("Starting thread %d as worker, lcore_id %d\n",
worker_id, lcore_id);
struct lcore_params *p =
if (!p)
*p = (struct lcore_params){worker_id++, d, rx_dist_ring,
dist_tx_ring, mbuf_pool};
p, lcore_id);
}
dist_tx_ring, tx_core_id);
struct lcore_params *pd = NULL;
if (!enable_lcore_rx_distributor) {
if (!pd)
*pd = (struct lcore_params){worker_id++, d,
rx_dist_ring, dist_tx_ring, mbuf_pool};
pd, distr_core_id);
}
struct lcore_params *pr =
if (!pr)
*pr = (struct lcore_params){worker_id++, d, rx_dist_ring,
dist_tx_ring, mbuf_pool};
if (enable_lcore_rx_distributor)
pr, rx_core_id);
else
pr, rx_core_id);
t = rte_rdtsc() + freq;
while (!quit_signal) {
if (t < rte_rdtsc()) {
print_stats();
t = rte_rdtsc() + freq;
}
usleep(1000);
}
return -1;
}
print_stats();
return 0;
}