mirror of
https://github.com/scylladb/scylladb.git
synced 2026-04-24 10:30:38 +00:00
652 lines
19 KiB
C++
652 lines
19 KiB
C++
/*
|
|
* Copyright (C) 2014 Cloudius Systems, Ltd.
|
|
*/
|
|
|
|
#ifdef HAVE_DPDK
|
|
|
|
#include "core/posix.hh"
|
|
#include "core/vla.hh"
|
|
#include "virtio-interface.hh"
|
|
#include "core/reactor.hh"
|
|
#include "core/stream.hh"
|
|
#include "core/circular_buffer.hh"
|
|
#include "core/align.hh"
|
|
#include "core/sstring.hh"
|
|
#include "util/function_input_iterator.hh"
|
|
#include "util/transform_iterator.hh"
|
|
#include <atomic>
|
|
#include <vector>
|
|
#include <queue>
|
|
#include "ip.hh"
|
|
#include "const.hh"
|
|
#include "dpdk.hh"
|
|
#include "proxy.hh"
|
|
|
|
#include <getopt.h>
|
|
|
|
#include <rte_config.h>
|
|
#include <rte_common.h>
|
|
#include <rte_eal.h>
|
|
#include <rte_pci.h>
|
|
#include <rte_ethdev.h>
|
|
#include <rte_cycles.h>
|
|
#include <rte_memzone.h>
|
|
|
|
using namespace net;
|
|
|
|
namespace dpdk {
|
|
|
|
/******************* Net device related constatns *****************************/
|
|
|
|
static constexpr uint16_t mbufs_per_queue = 1536;
|
|
static constexpr uint16_t mbuf_cache_size = 512;
|
|
static constexpr uint16_t mbuf_overhead =
|
|
sizeof(struct rte_mbuf) + RTE_PKTMBUF_HEADROOM;
|
|
static constexpr size_t mbuf_data_size = 2048;
|
|
|
|
// MBUF_DATA_SIZE(2K) * 32 = 64K = Max TSO/LRO size
|
|
static constexpr uint8_t max_frags = 32;
|
|
|
|
static constexpr uint16_t mbuf_size = mbuf_data_size + mbuf_overhead;
|
|
|
|
static constexpr uint16_t default_rx_ring_size = 512;
|
|
static constexpr uint16_t default_tx_ring_size = 512;
|
|
|
|
/*
|
|
* RX and TX Prefetch, Host, and Write-back threshold values should be
|
|
* carefully set for optimal performance. Consult the network
|
|
* controller's datasheet and supporting DPDK documentation for guidance
|
|
* on how these parameters should be set.
|
|
*/
|
|
/* Default configuration for rx and tx thresholds etc. */
|
|
/*
|
|
* These default values are optimized for use with the Intel(R) 82599 10 GbE
|
|
* Controller and the DPDK ixgbe PMD. Consider using other values for other
|
|
* network controllers and/or network drivers.
|
|
*/
|
|
static constexpr uint8_t default_pthresh = 36;
|
|
static constexpr uint8_t default_rx_hthresh = 8;
|
|
static constexpr uint8_t default_tx_hthresh = 0;
|
|
static constexpr uint8_t default_wthresh = 0;
|
|
|
|
static constexpr const char* pktmbuf_pool_name = "dpdk_net_pktmbuf_pool";
|
|
|
|
/*
|
|
* When doing reads from the NIC queues, use this batch size
|
|
*/
|
|
static constexpr uint8_t packet_read_size = 32;
|
|
/******************************************************************************/
|
|
|
|
// DPDK Environment Abstraction Layer object
|
|
class dpdk_eal {
|
|
public:
|
|
dpdk_eal() : _num_ports(0) {}
|
|
void init(boost::program_options::variables_map opts);
|
|
uint8_t get_port_num() const { return _num_ports; }
|
|
void get_port_hw_info(uint8_t port_idx, rte_eth_dev_info* info) {
|
|
assert(port_idx < _num_ports);
|
|
rte_eth_dev_info_get(port_idx, info);
|
|
}
|
|
private:
|
|
bool _initialized = false;
|
|
uint8_t _num_ports;
|
|
} eal;
|
|
|
|
class dpdk_distributed_device : public distributed_device {
|
|
uint8_t _port_idx;
|
|
uint8_t _num_queues;
|
|
net::hw_features _hw_features;
|
|
uint8_t _queues_ready = 0;
|
|
|
|
public:
|
|
rte_eth_dev_info _dev_info = {};
|
|
struct rte_eth_rxconf _rx_conf_default = {};
|
|
struct rte_eth_txconf _tx_conf_default = {};
|
|
|
|
private:
|
|
/**
|
|
* Initialise an individual port:
|
|
* - configure number of rx and tx rings
|
|
* - set up each rx ring, to pull from the main mbuf pool
|
|
* - set up each tx ring
|
|
* - start the port and report its status to stdout
|
|
*
|
|
* @return 0 in case of success and an appropriate error code in case of an
|
|
* error.
|
|
*/
|
|
int init_port();
|
|
|
|
/**
|
|
* Check the link status of out port in up to 9s, and print them finally.
|
|
*/
|
|
void check_port_link_status();
|
|
|
|
public:
|
|
dpdk_distributed_device(boost::program_options::variables_map opts,
|
|
uint8_t port_idx, uint8_t num_queues)
|
|
: _port_idx(port_idx)
|
|
, _num_queues(num_queues) {
|
|
_rx_conf_default.rx_thresh.pthresh = default_pthresh;
|
|
_rx_conf_default.rx_thresh.hthresh = default_rx_hthresh;
|
|
_rx_conf_default.rx_thresh.wthresh = default_wthresh;
|
|
|
|
|
|
_tx_conf_default.tx_thresh.pthresh = default_pthresh;
|
|
_tx_conf_default.tx_thresh.hthresh = default_tx_hthresh;
|
|
_tx_conf_default.tx_thresh.wthresh = default_wthresh;
|
|
|
|
_tx_conf_default.tx_free_thresh = 0; /* Use PMD default values */
|
|
_tx_conf_default.tx_rs_thresh = 0; /* Use PMD default values */
|
|
|
|
/* now initialise the port we will use */
|
|
int ret = init_port();
|
|
if (ret != 0) {
|
|
rte_exit(EXIT_FAILURE, "Cannot initialise port %u\n", _port_idx);
|
|
}
|
|
|
|
// Print the MAC
|
|
hw_address();
|
|
|
|
// Wait for a link
|
|
check_port_link_status();
|
|
|
|
printf("Created DPDK device\n");
|
|
}
|
|
ethernet_address hw_address() override {
|
|
struct ether_addr mac;
|
|
rte_eth_macaddr_get(_port_idx, &mac);
|
|
printf("%02x:%02x:%02x:%02x:%02x:%02x\n",
|
|
mac.addr_bytes[0], mac.addr_bytes[1], mac.addr_bytes[2],
|
|
mac.addr_bytes[3], mac.addr_bytes[4], mac.addr_bytes[5]);
|
|
|
|
return mac.addr_bytes;
|
|
}
|
|
net::hw_features hw_features() override {
|
|
return _hw_features;
|
|
}
|
|
virtual void init_local_queue(boost::program_options::variables_map opts) override;
|
|
uint8_t port_idx() { return _port_idx; }
|
|
};
|
|
|
|
class net_device : public net::device {
|
|
public:
|
|
explicit net_device(dpdk_distributed_device* dev, uint8_t qid);
|
|
|
|
virtual future<> send(packet p) override;
|
|
|
|
private:
|
|
|
|
bool init_mbuf_pools();
|
|
|
|
/**
|
|
* Polls for a burst of incoming packets. This function will not block and
|
|
* will immediately return after processing all available packets.
|
|
*
|
|
*/
|
|
void poll_rx_once();
|
|
|
|
/**
|
|
* Translates an rte_mbuf's into net::packet and feeds them to _rx_stream.
|
|
*
|
|
* @param bufs An array of received rte_mbuf's
|
|
* @param count Number of buffers in the bufs[]
|
|
*/
|
|
void process_packets(struct rte_mbuf **bufs, uint16_t count);
|
|
|
|
/**
|
|
* Copies one net::fragment into the cluster of rte_mbuf's.
|
|
*
|
|
* @param frag Fragment to copy (in)
|
|
* @param head Head of the cluster (out)
|
|
* @param last_seg Last segment of the cluster (out)
|
|
* @param nsegs Number of segments in the cluster (out)
|
|
*
|
|
* We return the "last_seg" to avoid traversing the cluster in order to get
|
|
* it.
|
|
*
|
|
* @return TRUE in case of success
|
|
*/
|
|
bool copy_one_frag(fragment& frag, rte_mbuf*& head, rte_mbuf*& last_seg,
|
|
unsigned& nsegs);
|
|
|
|
/**
|
|
* Allocates a single rte_mbuf and copies a given data into it.
|
|
*
|
|
* @param m New allocated rte_mbuf (out)
|
|
* @param data Data to copy from (in)
|
|
* @param l length of the data to copy (in)
|
|
*
|
|
* @return The actual number of bytes that has been copied
|
|
*/
|
|
size_t copy_one_data_buf(rte_mbuf*& m, char* data, size_t l);
|
|
|
|
private:
|
|
dpdk_distributed_device* _dev;
|
|
uint8_t _qid;
|
|
rte_mempool* _pktmbuf_pool;
|
|
reactor::poller _rx_poller;
|
|
};
|
|
|
|
int dpdk_distributed_device::init_port()
|
|
{
|
|
eal.get_port_hw_info(_port_idx, &_dev_info);
|
|
|
|
/* for port configuration all features are off by default */
|
|
rte_eth_conf port_conf = { 0 };
|
|
|
|
printf("Port %d: max_rx_queues %d max_tx_queues %d\n",
|
|
_port_idx, _dev_info.max_rx_queues, _dev_info.max_tx_queues);
|
|
|
|
if (_num_queues > _dev_info.max_rx_queues) {
|
|
_num_queues = _dev_info.max_rx_queues;
|
|
}
|
|
|
|
if (_num_queues > _dev_info.max_tx_queues) {
|
|
_num_queues = _dev_info.max_tx_queues;
|
|
}
|
|
|
|
printf("Port %d: using %d %s\n", _port_idx, _num_queues,
|
|
(_num_queues > 1) ? "queues" : "queue");
|
|
|
|
// Set RSS mode: enable RSS only if there are more than 1 Rx queues
|
|
// available.
|
|
if (_num_queues > 1) {
|
|
port_conf.rxmode.mq_mode = ETH_MQ_RX_RSS;
|
|
port_conf.rx_adv_conf.rss_conf.rss_hf = ETH_RSS_IPV4 | ETH_RSS_IPV4_UDP | ETH_RSS_IPV4_TCP;
|
|
port_conf.rx_adv_conf.rss_conf.rss_key = NULL;
|
|
} else {
|
|
port_conf.rxmode.mq_mode = ETH_MQ_RX_NONE;
|
|
}
|
|
|
|
// Set Rx VLAN stripping
|
|
if (_dev_info.rx_offload_capa & DEV_RX_OFFLOAD_VLAN_STRIP) {
|
|
port_conf.rxmode.hw_vlan_strip = 1;
|
|
}
|
|
|
|
// Set Rx checksum checking
|
|
if ( (_dev_info.rx_offload_capa & DEV_RX_OFFLOAD_IPV4_CKSUM) &&
|
|
(_dev_info.rx_offload_capa & DEV_RX_OFFLOAD_UDP_CKSUM) &&
|
|
(_dev_info.rx_offload_capa & DEV_RX_OFFLOAD_TCP_CKSUM)) {
|
|
printf("RX checksum offload supported\n");
|
|
port_conf.rxmode.hw_ip_checksum = 1;
|
|
_hw_features.rx_csum_offload = 1;
|
|
}
|
|
|
|
int retval;
|
|
|
|
printf("Port %u init ... ", _port_idx);
|
|
fflush(stdout);
|
|
|
|
/*
|
|
* Standard DPDK port initialisation - config port, then set up
|
|
* rx and tx rings.
|
|
*/
|
|
if ((retval = rte_eth_dev_configure(_port_idx, _num_queues, _num_queues,
|
|
&port_conf)) != 0) {
|
|
return retval;
|
|
}
|
|
|
|
//rte_eth_promiscuous_enable(port_num);
|
|
printf("done: \n");
|
|
|
|
return 0;
|
|
}
|
|
|
|
bool net_device::init_mbuf_pools()
|
|
{
|
|
// Allocate the same amount of buffers for Rx and Tx.
|
|
const unsigned num_mbufs = 2 * mbufs_per_queue;
|
|
sstring name = to_sstring(pktmbuf_pool_name) + to_sstring(_qid);
|
|
/* don't pass single-producer/single-consumer flags to mbuf create as it
|
|
* seems faster to use a cache instead */
|
|
printf("Creating mbuf pool '%s' [%u mbufs] ...\n", name.c_str(), num_mbufs);
|
|
|
|
//
|
|
// We currently allocate a one big mempool on the current CPU to fit all
|
|
// requested queues.
|
|
// TODO: Allocate a separate pool for each queue on the appropriate CPU.
|
|
//
|
|
_pktmbuf_pool = rte_mempool_create(name.c_str(), num_mbufs,
|
|
mbuf_size, mbuf_cache_size,
|
|
sizeof(struct rte_pktmbuf_pool_private), rte_pktmbuf_pool_init,
|
|
NULL, rte_pktmbuf_init, NULL, rte_socket_id(), 0);
|
|
|
|
return _pktmbuf_pool != NULL;
|
|
}
|
|
|
|
void dpdk_distributed_device::check_port_link_status()
|
|
{
|
|
using namespace std::literals::chrono_literals;
|
|
constexpr auto check_interval = 100ms;
|
|
const int max_check_time = 90; /* 9s (90 * 100ms) in total */
|
|
int count;
|
|
struct rte_eth_link link;
|
|
|
|
printf("\nChecking link status");
|
|
fflush(stdout);
|
|
for (count = 0; count <= max_check_time; count++) {
|
|
memset(&link, 0, sizeof(link));
|
|
rte_eth_link_get_nowait(_port_idx, &link);
|
|
|
|
if (link.link_status == 0) {
|
|
printf(".");
|
|
fflush(stdout);
|
|
std::this_thread::sleep_for(check_interval);
|
|
} else {
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* print link status */
|
|
if (link.link_status) {
|
|
printf("done\nPort %d Link Up - speed %u "
|
|
"Mbps - %s\n", _port_idx,
|
|
(unsigned)link.link_speed,
|
|
(link.link_duplex == ETH_LINK_FULL_DUPLEX) ?
|
|
("full-duplex") : ("half-duplex\n"));
|
|
} else {
|
|
printf("done\nPort %d Link Down\n", _port_idx);
|
|
}
|
|
}
|
|
|
|
|
|
net_device::net_device(dpdk_distributed_device* dev, uint8_t qid)
|
|
: _dev(dev), _qid(qid), _rx_poller([&] { poll_rx_once(); return true; })
|
|
{
|
|
if (!init_mbuf_pools()) {
|
|
rte_exit(EXIT_FAILURE, "Cannot initialize mbuf pools\n");
|
|
}
|
|
|
|
const uint16_t rx_ring_size = default_rx_ring_size;
|
|
const uint16_t tx_ring_size = default_tx_ring_size;
|
|
|
|
if (rte_eth_rx_queue_setup(_dev->port_idx(), _qid, rx_ring_size,
|
|
rte_eth_dev_socket_id(_dev->port_idx()),
|
|
&_dev->_rx_conf_default, _pktmbuf_pool) < 0) {
|
|
rte_exit(EXIT_FAILURE, "Cannot initialize rx queue\n");
|
|
}
|
|
|
|
if (rte_eth_tx_queue_setup(_dev->port_idx(), _qid, tx_ring_size,
|
|
rte_eth_dev_socket_id(_dev->port_idx()),
|
|
&_dev->_tx_conf_default) < 0) {
|
|
rte_exit(EXIT_FAILURE, "Cannot initialize tx queue\n");
|
|
}
|
|
}
|
|
|
|
void net_device::process_packets(struct rte_mbuf **bufs, uint16_t count)
|
|
{
|
|
for (uint16_t i = 0; i < count; i++) {
|
|
struct rte_mbuf *m = bufs[i];
|
|
offload_info oi;
|
|
|
|
if (!rte_pktmbuf_is_contiguous(m)) {
|
|
rte_exit(EXIT_FAILURE,
|
|
"DPDK-Rx: Have got a fragmented buffer - not supported\n");
|
|
}
|
|
|
|
fragment f{rte_pktmbuf_mtod(m, char*), rte_pktmbuf_data_len(m)};
|
|
|
|
packet p(f, make_deleter(deleter(), [m] { rte_pktmbuf_free(m); }));
|
|
|
|
// Set stipped VLAN value if available
|
|
if ((_dev->_dev_info.rx_offload_capa & DEV_RX_OFFLOAD_VLAN_STRIP) &&
|
|
(m->ol_flags & PKT_RX_VLAN_PKT)) {
|
|
|
|
oi.hw_vlan = true;
|
|
oi.vlan_tci = m->pkt.vlan_macip.f.vlan_tci;
|
|
}
|
|
|
|
if (_dev->hw_features().rx_csum_offload) {
|
|
if (m->ol_flags & (PKT_RX_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD)) {
|
|
// Packet with bad checksum, just drop it.
|
|
continue;
|
|
}
|
|
// Tell our code not to bother to calculate and check the IP and
|
|
// L4 (TCP or UDP) checksums later.
|
|
// TODO: Currently, ipv4::handle_received_packet() tests this
|
|
// oi.needs_ip_csum, while tcp<InetTraits>::received() instead
|
|
// tests _hw_features.rx_csum_offload directly (and there is
|
|
// a third variable, oi.needs_csum, which isn't used on rx, and
|
|
// doesn't even default to true). Need to clean up...
|
|
oi.needs_ip_csum = false;
|
|
}
|
|
|
|
p.set_offload_info(oi);
|
|
|
|
_dev->l2receive(std::move(p));
|
|
}
|
|
}
|
|
|
|
void net_device::poll_rx_once()
|
|
{
|
|
struct rte_mbuf *buf[packet_read_size];
|
|
|
|
/* read a port */
|
|
uint16_t rx_count = rte_eth_rx_burst(_dev->port_idx(), _qid,
|
|
buf, packet_read_size);
|
|
|
|
/* Now process the NIC packets read */
|
|
if (likely(rx_count > 0)) {
|
|
process_packets(buf, rx_count);
|
|
}
|
|
}
|
|
|
|
size_t net_device::copy_one_data_buf(rte_mbuf*& m, char* data, size_t l)
|
|
{
|
|
m = rte_pktmbuf_alloc(_pktmbuf_pool);
|
|
if (!m) {
|
|
return 0;
|
|
}
|
|
|
|
size_t len = std::min(l, mbuf_data_size);
|
|
|
|
// mbuf_put()
|
|
m->pkt.data_len += len;
|
|
m->pkt.pkt_len += len;
|
|
|
|
rte_memcpy(rte_pktmbuf_mtod(m, void*), data, len);
|
|
|
|
return len;
|
|
}
|
|
|
|
|
|
bool net_device::copy_one_frag(fragment& frag, rte_mbuf*& head,
|
|
rte_mbuf*& last_seg, unsigned& nsegs)
|
|
{
|
|
size_t len, left_to_copy = frag.size;
|
|
char* base = frag.base;
|
|
rte_mbuf* m;
|
|
|
|
if (!frag.size) {
|
|
rte_exit(EXIT_FAILURE, "DPDK Tx: Zero-size fragment");
|
|
}
|
|
|
|
// Create a HEAD of mbufs' cluster and copy the first bytes into it
|
|
len = copy_one_data_buf(head, base, left_to_copy);
|
|
if (!len) {
|
|
return false;
|
|
}
|
|
|
|
left_to_copy -= len;
|
|
base += len;
|
|
nsegs = 1;
|
|
|
|
// Copy the rest of the data into the new mbufs and chain them to the
|
|
// cluster
|
|
rte_mbuf* prev_seg = head;
|
|
while (left_to_copy) {
|
|
len = copy_one_data_buf(m, base, left_to_copy);
|
|
if (!len) {
|
|
rte_pktmbuf_free(head);
|
|
return false;
|
|
}
|
|
|
|
left_to_copy -= len;
|
|
base += len;
|
|
nsegs++;
|
|
|
|
prev_seg->pkt.next = m;
|
|
prev_seg = m;
|
|
}
|
|
|
|
// Return the last mbuf in the cluster
|
|
last_seg = prev_seg;
|
|
|
|
return true;
|
|
}
|
|
|
|
future<> net_device::send(packet p)
|
|
{
|
|
// sanity
|
|
if (!p.len()) {
|
|
return make_ready_future<>();
|
|
}
|
|
|
|
// Too fragmented - linearize
|
|
if (p.nr_frags() > max_frags) {
|
|
p.linearize();
|
|
}
|
|
|
|
/* TODO: configure the offload features here if any */
|
|
|
|
//
|
|
// We will copy the data for now and will implement a zero-copy in the
|
|
// future.
|
|
|
|
rte_mbuf *head = NULL, *last_seg = NULL;
|
|
unsigned total_nsegs = 0, nsegs = 0;
|
|
|
|
// Create a HEAD of the fragmented packet
|
|
if (!copy_one_frag(p.frag(0), head, last_seg, nsegs)) {
|
|
// Drop if we failed to allocate new mbuf
|
|
return make_ready_future<>();
|
|
}
|
|
|
|
total_nsegs += nsegs;
|
|
|
|
for (unsigned i = 1; i < p.nr_frags(); i++) {
|
|
|
|
rte_mbuf *h = NULL, *new_last_seg = NULL;
|
|
if (!copy_one_frag(p.frag(i), h, new_last_seg, nsegs)) {
|
|
rte_pktmbuf_free(head);
|
|
return make_ready_future<>();
|
|
}
|
|
|
|
total_nsegs += nsegs;
|
|
|
|
// Attach a new buffers' chain to the packet chain
|
|
last_seg->pkt.next = h;
|
|
last_seg = new_last_seg;
|
|
}
|
|
|
|
// Update the HEAD buffer with the packet info
|
|
head->pkt.pkt_len = p.len();
|
|
head->pkt.nb_segs = total_nsegs;
|
|
|
|
//
|
|
// Currently we will spin till completion.
|
|
// TODO: implement a poller + xmit queue
|
|
//
|
|
while(rte_eth_tx_burst(_dev->port_idx(), _qid, &head, 1) < 1);
|
|
|
|
return make_ready_future<>();
|
|
}
|
|
|
|
void dpdk_eal::init(boost::program_options::variables_map opts)
|
|
{
|
|
if (_initialized) {
|
|
return;
|
|
}
|
|
|
|
// TODO: Inherit these from the app parameters - "opts"
|
|
const char *argv[] = {"dpdk_args", "-c", "0x1", "-n", "1"};
|
|
int argc = sizeof(argv) / sizeof(char*);
|
|
|
|
/* initialise the EAL for all */
|
|
int ret = rte_eal_init(argc, const_cast<char**>(argv));
|
|
if (ret < 0) {
|
|
rte_exit(EXIT_FAILURE, "Cannot init EAL\n");
|
|
}
|
|
|
|
/* probe to determine the NIC devices available */
|
|
if (rte_eal_pci_probe() < 0) {
|
|
rte_exit(EXIT_FAILURE, "Cannot probe PCI\n");
|
|
}
|
|
|
|
_num_ports = rte_eth_dev_count();
|
|
assert(_num_ports <= RTE_MAX_ETHPORTS);
|
|
if (_num_ports == 0) {
|
|
rte_exit(EXIT_FAILURE, "No Ethernet ports - bye\n");
|
|
} else {
|
|
printf("ports number: %d\n", _num_ports);
|
|
}
|
|
|
|
_initialized = true;
|
|
}
|
|
|
|
void dpdk_distributed_device::init_local_queue(boost::program_options::variables_map opts) {
|
|
std::unique_ptr<device> ptr;
|
|
|
|
if (engine.cpu_id() < smp::count) {
|
|
ptr = std::make_unique<net_device>(this, engine.cpu_id());
|
|
|
|
// TODO: device reset of the cpus between queues
|
|
for (unsigned i = _num_queues; i < smp::count; i++) {
|
|
if (i != engine.cpu_id()) {
|
|
ptr->add_proxy(i);
|
|
}
|
|
}
|
|
smp::submit_to(0, [this] () mutable {
|
|
if (++_queues_ready == _num_queues) {
|
|
if (rte_eth_dev_start(_port_idx) < 0) {
|
|
rte_exit(EXIT_FAILURE, "Cannot start port %d\n", _port_idx);
|
|
}
|
|
}
|
|
});
|
|
} else {
|
|
ptr = create_proxy_net_device(0, this);
|
|
}
|
|
set_local_queue(std::move(ptr));
|
|
}
|
|
} // namespace dpdk
|
|
|
|
/******************************** Interface functions *************************/
|
|
|
|
std::unique_ptr<net::distributed_device> create_dpdk_net_device(
|
|
boost::program_options::variables_map opts,
|
|
uint8_t port_idx,
|
|
uint8_t num_queues)
|
|
{
|
|
if (engine.cpu_id() == 0) {
|
|
// Init a DPDK EAL
|
|
dpdk::eal.init(opts);
|
|
|
|
return std::make_unique<dpdk::dpdk_distributed_device>(opts, port_idx, num_queues);
|
|
} else {
|
|
return nullptr;
|
|
}
|
|
}
|
|
|
|
boost::program_options::options_description
|
|
get_dpdk_net_options_description()
|
|
{
|
|
boost::program_options::options_description opts(
|
|
"DPDK net options");
|
|
#if 0
|
|
opts.add_options()
|
|
("csum-offload",
|
|
boost::program_options::value<std::string>()->default_value("on"),
|
|
"Enable checksum offload feature (on / off)")
|
|
("tso",
|
|
boost::program_options::value<std::string>()->default_value("on"),
|
|
"Enable TCP segment offload feature (on / off)")
|
|
("ufo",
|
|
boost::program_options::value<std::string>()->default_value("on"),
|
|
"Enable UDP fragmentation offload feature (on / off)")
|
|
;
|
|
#endif
|
|
return opts;
|
|
}
|
|
|
|
#endif // HAVE_DPDK
|