aboutsummaryrefslogtreecommitdiffstats
path: root/host/tests/packet_handler_benchmark.cpp
diff options
context:
space:
mode:
authorCiro Nishiguchi <ciro.nishiguchi@ni.com>2019-08-28 12:30:26 -0500
committerMartin Braun <martin.braun@ettus.com>2019-11-26 11:49:44 -0800
commit745fbf19bc22e98cee42acac04cda28c5f9bcbd4 (patch)
treeef419c637dc8f20064053051d4ae639b414fc262 /host/tests/packet_handler_benchmark.cpp
parent2d40c33b15ee91fdf5f0f7ca6987fe7dbf18205a (diff)
downloaduhd-745fbf19bc22e98cee42acac04cda28c5f9bcbd4.tar.gz
uhd-745fbf19bc22e98cee42acac04cda28c5f9bcbd4.tar.bz2
uhd-745fbf19bc22e98cee42acac04cda28c5f9bcbd4.zip
tests: Make packet handler benchmark include flow control
Add mock flow control to the packet handler benchmark to make it a better comparison to streamer_benchmark.
Diffstat (limited to 'host/tests/packet_handler_benchmark.cpp')
-rw-r--r--host/tests/packet_handler_benchmark.cpp446
1 files changed, 222 insertions, 224 deletions
diff --git a/host/tests/packet_handler_benchmark.cpp b/host/tests/packet_handler_benchmark.cpp
index ec7eff517..6d4849831 100644
--- a/host/tests/packet_handler_benchmark.cpp
+++ b/host/tests/packet_handler_benchmark.cpp
@@ -18,6 +18,7 @@
#include <uhd/convert.hpp>
#include <uhd/transport/chdr.hpp>
#include <uhd/transport/zero_copy.hpp>
+#include <uhd/transport/zero_copy_flow_ctrl.hpp>
#include <uhd/types/sid.hpp>
#include <uhd/utils/safe_main.hpp>
#include <uhd/utils/thread.hpp>
@@ -27,34 +28,155 @@
namespace po = boost::program_options;
using namespace uhd::transport;
-using namespace uhd::usrp;
-void benchmark_recv_packet_handler(const size_t spp, const std::string& format)
+static constexpr size_t MAX_HEADER_LEN = 16;
+static constexpr size_t LINE_SIZE = 8;
+
+//
+// Old device3 rx flow control cache and procedures
+//
+struct rx_fc_cache_t
{
- const size_t bpi = uhd::convert::get_bytes_per_item(format);
- const size_t frame_size = bpi * spp + DEVICE3_RX_MAX_HDR_LEN;
+ //! Flow control interval in bytes
+ size_t interval = 0;
+ //! Byte count at last flow control packet
+ uint32_t last_byte_count = 0;
+ //! This will wrap around, but that's OK, because math.
+ uint32_t total_bytes_consumed = 0;
+ //! This will wrap around, but that's OK, because math.
+ uint32_t total_packets_consumed = 0;
+ //! Sequence number of next flow control packet
+ uint64_t seq_num = 0;
+ uhd::sid_t sid;
+ uhd::transport::zero_copy_if::sptr xport;
+ std::function<uint32_t(uint32_t)> to_host;
+ std::function<uint32_t(uint32_t)> from_host;
+ std::function<void(
+ const uint32_t* packet_buff, uhd::transport::vrt::if_packet_info_t&)>
+ unpack;
+ std::function<void(uint32_t* packet_buff, uhd::transport::vrt::if_packet_info_t&)>
+ pack;
+};
+
+inline bool rx_flow_ctrl(
+ boost::shared_ptr<rx_fc_cache_t> fc_cache, uhd::transport::managed_buffer::sptr buff)
+{
+ // If the caller supplied a buffer
+ if (buff) {
+ // Unpack the header
+ uhd::transport::vrt::if_packet_info_t packet_info;
+ packet_info.num_packet_words32 = buff->size() / sizeof(uint32_t);
+ const uint32_t* pkt = buff->cast<const uint32_t*>();
+ try {
+ fc_cache->unpack(pkt, packet_info);
+ } catch (const std::exception& ex) {
+ // Log and ignore
+ UHD_LOGGER_ERROR("RX FLOW CTRL")
+ << "Error unpacking packet: " << ex.what() << std::endl;
+ return true;
+ }
- mock_zero_copy::sptr xport(new mock_zero_copy(
- vrt::if_packet_info_t::LINK_TYPE_CHDR, frame_size, frame_size));
+ // Update counters assuming the buffer is a consumed packet
+ if (not packet_info.error) {
+ const size_t bytes = 4 * (packet_info.num_header_words32 + packet_info.num_payload_words32);
+ fc_cache->total_bytes_consumed += bytes;
+ fc_cache->total_packets_consumed++;
+ }
+ }
- xport->set_reuse_recv_memory(true);
+ // Just return if there is no need to send a flow control packet
+ if (fc_cache->total_bytes_consumed - fc_cache->last_byte_count < fc_cache->interval) {
+ return true;
+ }
- sph::recv_packet_streamer streamer(spp);
- streamer.set_vrt_unpacker(&vrt::chdr::if_hdr_unpack_be);
- streamer.set_tick_rate(1.0);
- streamer.set_samp_rate(1.0);
+ // Time to send a flow control packet. For the benchmark, we should never
+ // reach this point.
+ UHD_THROW_INVALID_CODE_PATH();
+}
- uhd::convert::id_type id;
- id.output_format = format;
- id.num_inputs = 1;
- id.input_format = "sc16_item32_be";
- id.num_outputs = 1;
- streamer.set_converter(id);
+inline void handle_rx_flowctrl_ack(
+ boost::shared_ptr<rx_fc_cache_t> /*fc_cache*/, const uint32_t* /*payload*/)
+{
+ // For the benchmark, we should never reach this
+ UHD_THROW_INVALID_CODE_PATH();
+}
- streamer.set_xport_chan_get_buff(0,
- [xport](double timeout) { return xport->get_recv_buff(timeout); },
- false // flush
- );
+//
+// Old device3 tx flow control cache and procedures
+//
+struct tx_fc_cache_t
+{
+ uint32_t last_byte_ack = 0;
+ uint32_t last_seq_ack = 0;
+ uint32_t byte_count = 0;
+ uint32_t pkt_count = 0;
+ uint32_t window_size = 0;
+ uint32_t fc_ack_seqnum = 0;
+ bool fc_received = false;
+ std::function<uint32_t(uint32_t)> to_host;
+ std::function<uint32_t(uint32_t)> from_host;
+ std::function<void(
+ const uint32_t* packet_buff, uhd::transport::vrt::if_packet_info_t&)>
+ unpack;
+ std::function<void(uint32_t* packet_buff, uhd::transport::vrt::if_packet_info_t&)>
+ pack;
+};
+
+inline bool tx_flow_ctrl(boost::shared_ptr<tx_fc_cache_t> fc_cache,
+ uhd::transport::zero_copy_if::sptr /*xport*/,
+ uhd::transport::managed_buffer::sptr buff)
+{
+ while (true) {
+ // If there is space
+ if (fc_cache->window_size - (fc_cache->byte_count - fc_cache->last_byte_ack)
+ >= buff->size()) {
+ // All is good - packet will be sent
+ fc_cache->byte_count += buff->size();
+ // Round up to nearest word
+ if (fc_cache->byte_count % LINE_SIZE) {
+ fc_cache->byte_count += LINE_SIZE - (fc_cache->byte_count % LINE_SIZE);
+ }
+ fc_cache->pkt_count++;
+
+ // Just zero out the counts here to avoid actually tring to read flow
+ // control packets in the benchmark
+ fc_cache->byte_count = 0;
+ fc_cache->last_byte_ack = 0;
+ fc_cache->pkt_count = 0;
+
+ return true;
+ }
+
+ // Look for a flow control message to update the space available in the
+ // buffer. For the benchmark, we should never reach this point.
+ UHD_THROW_INVALID_CODE_PATH();
+ }
+ return false;
+}
+
+inline void tx_flow_ctrl_ack(boost::shared_ptr<tx_fc_cache_t> fc_cache,
+ uhd::transport::zero_copy_if::sptr /*send_xport*/,
+ uhd::sid_t /*send_sid*/)
+{
+ if (not fc_cache->fc_received) {
+ return;
+ }
+
+ // Time to send a flow control ACK packet. For the benchmark, we should
+ // never reach this point.
+ UHD_THROW_INVALID_CODE_PATH();
+}
+
+//
+// Benchmark functions
+//
+void benchmark_recv_packet_handler(const size_t spp, const std::string& format)
+{
+ const size_t bpi = uhd::convert::get_bytes_per_item(format);
+ const size_t frame_size = bpi * spp + MAX_HEADER_LEN;
+
+ mock_zero_copy::sptr xport(new mock_zero_copy(
+ vrt::if_packet_info_t::LINK_TYPE_CHDR, frame_size, frame_size));
// Create packet for packet handler to read
vrt::if_packet_info_t packet_info;
@@ -66,6 +188,47 @@ void benchmark_recv_packet_handler(const size_t spp, const std::string& format)
std::vector<uint32_t> recv_data(spp, 0);
xport->push_back_recv_packet(packet_info, recv_data);
+ xport->set_reuse_recv_memory(true);
+
+ // Configure xport flow control
+ boost::shared_ptr<rx_fc_cache_t> fc_cache(new rx_fc_cache_t());
+ fc_cache->to_host = uhd::ntohx<uint32_t>;
+ fc_cache->from_host = uhd::htonx<uint32_t>;
+ fc_cache->pack = vrt::chdr::if_hdr_pack_be;
+ fc_cache->unpack = vrt::chdr::if_hdr_unpack_be;
+ fc_cache->xport = xport;
+ fc_cache->interval = std::numeric_limits<std::size_t>::max();
+
+ auto zero_copy_xport = zero_copy_flow_ctrl::make(
+ xport, 0, [fc_cache](managed_buffer::sptr buff) {
+ return rx_flow_ctrl(fc_cache, buff);
+ });
+
+ // Create streamer
+ auto streamer = boost::make_shared<sph::recv_packet_streamer>(spp);
+ streamer->set_tick_rate(1.0);
+ streamer->set_samp_rate(1.0);
+
+ // Configure streamer xport
+ streamer->set_vrt_unpacker(&vrt::chdr::if_hdr_unpack_be);
+ streamer->set_xport_chan_get_buff(0,
+ [zero_copy_xport](double timeout) { return zero_copy_xport->get_recv_buff(timeout); },
+ false // flush
+ );
+
+ // Configure flow control ack
+ streamer->set_xport_handle_flowctrl_ack(
+ 0, [fc_cache](const uint32_t* payload) {
+ handle_rx_flowctrl_ack(fc_cache, payload);
+ });
+
+ // Configure converter
+ uhd::convert::id_type id;
+ id.output_format = format;
+ id.num_inputs = 1;
+ id.input_format = "sc16_item32_be";
+ id.num_outputs = 1;
+ streamer->set_converter(id);
// Allocate buffer
std::vector<uint8_t> buffer(spp * bpi);
@@ -78,7 +241,7 @@ void benchmark_recv_packet_handler(const size_t spp, const std::string& format)
const size_t iterations = 1e7;
for (size_t i = 0; i < iterations; i++) {
- streamer.recv(buffers, spp, md, 1.0, true);
+ streamer->recv(buffers, spp, md, 1.0, true);
}
const auto end_time = std::chrono::steady_clock::now();
@@ -93,26 +256,48 @@ void benchmark_send_packet_handler(
const size_t spp, const std::string& format, bool use_time_spec)
{
const size_t bpi = uhd::convert::get_bytes_per_item(format);
- const size_t frame_size = bpi * spp + DEVICE3_TX_MAX_HDR_LEN;
+ const size_t frame_size = bpi * spp + MAX_HEADER_LEN;
mock_zero_copy::sptr xport(new mock_zero_copy(
vrt::if_packet_info_t::LINK_TYPE_CHDR, frame_size, frame_size));
xport->set_reuse_send_memory(true);
- sph::send_packet_streamer streamer(spp);
- streamer.set_vrt_packer(&vrt::chdr::if_hdr_pack_be);
+ // Configure flow control
+ boost::shared_ptr<tx_fc_cache_t> fc_cache(new tx_fc_cache_t());
+ fc_cache->to_host = uhd::ntohx<uint32_t>;
+ fc_cache->from_host = uhd::htonx<uint32_t>;
+ fc_cache->pack = vrt::chdr::if_hdr_pack_be;
+ fc_cache->unpack = vrt::chdr::if_hdr_unpack_be;
+ fc_cache->window_size = UINT32_MAX;
+
+ auto zero_copy_xport = zero_copy_flow_ctrl::make(xport,
+ [fc_cache, xport](managed_buffer::sptr buff) {
+ return tx_flow_ctrl(fc_cache, xport, buff);
+ },
+ 0);
+ // Create streamer
+ auto streamer = boost::make_shared<sph::send_packet_streamer>(spp);
+ streamer->set_vrt_packer(&vrt::chdr::if_hdr_pack_be);
+
+ // Configure converter
uhd::convert::id_type id;
id.input_format = format;
id.num_inputs = 1;
id.output_format = "sc16_item32_be";
id.num_outputs = 1;
- streamer.set_converter(id);
- streamer.set_enable_trailer(false);
+ streamer->set_converter(id);
+ streamer->set_enable_trailer(false);
+
+ // Configure streamer xport
+ streamer->set_xport_chan_get_buff(
+ 0, [zero_copy_xport](double timeout) { return zero_copy_xport->get_send_buff(timeout); });
- streamer.set_xport_chan_get_buff(
- 0, [xport](double timeout) { return xport->get_send_buff(timeout); });
+ // Configure flow control ack
+ streamer->set_xport_chan_post_send_cb(0, [fc_cache, zero_copy_xport]() {
+ tx_flow_ctrl_ack(fc_cache, zero_copy_xport, 0);
+ });
// Allocate buffer
std::vector<uint8_t> buffer(spp * bpi);
@@ -130,7 +315,7 @@ void benchmark_send_packet_handler(
if (use_time_spec) {
md.time_spec = uhd::time_spec_t(i, 0.0);
}
- streamer.send(buffers, spp, md, 1.0);
+ streamer->send(buffers, spp, md, 1.0);
}
const auto end_time = std::chrono::steady_clock::now();
@@ -141,164 +326,6 @@ void benchmark_send_packet_handler(
<< time_per_packet * 1e9 << " ns/packet\n";
}
-void benchmark_device3_rx_flow_ctrl(bool send_flow_control_packet)
-{
- // Arbitrary sizes
- constexpr uint32_t fc_window = 10000;
-
- mock_zero_copy::sptr xport(new mock_zero_copy(vrt::if_packet_info_t::LINK_TYPE_CHDR));
-
- xport->set_reuse_recv_memory(true);
- xport->set_reuse_send_memory(true);
-
- boost::shared_ptr<rx_fc_cache_t> fc_cache(new rx_fc_cache_t());
- fc_cache->to_host = uhd::ntohx<uint32_t>;
- fc_cache->from_host = uhd::htonx<uint32_t>;
- fc_cache->pack = vrt::chdr::if_hdr_pack_be;
- fc_cache->unpack = vrt::chdr::if_hdr_unpack_be;
- fc_cache->xport = xport;
- fc_cache->interval = fc_window;
-
- // Create data buffer to pass to flow control function. Number of payload
- // words is arbitrary, just has to fit in the buffer.
- vrt::if_packet_info_t packet_info;
- packet_info.packet_type = vrt::if_packet_info_t::PACKET_TYPE_DATA;
- packet_info.num_payload_words32 = 100;
- packet_info.num_payload_bytes = packet_info.num_payload_words32 * sizeof(uint32_t);
- packet_info.has_tsf = false;
-
- std::vector<uint32_t> recv_data(packet_info.num_payload_words32, 0);
- xport->push_back_recv_packet(packet_info, recv_data);
-
- auto recv_buffer = xport->get_recv_buff(1.0);
-
- // Run benchmark
- const auto start_time = std::chrono::steady_clock::now();
-
- constexpr size_t iterations = 1e7;
-
- for (size_t i = 0; i < iterations; i++) {
- fc_cache->total_bytes_consumed = send_flow_control_packet ? fc_window : 0;
- fc_cache->last_byte_count = 0;
-
- rx_flow_ctrl(fc_cache, recv_buffer);
- }
-
- const auto end_time = std::chrono::steady_clock::now();
- const std::chrono::duration<double> elapsed_time(end_time - start_time);
-
- std::cout << elapsed_time.count() / iterations * 1e9 << " ns per call\n";
-}
-
-void benchmark_device3_handle_rx_flow_ctrl_ack()
-{
- // Arbitrary sizes
- constexpr uint32_t fc_window = 10000;
-
- mock_zero_copy::sptr xport(new mock_zero_copy(vrt::if_packet_info_t::LINK_TYPE_CHDR));
-
- xport->set_reuse_recv_memory(true);
- xport->set_reuse_send_memory(true);
-
- boost::shared_ptr<rx_fc_cache_t> fc_cache(new rx_fc_cache_t());
- fc_cache->to_host = uhd::ntohx<uint32_t>;
- fc_cache->from_host = uhd::htonx<uint32_t>;
- fc_cache->pack = vrt::chdr::if_hdr_pack_be;
- fc_cache->unpack = vrt::chdr::if_hdr_unpack_be;
- fc_cache->xport = xport;
- fc_cache->interval = fc_window;
- fc_cache->total_bytes_consumed = 100;
-
- // Payload should contain packet count and byte count
- std::vector<uint32_t> payload_data;
- payload_data.push_back(fc_cache->to_host(10)); // packet count
- payload_data.push_back(fc_cache->to_host(100)); // byte count
-
- // Run benchmark
- const auto start_time = std::chrono::steady_clock::now();
- constexpr size_t iterations = 1e7;
-
- for (size_t i = 0; i < iterations; i++) {
- handle_rx_flowctrl_ack(fc_cache, payload_data.data());
- }
-
- const auto end_time = std::chrono::steady_clock::now();
- const std::chrono::duration<double> elapsed_time(end_time - start_time);
-
- std::cout << elapsed_time.count() / iterations * 1e9 << " ns per call\n";
-}
-
-void benchmark_device3_tx_flow_ctrl(bool send_flow_control_packet)
-{
- // Arbitrary sizes
- constexpr uint32_t fc_window = 10000;
-
- mock_zero_copy::sptr xport(new mock_zero_copy(vrt::if_packet_info_t::LINK_TYPE_CHDR));
-
- xport->set_reuse_recv_memory(true);
-
- boost::shared_ptr<tx_fc_cache_t> fc_cache(new tx_fc_cache_t(fc_window));
-
- fc_cache->to_host = uhd::ntohx<uint32_t>;
- fc_cache->from_host = uhd::htonx<uint32_t>;
- fc_cache->pack = vrt::chdr::if_hdr_pack_be;
- fc_cache->unpack = vrt::chdr::if_hdr_unpack_be;
-
- xport->push_back_flow_ctrl_packet(
- vrt::if_packet_info_t::PACKET_TYPE_FC, 1 /*packet*/, fc_window /*bytes*/);
-
- // Run benchmark
- const auto start_time = std::chrono::steady_clock::now();
- constexpr size_t iterations = 1e7;
- managed_send_buffer::sptr send_buffer = xport->get_send_buff(0.0);
-
- for (size_t i = 0; i < iterations; i++) {
- fc_cache->byte_count = send_flow_control_packet ? fc_window : 0;
- fc_cache->last_byte_ack = 0;
-
- tx_flow_ctrl(fc_cache, xport, send_buffer);
- }
-
- const auto end_time = std::chrono::steady_clock::now();
- const std::chrono::duration<double> elapsed_time(end_time - start_time);
-
- std::cout << elapsed_time.count() / iterations * 1e9 << " ns per call\n";
-}
-
-void benchmark_device3_tx_flow_ctrl_ack()
-{
- // Arbitrary sizes
- constexpr uint32_t fc_window = 10000;
-
- mock_zero_copy::sptr xport(new mock_zero_copy(vrt::if_packet_info_t::LINK_TYPE_CHDR));
-
- xport->set_reuse_send_memory(true);
-
- boost::shared_ptr<tx_fc_cache_t> fc_cache(new tx_fc_cache_t(fc_window));
-
- fc_cache->to_host = uhd::ntohx<uint32_t>;
- fc_cache->from_host = uhd::htonx<uint32_t>;
- fc_cache->pack = vrt::chdr::if_hdr_pack_be;
- fc_cache->unpack = vrt::chdr::if_hdr_unpack_be;
-
- // Run benchmark
- const auto start_time = std::chrono::steady_clock::now();
- constexpr size_t iterations = 1e7;
- uhd::sid_t send_sid;
-
- for (size_t i = 0; i < iterations; i++) {
- // Setup fc_cache to require an ack
- fc_cache->fc_received = true;
-
- tx_flow_ctrl_ack(fc_cache, xport, send_sid);
- }
-
- const auto end_time = std::chrono::steady_clock::now();
- const std::chrono::duration<double> elapsed_time(end_time - start_time);
-
- std::cout << elapsed_time.count() / iterations * 1e9 << " ns per call\n";
-}
-
int UHD_SAFE_MAIN(int argc, char* argv[])
{
po::options_description desc("Allowed options");
@@ -320,63 +347,34 @@ int UHD_SAFE_MAIN(int argc, char* argv[])
}
const char* formats[] = {"sc16", "fc32", "fc64"};
- constexpr size_t rx_spp = 2000;
- constexpr size_t tx_spp = 1000;
+ constexpr size_t spp = 1000;
+ std::cout << "spp: " << spp << "\n";
std::cout << "----------------------------------------------------------\n";
- std::cout << "Benchmark of recv with no flow control and mock transport \n";
+ std::cout << "Benchmark of recv with mock link \n";
std::cout << "----------------------------------------------------------\n";
- std::cout << "spp: " << rx_spp << "\n";
for (size_t i = 0; i < std::extent<decltype(formats)>::value; i++) {
- benchmark_recv_packet_handler(rx_spp, formats[i]);
+ benchmark_recv_packet_handler(spp, formats[i]);
}
std::cout << "\n";
std::cout << "----------------------------------------------------------\n";
- std::cout << "Benchmark of send with no flow control and mock transport \n";
+ std::cout << "Benchmark of send with mock link \n";
std::cout << "----------------------------------------------------------\n";
- std::cout << "spp: " << tx_spp << "\n";
std::cout << "*** without timespec ***\n";
for (size_t i = 0; i < std::extent<decltype(formats)>::value; i++) {
- benchmark_send_packet_handler(tx_spp, formats[i], false);
+ benchmark_send_packet_handler(spp, formats[i], false);
}
std::cout << "\n";
std::cout << "*** with timespec ***\n";
for (size_t i = 0; i < std::extent<decltype(formats)>::value; i++) {
- benchmark_send_packet_handler(tx_spp, formats[i], true);
+ benchmark_send_packet_handler(spp, formats[i], true);
}
std::cout << "\n";
- std::cout << "----------------------------------------------------------\n";
- std::cout << " Benchmark of flow control functions with mock transport \n";
- std::cout << "----------------------------------------------------------\n";
- std::cout << "*** device3_tx_flow_ctrl with no flow control packet ***\n";
- benchmark_device3_tx_flow_ctrl(false);
- std::cout << "\n";
-
- std::cout << "*** device3_tx_flow_ctrl with flow control packet ***\n";
- benchmark_device3_tx_flow_ctrl(true);
- std::cout << "\n";
-
- std::cout << "*** device3_tx_flow_ctrl_ack ***\n";
- benchmark_device3_tx_flow_ctrl_ack();
- std::cout << "\n";
-
- std::cout << "*** device3_rx_flow_ctrl with no flow control packet ***\n";
- benchmark_device3_rx_flow_ctrl(false);
- std::cout << "\n";
-
- std::cout << "*** device3_rx_flow_ctrl with flow control packet ***\n";
- benchmark_device3_rx_flow_ctrl(true);
- std::cout << "\n";
-
- std::cout << "*** device3_handle_rx_flow_ctrl_ack ***\n";
- benchmark_device3_handle_rx_flow_ctrl_ack();
- std::cout << "\n";
-
return EXIT_SUCCESS;
}