diff options
author | Martin Braun <martin.braun@ettus.com> | 2019-02-21 15:58:04 -0800 |
---|---|---|
committer | Martin Braun <martin.braun@ettus.com> | 2019-02-22 16:12:23 -0800 |
commit | a272da1d65d7c3dd3da0180c10064d55db2a52dc (patch) | |
tree | 3f926cc4a79f46dd15bfc947f6567daefd1601c2 /host/lib/usrp/mpmd/mpmd_mboard_impl.cpp | |
parent | 0c658067bd1f75bd6f6175cec556d8384b647953 (diff) | |
download | uhd-a272da1d65d7c3dd3da0180c10064d55db2a52dc.tar.gz uhd-a272da1d65d7c3dd3da0180c10064d55db2a52dc.tar.bz2 uhd-a272da1d65d7c3dd3da0180c10064d55db2a52dc.zip |
mpmd: Allow reclaim failures on component updates
MPM has a flag that identifies component reloads as requiring to restart
the RPC server. This change honours that flag, and doesn't cause a fatal
failure when reclaims fail to ack for certain operations.
For example, running uhd_image_loader on an N310 could fail after the
FPGA was reloaded because the communication to the RPC server was
temporarily interrupted. This is not always avoidable, since the RPC
server does actually go down, and Ethernet connections might also be
lost. So, we cut our losses and accept failures in that case.
Diffstat (limited to 'host/lib/usrp/mpmd/mpmd_mboard_impl.cpp')
-rw-r--r-- | host/lib/usrp/mpmd/mpmd_mboard_impl.cpp | 40 |
1 files changed, 28 insertions, 12 deletions
diff --git a/host/lib/usrp/mpmd/mpmd_mboard_impl.cpp b/host/lib/usrp/mpmd/mpmd_mboard_impl.cpp index 11404ffaf..da4f99794 100644 --- a/host/lib/usrp/mpmd/mpmd_mboard_impl.cpp +++ b/host/lib/usrp/mpmd/mpmd_mboard_impl.cpp @@ -1,5 +1,6 @@ // // Copyright 2017 Ettus Research, a National Instruments Company +// Copyright 2019 Ettus Research, a National Instruments Brand // // SPDX-License-Identifier: GPL-3.0-or-later // @@ -301,12 +302,7 @@ mpmd_mboard_impl::mpmd_mboard_impl( mpmd_mboard_impl::~mpmd_mboard_impl() { - try { - dump_logs(); - } catch (...) { - UHD_LOG_WARNING("MPMD", "Could not flush log queue on exit!"); - } - UHD_SAFE_CALL(if (not rpc->request_with_token<bool>("unclaim")) { + UHD_SAFE_CALL(dump_logs(); if (not rpc->request_with_token<bool>("unclaim")) { UHD_LOG_WARNING("MPMD", "Failure to ack unclaim!"); }); } @@ -398,10 +394,25 @@ uhd::device_addr_t mpmd_mboard_impl::get_tx_hints() const bool mpmd_mboard_impl::claim() { try { - return _claim_rpc->request_with_token<bool>("reclaim"); - } catch (...) { - UHD_LOG_WARNING("MPMD", "Reclaim failed. Exiting claimer loop."); - return false; + auto result = _claim_rpc->request_with_token<bool>("reclaim"); + // When _allow_claim_failure_flag goes from true to false, we still have + // to wait for a successful reclaim before we can also set + // _allow_claim_failure_latch to false, because we have no way of + // synchronizing those events. + // In other words, we might be setting allow_claim_failure back to false + // too soon, but we have no way of knowing exactly when the right time + // is. + _allow_claim_failure_latch = _allow_claim_failure_flag.load(); + return result; + } catch (const uhd::runtime_error& ex) { + // Note: Any RPC error will raise a uhd::runtime_error. Other errors are + // not handled here. + if (_allow_claim_failure_latch) { + UHD_LOG_DEBUG("MPMD", ex.what()); + } else { + UHD_LOG_WARNING("MPMD", ex.what()); + } + return _allow_claim_failure_latch; } } @@ -420,8 +431,13 @@ uhd::task::sptr mpmd_mboard_impl::claim_device_and_make_task() auto now = std::chrono::steady_clock::now(); if (not this->claim()) { throw uhd::value_error("mpmd device reclaiming loop failed!"); - }; - this->dump_logs(); + } else { + try { + this->dump_logs(); + } catch(const uhd::runtime_error&) { + UHD_LOG_WARNING("MPMD", "Could not read back log queue!"); + } + } std::this_thread::sleep_until( now + std::chrono::milliseconds(MPMD_RECLAIM_INTERVAL_MS)); }); |