diff options
| author | Samuel O'Brien <sam.obrien@ni.com> | 2020-07-23 16:30:32 -0500 | 
|---|---|---|
| committer | Aaron Rossetto <aaron.rossetto@ni.com> | 2020-07-24 15:26:36 -0500 | 
| commit | 97852aba2393a20fd5e0c25313d26be4ce316a25 (patch) | |
| tree | f223a77d234f5c891f9094ef86f3e0e050c19b98 | |
| parent | 54d698e3707cf1be5d38537db783ebadd850e729 (diff) | |
| download | uhd-97852aba2393a20fd5e0c25313d26be4ce316a25.tar.gz uhd-97852aba2393a20fd5e0c25313d26be4ce316a25.tar.bz2 uhd-97852aba2393a20fd5e0c25313d26be4ce316a25.zip | |
mpm: Fix gevent errors on SIGTERM
Sometimes when running usrp_hwd.py in a terminal and then canceling it
with Ctrl+C, it prints a really large stacktrace into the terminal
resulting from an uncaught gevent BlockingSwitchOutError. It seems like
there was an attempt to catch this in usrp_hwd.py:kill_time(). This
try-except was surrounding a call to Process.join() which, to the best
of my knowledge, can't ever throw this exception.
Based on my troubleshooting, this error comes from the SIGTERM signal
handler of the RPC process. The handler (defined in
rpc_server.py:_rpc_server_process), is just a direct call to
RPCServer.stop(). When the server's backed is a thread pool, this call
may block when joining the thread pool, causing gevent to complain about
execution attempting to block in a signal handler.
This commit resolves this issue by simply triggering an event in the
signal handler which prompts a different thread to clean up the server
and end the process.
Signed-off-by: Samuel O'Brien <sam.obrien@ni.com>
| -rwxr-xr-x | mpm/python/usrp_hwd.py | 3 | ||||
| -rw-r--r-- | mpm/python/usrp_mpm/rpc_server.py | 15 | 
2 files changed, 13 insertions, 5 deletions
| diff --git a/mpm/python/usrp_hwd.py b/mpm/python/usrp_hwd.py index f79932231..3523fa9b4 100755 --- a/mpm/python/usrp_hwd.py +++ b/mpm/python/usrp_hwd.py @@ -102,10 +102,7 @@ def kill_time(sig, frame):          proc.terminate()          log.info("Terminating pid: {0}".format(proc.pid))      for proc in _PROCESSES: -        try:              proc.join() -        except BlockingSwitchOutError: -            log.debug("Caught BlockingSwitchOutError for {}".format(str(proc)))      log.info("System exiting")      sys.exit(0) diff --git a/mpm/python/usrp_mpm/rpc_server.py b/mpm/python/usrp_mpm/rpc_server.py index 8b87c52d8..65428f116 100644 --- a/mpm/python/usrp_mpm/rpc_server.py +++ b/mpm/python/usrp_mpm/rpc_server.py @@ -13,6 +13,8 @@ import copy  from random import choice  from string import ascii_letters, digits  from multiprocessing import Process +import threading +import sys  from gevent.server import StreamServer  from gevent.pool import Pool  from gevent import signal @@ -555,8 +557,17 @@ def _rpc_server_process(shared_state, port, default_args):          handle=MPMServer(shared_state, default_args),          spawn=connections)      # catch signals and stop the stream server -    signal(signal.SIGTERM, lambda *args: server.stop()) -    signal(signal.SIGINT, lambda *args: server.stop()) +    # Previously, the signal callbacks simply called server.stop() +    # gevent doesn't like this because server.stop() may block waiting +    # for greenlets to stop, and signal callbacks are not supposed to block +    stop_event = threading.Event() +    def stop_worker(): +        stop_event.wait() +        server.stop() +        sys.exit(0) +    threading.Thread(target=stop_worker, daemon=True).start() +    signal(signal.SIGTERM, lambda *args: stop_event.set()) +    signal(signal.SIGINT, lambda *args: stop_event.set())      server.serve_forever() | 
