forked from rwth-i6/returnn
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathDebug.py
440 lines (380 loc) · 14.1 KB
/
Debug.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
"""
Some generic debugging utilities.
"""
import functools
import os
import signal
import sys
import threading

try:
    import thread
except ImportError:
    import _thread as thread
# Maps a signal number to its symbolic name, e.g. ``signal.SIGINT`` -> "SIGINT".
# Only ``SIG*`` names are used; the ``SIG_*`` constants (e.g. ``SIG_DFL``) are skipped.
# The names are visited in descending alphabetical order, so if several names
# share one number, the alphabetically first name is the one which is kept.
signum_to_signame = {
    sig_value: sig_name
    for sig_name, sig_value in sorted(signal.__dict__.items(), reverse=True)
    if sig_name.startswith("SIG") and not sig_name.startswith("SIG_")}

# Ids of threads for which dump_all_thread_tracebacks() prints no traceback.
global_exclude_thread_ids = set()
def auto_exclude_all_new_threads(func):
    """
    Decorator. After each call of ``func``, the ids of all threads which exist
    after the call but did not exist before the call
    are added to ``global_exclude_thread_ids``.

    :param T func:
    :return: func wrapped
    :rtype: T
    """

    @functools.wraps(func)  # keep name, docstring etc. of the wrapped function
    def wrapped(*args, **kwargs):
        """
        :param args: passed on to ``func``
        :param kwargs: passed on to ``func``
        :return: whatever ``func`` returns
        """
        # noinspection PyProtectedMember
        old_threads = set(sys._current_frames().keys())
        res = func(*args, **kwargs)
        # noinspection PyProtectedMember
        new_threads = set(sys._current_frames().keys())
        # Keep only the thread ids which were not there before the call.
        new_threads -= old_threads
        global_exclude_thread_ids.update(new_threads)
        return res

    return wrapped
def dump_all_thread_tracebacks(exclude_thread_ids=None, exclude_self=False):
    """
    Prints the stack of every thread known to the :mod:`threading` module on stdout.
    For threads in ``global_exclude_thread_ids`` or in ``exclude_thread_ids``,
    only a header line and a short note are printed, not the traceback.

    :param set[int] exclude_thread_ids: ids of threads for which no traceback should be printed
    :param bool exclude_self: if True, the calling thread is excluded as well
    """
    if exclude_thread_ids is None:
        exclude_thread_ids = set()
    import better_exchook
    import threading
    current_thread = threading.current_thread()
    if exclude_self:
        exclude_thread_ids = set(exclude_thread_ids) | {current_thread.ident}
    if not hasattr(sys, "_current_frames"):
        print("Does not have sys._current_frames, cannot get thread tracebacks.")
        return
    print("")
    threads = {t.ident: t for t in threading.enumerate()}
    # noinspection PyProtectedMember
    for tid, stack in sorted(sys._current_frames().items()):
        # This is a bug in earlier Python versions.
        # http://bugs.python.org/issue17094
        # Note that this leaves out all threads not created via the threading module.
        if tid not in threads:
            continue
        thread_ = threads[tid]
        assert isinstance(thread_, threading.Thread)
        tags = []
        if thread_ is current_thread:
            tags.append("current")
        # noinspection PyUnresolvedReferences,PyProtectedMember
        if isinstance(thread_, threading._MainThread):
            tags.append("main")
        tags.append(str(thread_))
        print("Thread %s:" % ", ".join(tags))
        if tid in global_exclude_thread_ids:
            print("(Auto-ignored traceback.)")
        elif tid in exclude_thread_ids:
            print("(Excluded thread.)")
        else:
            better_exchook.print_tb(stack, file=sys.stdout)
        print("")
    print("That were all threads.")
def setup_warn_with_traceback():
    """
    Replaces ``warnings.showwarning`` by a function which writes the formatted warning
    and then additionally prints a stack trace via :mod:`better_exchook`.
    """
    import warnings
    import better_exchook

    def warn_with_traceback(message, category, filename, lineno, file=None, line=None):
        """
        Same signature as ``warnings.showwarning``.

        :param message:
        :param category:
        :param filename:
        :param lineno:
        :param file: used as output if it has a ``write`` attribute, otherwise ``sys.stderr`` is used
        :param line:
        """
        if hasattr(file, 'write'):
            out = file
        else:
            out = sys.stderr
        text = warnings.formatwarning(message, category, filename, lineno, line)
        out.write(text)
        # The stack is printed starting from the frame of this hook itself.
        # noinspection PyProtectedMember
        current_frame = sys._getframe()
        better_exchook.print_tb(current_frame, file=out)

    warnings.showwarning = warn_with_traceback
def init_better_exchook():
    """
    Installs our own ``sys.excepthook``, which uses :mod:`better_exchook`,
    but adds some special handling for the main thread.
    Additionally calls :func:`setup_warn_with_traceback`
    if the env var ``DEBUG_WARN_WITH_TRACEBACK`` is set to a true value.
    """
    import better_exchook

    def excepthook(exc_type, exc_obj, exc_tb):
        """
        :param exc_type:
        :param exc_obj:
        :param exc_tb:
        """
        # noinspection PyBroadException
        try:
            # noinspection PyUnresolvedReferences,PyProtectedMember
            is_main_thread = isinstance(threading.current_thread(), threading._MainThread)
        except Exception:  # Can happen at a very late state while quitting.
            if exc_type is KeyboardInterrupt:
                return
        else:
            if is_main_thread:
                if exc_type is KeyboardInterrupt and getattr(sys, "exited", False):
                    # Got SIGINT twice. Can happen.
                    return
                # An unhandled exception in the main thread. This means that we are going to quit now.
                sys.exited = True
        print("Unhandled exception %s in thread %s, proc %i." % (exc_type, threading.current_thread(), os.getpid()))
        if exc_type is KeyboardInterrupt:
            return
        # noinspection PyUnresolvedReferences,PyProtectedMember
        if isinstance(threading.current_thread(), threading._MainThread):
            main_thread_id = thread.get_ident()
            # NOTE(review): exc_type is a class, not an instance, so isinstance(exc_type, Exception)
            # is false for ordinary exception classes, i.e. this condition effectively always holds
            # and the dump happens for every unhandled exception in the main thread.
            # Kept as-is to not change the output; confirm whether issubclass() was intended.
            if not isinstance(exc_type, Exception):
                # We are the main thread and we got an exit-exception. This is likely fatal.
                # This usually means an exit. (We ignore non-daemon threads and procs here.)
                # Print the stack of all other threads.
                dump_all_thread_tracebacks(exclude_thread_ids={main_thread_id})
        better_exchook.better_exchook(exc_type, exc_obj, exc_tb, file=sys.stdout)

    sys.excepthook = excepthook

    from Util import to_bool
    if os.environ.get("DEBUG_WARN_WITH_TRACEBACK") and to_bool(os.environ.get("DEBUG_WARN_WITH_TRACEBACK")):
        setup_warn_with_traceback()
def format_signum(signum):
    """
    Formats a signal number together with its name as looked up in ``signum_to_signame``.

    :param int signum:
    :return: string "signum (signame)"; the name is "unknown" if the number is not in the table
    :rtype: str
    """
    signame = signum_to_signame.get(signum, "unknown")
    return "%s (%s)" % (signum, signame)
# noinspection PyUnusedLocal
def signal_handler(signum, frame):
    """
    Signal handler which reports the received signal on stdout
    and then dumps the stacks of all threads.

    :param int signum: e.g. signal.SIGUSR1
    :param frame: ignored, will dump all threads
    """
    signal_description = format_signum(signum)
    print("Signal handler: got signal %s" % signal_description)
    dump_all_thread_tracebacks()
def install_signal_handler_if_default(signum, exceptions_are_fatal=False):
    """
    Registers :func:`signal_handler` for the signal,
    but only if the currently registered handler is ``signal.SIG_DFL``.

    :param int signum: e.g. signal.SIGUSR1
    :param bool exceptions_are_fatal: if True, will reraise any exceptions. if False, will just print a message
    :return: True iff no exception, False otherwise. not necessarily that we registered our own handler
    :rtype: bool
    """
    try:
        current_handler = signal.getsignal(signum)
        if current_handler == signal.SIG_DFL:
            signal.signal(signum, signal_handler)
    except Exception as exc:
        if exceptions_are_fatal:
            raise
        print("Cannot install signal handler for signal %s, exception %s" % (format_signum(signum), exc))
        return False
    # No exception, regardless of whether some other handler was already there.
    return True
def install_native_signal_handler():
    """
    Installs some own custom C signal handler.
    This is best effort: any exception (e.g. the shared library cannot be loaded)
    is caught and only reported on stdout.
    """
    try:
        import ctypes
        # TODO: Move C code here, automatically compile it on-the-fly or so.
        # C code: https://github.com/albertz/playground/blob/master/signal_handler.c
        # Maybe not needed because on Linux there is libSegFault.so anyway (installLibSigSegfault()).
        lib = ctypes.CDLL("/u/zeyer/code/playground/signal_handler.so")
        # The ctypes attribute for the result type is ``restype``.
        # (Any other attribute name would just be ignored by ctypes.)
        lib.install_signal_handler.restype = None
        lib.install_signal_handler()
        print("Installed signal_handler.so.")
    except Exception as exc:
        print("installNativeSignalHandler exception: %s" % exc)
def install_lib_sig_segfault():
    """
    Installs libSegFault (common on Unix/Linux).
    Sets the env var ``SEGFAULT_SIGNALS`` to "all" if it is not set yet.
    This is best effort: any exception (e.g. the library is not found)
    is caught and only reported on stdout.
    """
    try:
        os.environ.setdefault("SEGFAULT_SIGNALS", "all")
        import ctypes
        import ctypes.util
        # libSegFault on Unix/Linux, not on MacOSX
        libfn = ctypes.util.find_library("SegFault")
        if not libfn:
            # Explicit check instead of an assert: asserts are skipped with ``python -O``,
            # and then we would call ctypes.CDLL(None), which does not load libSegFault,
            # and we would wrongly report success below.
            raise RuntimeError("libSegFault not found")
        # Nothing more needed than loading it, it will automatically register itself.
        ctypes.CDLL(libfn)
        print("Installed libSegFault.so.")
    except Exception as exc:
        print("installLibSigSegfault exception: %s" % exc)
def init_faulthandler(sigusr1_chain=False):
    """
    Maybe installs signal handlers, SIGUSR1 and SIGUSR2 and others.
    If no signals handlers are installed yet for SIGUSR1/2, we try to install our own Python handler.
    This also tries to install the handler from the faulthandler module,
    esp for SIGSEGV and others.

    :param bool sigusr1_chain: whether the default SIGUSR1 handler should also be called.
    """
    from Util import to_bool
    on_windows = sys.platform == 'win32'
    # Enable libSigSegfault first, so that we can have both,
    # because faulthandler will also call the original sig handler.
    debug_signal_handler = os.environ.get("DEBUG_SIGNAL_HANDLER")
    if debug_signal_handler and to_bool(debug_signal_handler):
        install_lib_sig_segfault()
        install_native_signal_handler()
    if not on_windows:
        # In case that sigusr1_chain, we expect that there is already some handler
        # for SIGUSR1, and then this will not overwrite this handler.
        sigusr1_ok = install_signal_handler_if_default(signal.SIGUSR1)
        if sigusr1_ok:
            # There is already some handler or we installed our own handler now,
            # so in any case, it's safe that we chain then handler.
            sigusr1_chain = True
        # Why not also SIGUSR2... SGE can also send this signal.
        install_signal_handler_if_default(signal.SIGUSR2)
    try:
        import faulthandler
    except ImportError as e:
        print("faulthandler import error. %s" % e)
        return
    # Only enable if not yet enabled -- otherwise, leave it in its current state.
    if faulthandler.is_enabled():
        return
    faulthandler.enable()
    if not on_windows:
        faulthandler.register(signal.SIGUSR1, all_threads=True, chain=sigusr1_chain)
@auto_exclude_all_new_threads
def init_ipython_kernel():
    """
    Runs IPython in some background kernel, where you can connect to.
    Must be called from the main thread.
    If the IPython/ZMQ imports or the kernel setup fail,
    a message is printed on stdout and nothing is started.
    """
    # You can remotely connect to this kernel. See the output on stdout.
    try:
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        import IPython.kernel.zmq.ipkernel
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        from IPython.kernel.zmq.ipkernel import Kernel
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        from IPython.kernel.zmq.heartbeat import Heartbeat
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        from IPython.kernel.zmq.session import Session
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        from IPython.kernel import write_connection_file
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        import zmq
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        from zmq.eventloop import ioloop
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        from zmq.eventloop.zmqstream import ZMQStream
        # noinspection PyPackageRequirements,PyUnresolvedReferences
        IPython.kernel.zmq.ipkernel.signal = lambda sig, f: None  # Overwrite.
    except ImportError as e:
        print("IPython import error, cannot start IPython kernel. %s" % e)
        return
    import atexit
    import socket
    import logging
    import threading
    # Do in mainthread to avoid history sqlite DB errors at exit.
    # https://github.com/ipython/ipython/issues/680
    # noinspection PyUnresolvedReferences,PyProtectedMember
    assert isinstance(threading.current_thread(), threading._MainThread)
    try:
        ip = socket.gethostbyname(socket.gethostname())
        connection_file = "ipython-kernel-%s-%s.json" % (ip, os.getpid())

        def cleanup_connection_file():
            """
            Cleanup. Removes the connection file; it is not an error if that fails.
            """
            try:
                os.remove(connection_file)
            except (IOError, OSError):
                pass

        atexit.register(cleanup_connection_file)
        # Logger which discards everything.
        logger = logging.Logger("IPython")
        logger.addHandler(logging.NullHandler())
        session = Session(username=u'kernel')
        context = zmq.Context.instance()
        transport = "tcp"
        addr = "%s://%s" % (transport, ip)
        shell_socket = context.socket(zmq.ROUTER)
        shell_port = shell_socket.bind_to_random_port(addr)
        iopub_socket = context.socket(zmq.PUB)
        iopub_port = iopub_socket.bind_to_random_port(addr)
        control_socket = context.socket(zmq.ROUTER)
        control_port = control_socket.bind_to_random_port(addr)
        hb_ctx = zmq.Context()
        heartbeat = Heartbeat(hb_ctx, (transport, ip, 0))
        hb_port = heartbeat.port
        heartbeat.start()
        shell_stream = ZMQStream(shell_socket)
        control_stream = ZMQStream(control_socket)
        kernel = Kernel(session=session,
                        shell_streams=[shell_stream, control_stream],
                        iopub_socket=iopub_socket,
                        log=logger)
        write_connection_file(connection_file,
                              shell_port=shell_port, iopub_port=iopub_port, control_port=control_port,
                              hb_port=hb_port,
                              ip=ip)
        # print "To connect another client to this IPython kernel, use:", \
        #       "ipython console --existing %s" % connection_file
    except Exception as e:
        print("Exception while initializing IPython ZMQ kernel. %s" % e)
        return

    def ipython_thread():
        """
        IPython thread. Starts the kernel and runs the ZMQ IO loop.
        """
        kernel.start()
        try:
            ioloop.IOLoop.instance().start()
        except KeyboardInterrupt:
            pass

    thread_ = threading.Thread(target=ipython_thread, name="IPython kernel")
    thread_.daemon = True
    thread_.start()
def init_cuda_not_in_main_proc_check():
    """
    Replaces ``theano.sandbox.cuda.use`` by a wrapper which reports every call
    together with the current pid on stdout, and then calls the original function.
    If ``cuda.use.device_number`` is already set, only a message is printed and nothing is replaced.
    """
    # noinspection PyUnresolvedReferences,PyPackageRequirements
    import theano.sandbox.cuda as cuda
    if cuda.use.device_number is not None:
        print("CUDA already initialized in proc %i" % os.getpid())
        return
    original_use = cuda.use

    def use_wrapped(device, **kwargs):
        """
        :param device: passed on to the original ``cuda.use``
        :param kwargs: passed on to the original ``cuda.use``
        """
        pid = os.getpid()
        print("CUDA.use %s in proc %i" % (device, pid))
        original_use(device=device, **kwargs)

    # The replacement carries the ``device_number`` attribute as well, reset to None.
    use_wrapped.device_number = None
    cuda.use = use_wrapped
def debug_shell(user_ns=None, user_global_ns=None, exit_afterwards=True):
    """
    Provides some interactive Python shell.
    Uses IPython if possible.
    Wraps to ``better_exchook.debug_shell``.
    Everything from ``DebugHelpers`` is put into the globals of the shell,
    and the module itself is available there as ``debug``.

    :param dict[str]|None user_ns: locals for the shell
    :param dict[str]|None user_global_ns: additional globals for the shell
    :param bool exit_afterwards: will do sys.exit(1) at the end
    """
    print("Debug shell:")
    from Util import ObjAsDict
    import DebugHelpers
    shell_globals = dict(ObjAsDict(DebugHelpers).items())
    if user_global_ns:
        shell_globals.update(user_global_ns)  # may overwrite vars from DebugHelpers
    shell_globals["debug"] = DebugHelpers  # make this available always
    print("Available debug functions/utils (via DebugHelpers):")
    for name, value in sorted(vars(DebugHelpers).items()):
        # Skip private names.
        if not name.startswith("_"):
            print(" %s (%s)" % (name, type(value)))
    print("Also DebugHelpers available as 'debug'.")
    user_ns = user_ns or {}
    if user_ns:
        print("Locals:")
        for name, value in sorted(user_ns.items()):
            print(" %s (%s)" % (name, type(value)))
    import better_exchook
    better_exchook.debug_shell(user_ns, shell_globals)
    if exit_afterwards:
        print("Debug shell exit. Exit now.")
        sys.exit(1)