mirror of
https://sourceware.org/git/binutils-gdb.git
synced 2025-01-18 12:24:38 +08:00
980548fd88
I ran into a GDB crash in gdb.base/bp-cmds-continue-ctrl-c.exp in my
multi-target branch, which turns out exposed a bug that exists in
master too.
That testcase has a breakpoint with a "continue" command associated.
Then the breakpoint is constantly being hit. At the same time, the
testcase is continualy interrupting the program with Ctrl-C, and
re-resuming it, in a loop.
Running that testcase manually under Valgrind, after a few sequences
of 'Ctrl-C' + 'continue', I got:
Breakpoint 1, Quit
(gdb) ==21270== Invalid read of size 8
==21270== at 0x4D8185: pyuw_this_id(frame_info*, void**, frame_id*) (py-unwind.c:461)
==21270== by 0x6D426A: compute_frame_id(frame_info*) (frame.c:505)
==21270== by 0x6D43B7: get_frame_id(frame_info*) (frame.c:537)
==21270== by 0x84F3B8: scoped_restore_current_thread::scoped_restore_current_thread() (thread.c:1678)
==21270== by 0x718E3D: fetch_inferior_event(void*) (infrun.c:4076)
==21270== by 0x7067C9: inferior_event_handler(inferior_event_type, void*) (inf-loop.c:43)
==21270== by 0x45BEF9: handle_target_event(int, void*) (linux-nat.c:4419)
==21270== by 0x6C4255: handle_file_event(file_handler*, int) (event-loop.c:733)
==21270== by 0x6C47F8: gdb_wait_for_event(int) (event-loop.c:859)
==21270== by 0x6C3666: gdb_do_one_event() (event-loop.c:322)
==21270== by 0x6C3712: start_event_loop() (event-loop.c:371)
==21270== by 0x746801: captured_command_loop() (main.c:329)
==21270== Address 0x0 is not stack'd, malloc'd or (recently) free'd
==21270==
==21270==
==21270== Process terminating with default action of signal 11 (SIGSEGV): dumping core
==21270== Access not within mapped region at address 0x0
==21270== at 0x4D8185: pyuw_this_id(frame_info*, void**, frame_id*) (py-unwind.c:461)
==21270== by 0x6D426A: compute_frame_id(frame_info*) (frame.c:505)
==21270== by 0x6D43B7: get_frame_id(frame_info*) (frame.c:537)
==21270== by 0x84F3B8: scoped_restore_current_thread::scoped_restore_current_thread() (thread.c:1678)
==21270== by 0x718E3D: fetch_inferior_event(void*) (infrun.c:4076)
==21270== by 0x7067C9: inferior_event_handler(inferior_event_type, void*) (inf-loop.c:43)
==21270== by 0x45BEF9: handle_target_event(int, void*) (linux-nat.c:4419)
==21270== by 0x6C4255: handle_file_event(file_handler*, int) (event-loop.c:733)
==21270== by 0x6C47F8: gdb_wait_for_event(int) (event-loop.c:859)
==21270== by 0x6C3666: gdb_do_one_event() (event-loop.c:322)
==21270== by 0x6C3712: start_event_loop() (event-loop.c:371)
==21270== by 0x746801: captured_command_loop() (main.c:329)
==21270== If you believe this happened as a result of a stack
==21270== overflow in your program's main thread (unlikely but
==21270== possible), you can try to increase the size of the
==21270== main thread stack using the --main-stacksize= flag.
==21270== The main thread stack size used in this run was 8388608.
==21270==
Above, when we get to compute_frame_id, fi->unwind is non-NULL,
meaning, we found an unwinder, in this case the Python unwinder, but
somehow, fi->prologue_cache is left NULL. pyuw_this_id then crashes
because it assumes fi->prologue_cache is non-NULL:
static void
pyuw_this_id (struct frame_info *this_frame, void **cache_ptr,
struct frame_id *this_id)
{
*this_id = ((cached_frame_info *) *cache_ptr)->frame_id;
^^^^^^^^^^
'*cache_ptr' here is 'fi->prologue_cache'.
There's a quit() call in pyuw_sniffer that I believe is the one that
sometimes triggers the crash above. The crash can be reproduced
easily with this hack to force a quit out of the python unwinder:
--- a/gdb/python/py-unwind.c
+++ b/gdb/python/py-unwind.c
@@ -497,6 +497,8 @@ pyuw_sniffer (const struct frame_unwind *self, struct frame_info *this_frame,
struct gdbarch *gdbarch = (struct gdbarch *) (self->unwind_data);
cached_frame_info *cached_frame;
+ quit ();
+
gdbpy_enter enter_py (gdbarch, current_language);
TRACE_PY_UNWIND (3, "%s (SP=%s, PC=%s)\n", __FUNCTION__,
After that quit is thrown, any subsequent operation that involves
unwinding results in GDB crashing with SIGSEGV like above.
The problem is that this commit:
commit 30a9c02fef
CommitDate: Sun Oct 8 23:16:42 2017 -0600
Subject: Remove cleanup from frame_prepare_for_sniffer
missed that we need to call frame_cleanup_after_sniffer before
rethrowing the exception too.
Without the fix, the "bt" added to
gdb.base/bp-cmds-continue-ctrl-c.exp in this commit makes GDB crash:
Running src/gdb/testsuite/gdb.base/bp-cmds-continue-ctrl-c.exp ...
ERROR: Process no longer exists
gdb/ChangeLog:
2018-02-14 Pedro Alves <palves@redhat.com>
* frame-unwind.c (frame_unwind_try_unwinder): Always call
frame_cleanup_after_sniffer on exception.
gdb/testsuite/ChangeLog:
2018-02-14 Pedro Alves <palves@redhat.com>
* gdb.base/bp-cmds-continue-ctrl-c.exp (do_test): Test "bt" after
getting a "Quit".
150 lines
4.0 KiB
Plaintext
150 lines
4.0 KiB
Plaintext
# Copyright 2017-2018 Free Software Foundation, Inc.
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation; either version 3 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
# Set a breakpoint with a "continue" command attached, let the
|
|
# inferior hit the breakpoint continuously. Check that we can use ^C
|
|
# to interrupt the command, and that if ^C is pressed while GDB has
|
|
# the terminal (between the stop and the re-resume), the resulting
|
|
# "Quit" doesn't mess up the debug session.
|
|
|
|
if [target_info exists gdb,nosignals] {
|
|
verbose "Skipping because of nosignals."
|
|
continue
|
|
}
|
|
|
|
# This test requires sending ^C to interrupt the running target.
|
|
if [target_info exists gdb,nointerrupts] {
|
|
verbose "Skipping because of nointerrupts."
|
|
return
|
|
}
|
|
|
|
standard_testfile
|
|
|
|
if {[prepare_for_testing "failed to prepare" $testfile $srcfile debug]} {
|
|
return -1
|
|
}
|
|
|
|
# See intro.
|
|
|
|
proc do_test {} {
|
|
global srcfile binfile
|
|
global gdb_prompt
|
|
|
|
gdb_test "break foo" "Breakpoint .*" "set breakpoint"
|
|
|
|
gdb_test \
|
|
[multi_line_input \
|
|
{commands} \
|
|
{ c} \
|
|
{end}] \
|
|
"" "commands"
|
|
|
|
set test "stop with control-c"
|
|
|
|
for {set iter 0} {$iter < 20} {incr iter} {
|
|
|
|
# Useful for debugging.
|
|
#send_user "iter: $iter\n"
|
|
|
|
# Consume one breakpoint hit (at least), to make sure that the
|
|
# continue actually continues between attempts, as opposed to
|
|
# "c" not actually resuming and then Ctrl-C managing to
|
|
# interrupt anyway.
|
|
if {[gdb_test_multiple "continue" "$test (continue)" {
|
|
-re "Continuing.*Breakpoint \[^\r\n\]*\r\n" {
|
|
}
|
|
}] != 0} {
|
|
return
|
|
}
|
|
|
|
set internal_pass "IPASS: $test (iter $iter)"
|
|
|
|
# Breakpoint commands run after the target is considered
|
|
# stopped, and thus run with GDB owning the terminal. That
|
|
# means that it is expected that a Ctrl-C that arrives between
|
|
# - GDB reporting the breakpoint hit, and,
|
|
# - the breakpoint command continuing the target
|
|
# results in a Quit.
|
|
|
|
after 200 {send_gdb "\003"}
|
|
if {[gdb_test_multiple "" "$test (unexpected)" {
|
|
-re "Program terminated with signal SIGALRM.*\r\n$gdb_prompt $" {
|
|
fail "$test (SIGALRM)"
|
|
return
|
|
}
|
|
-re "Program received signal SIGINT.*\r\n$gdb_prompt $" {
|
|
send_log "$internal_pass (SIGINT)\n"
|
|
}
|
|
-re "Quit\r\n$gdb_prompt $" {
|
|
send_log "$internal_pass (Quit)\n"
|
|
|
|
# Check that if we managed to quit somewhere deep in
|
|
# the unwinders, we can still unwind again.
|
|
set ok 0
|
|
gdb_test_multiple "bt" "$internal_pass (bt)" {
|
|
-re "#0.*$gdb_prompt $" {
|
|
send_log "$internal_pass (bt)\n"
|
|
set ok 1
|
|
}
|
|
}
|
|
if {!$ok} {
|
|
return
|
|
}
|
|
}
|
|
-re "Quit\r\n\r\nCommand aborted.\r\n$gdb_prompt $" {
|
|
send_log "$internal_pass (Command aborted)\n"
|
|
}
|
|
-re "Breakpoint \[^\r\n\]*$srcfile" {
|
|
exp_continue
|
|
}
|
|
}] != 0} {
|
|
break
|
|
}
|
|
}
|
|
|
|
gdb_assert {$iter == 20} "stop with control-c"
|
|
}
|
|
|
|
# With native debugging and "run" (with job control), if the inferior
|
|
# is running, the Ctrl-C reaches the inferior directly, not GDB. With
|
|
# native debugging and "attach", or with remote debugging, the Ctrl-C
|
|
# reaches GDB first. So for completeness, try both "run" and
|
|
# "attach".
|
|
|
|
with_test_prefix "run" {
|
|
clean_restart $binfile
|
|
|
|
if {![runto_main]} {
|
|
return -1
|
|
}
|
|
|
|
do_test
|
|
}
|
|
|
|
with_test_prefix "attach" {
|
|
if {[can_spawn_for_attach]} {
|
|
clean_restart $binfile
|
|
|
|
set test_spawn_id [spawn_wait_for_attach $binfile]
|
|
set testpid [spawn_id_get_pid $test_spawn_id]
|
|
|
|
gdb_test "attach $testpid" "Attaching to.*process $testpid.*" "attach"
|
|
|
|
do_test
|
|
|
|
kill_wait_spawned_process $test_spawn_id
|
|
}
|
|
}
|