2009-03-03 19:28:35 -08:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2008 The Android Open Source Project
|
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
|
|
|
* * Redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer.
|
|
|
|
* * Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in
|
|
|
|
* the documentation and/or other materials provided with the
|
|
|
|
* distribution.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
|
|
|
|
* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
|
|
|
|
* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
|
|
|
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
|
|
|
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
|
|
|
|
* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
|
|
|
|
* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
|
|
|
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
|
|
|
|
* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
|
|
* SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
2012-10-29 17:37:13 -07:00
|
|
|
#include "linker.h"
|
|
|
|
|
2013-07-17 13:33:19 -07:00
|
|
|
#include <errno.h>
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
#include <inttypes.h>
|
2015-01-28 16:13:56 -08:00
|
|
|
#include <pthread.h>
|
2013-07-17 13:33:19 -07:00
|
|
|
#include <signal.h>
|
2009-03-03 19:28:35 -08:00
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
2015-01-28 16:13:56 -08:00
|
|
|
#include <string.h>
|
2013-07-17 13:33:19 -07:00
|
|
|
#include <sys/mman.h>
|
2012-03-07 09:04:18 -08:00
|
|
|
#include <sys/prctl.h>
|
2009-03-03 19:28:35 -08:00
|
|
|
#include <sys/socket.h>
|
2010-06-10 18:29:33 -07:00
|
|
|
#include <sys/un.h>
|
2013-07-17 13:33:19 -07:00
|
|
|
#include <unistd.h>
|
2009-03-03 19:28:35 -08:00
|
|
|
|
2012-10-29 17:37:13 -07:00
|
|
|
extern "C" int tgkill(int tgid, int tid, int sig);
|
2009-03-03 19:28:35 -08:00
|
|
|
|
2015-01-19 11:16:52 -08:00
|
|
|
// Crash actions have to be sent to the proper debuggerd.
|
|
|
|
// On 64 bit systems, the 32 bit debuggerd is named differently.
|
|
|
|
#if defined(TARGET_IS_64_BIT) && !defined(__LP64__)
|
|
|
|
#define DEBUGGER_SOCKET_NAME "android:debuggerd32"
|
2014-01-31 16:56:39 -08:00
|
|
|
#else
|
2012-06-06 18:37:48 -07:00
|
|
|
#define DEBUGGER_SOCKET_NAME "android:debuggerd"
|
2014-01-31 16:56:39 -08:00
|
|
|
#endif
|
2012-06-06 18:37:48 -07:00
|
|
|
|
2012-10-29 17:37:13 -07:00
|
|
|
enum debugger_action_t {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
// dump a crash
|
|
|
|
DEBUGGER_ACTION_CRASH,
|
|
|
|
// dump a tombstone file
|
|
|
|
DEBUGGER_ACTION_DUMP_TOMBSTONE,
|
|
|
|
// dump a backtrace only back to the socket
|
|
|
|
DEBUGGER_ACTION_DUMP_BACKTRACE,
|
2012-10-29 17:37:13 -07:00
|
|
|
};
|
2012-06-06 18:37:48 -07:00
|
|
|
|
|
|
|
/* message sent over the socket */
|
2015-01-19 11:16:52 -08:00
|
|
|
struct __attribute__((packed)) debugger_msg_t {
|
|
|
|
int32_t action;
|
2013-04-04 13:46:46 -07:00
|
|
|
pid_t tid;
|
2015-01-19 11:16:52 -08:00
|
|
|
uint64_t abort_msg_address;
|
2014-04-25 16:02:00 -07:00
|
|
|
int32_t original_si_code;
|
2012-10-29 17:37:13 -07:00
|
|
|
};
|
2009-10-16 12:13:34 -07:00
|
|
|
|
2012-03-07 09:04:18 -08:00
|
|
|
// see man(2) prctl, specifically the section about PR_GET_NAME
|
|
|
|
#define MAX_TASK_NAME_LEN (16)
|
2010-06-10 18:29:33 -07:00
|
|
|
|
2012-10-29 17:37:13 -07:00
|
|
|
static int socket_abstract_client(const char* name, int type) {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
sockaddr_un addr;
|
|
|
|
|
|
|
|
// Test with length +1 for the *initial* '\0'.
|
|
|
|
size_t namelen = strlen(name);
|
|
|
|
if ((namelen + 1) > sizeof(addr.sun_path)) {
|
|
|
|
errno = EINVAL;
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
// This is used for abstract socket namespace, we need
|
|
|
|
// an initial '\0' at the start of the Unix socket path.
|
|
|
|
//
|
|
|
|
// Note: The path in this case is *not* supposed to be
|
|
|
|
// '\0'-terminated. ("man 7 unix" for the gory details.)
|
|
|
|
memset(&addr, 0, sizeof(addr));
|
|
|
|
addr.sun_family = AF_LOCAL;
|
|
|
|
addr.sun_path[0] = 0;
|
|
|
|
memcpy(addr.sun_path + 1, name, namelen);
|
|
|
|
|
|
|
|
socklen_t alen = namelen + offsetof(sockaddr_un, sun_path) + 1;
|
|
|
|
|
|
|
|
int s = socket(AF_LOCAL, type, 0);
|
|
|
|
if (s == -1) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
int rc = TEMP_FAILURE_RETRY(connect(s, reinterpret_cast<sockaddr*>(&addr), alen));
|
|
|
|
if (rc == -1) {
|
|
|
|
close(s);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return s;
|
2010-06-10 18:29:33 -07:00
|
|
|
}
|
|
|
|
|
2011-07-29 12:46:34 -07:00
|
|
|
/*
|
2012-10-02 13:53:13 -07:00
|
|
|
* Writes a summary of the signal to the log file. We do this so that, if
|
|
|
|
* for some reason we're not able to contact debuggerd, there is still some
|
|
|
|
* indication of the failure in the log.
|
2011-07-29 12:46:34 -07:00
|
|
|
*
|
|
|
|
* We could be here as a result of native heap corruption, or while a
|
|
|
|
* mutex is being held, so we don't want to use any libc functions that
|
|
|
|
* could allocate memory or hold a lock.
|
|
|
|
*/
|
2013-07-17 13:33:19 -07:00
|
|
|
static void log_signal_summary(int signum, const siginfo_t* info) {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
const char* signal_name = "???";
|
|
|
|
bool has_address = false;
|
|
|
|
switch (signum) {
|
|
|
|
case SIGABRT:
|
|
|
|
signal_name = "SIGABRT";
|
|
|
|
break;
|
|
|
|
case SIGBUS:
|
|
|
|
signal_name = "SIGBUS";
|
|
|
|
has_address = true;
|
|
|
|
break;
|
|
|
|
case SIGFPE:
|
|
|
|
signal_name = "SIGFPE";
|
|
|
|
has_address = true;
|
|
|
|
break;
|
2014-05-16 16:59:54 -07:00
|
|
|
case SIGILL:
|
|
|
|
signal_name = "SIGILL";
|
|
|
|
has_address = true;
|
|
|
|
break;
|
|
|
|
case SIGPIPE:
|
|
|
|
signal_name = "SIGPIPE";
|
|
|
|
break;
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
case SIGSEGV:
|
|
|
|
signal_name = "SIGSEGV";
|
|
|
|
has_address = true;
|
|
|
|
break;
|
2012-07-31 12:07:22 -07:00
|
|
|
#if defined(SIGSTKFLT)
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
case SIGSTKFLT:
|
|
|
|
signal_name = "SIGSTKFLT";
|
|
|
|
break;
|
2012-07-31 12:07:22 -07:00
|
|
|
#endif
|
2014-05-16 16:59:54 -07:00
|
|
|
case SIGTRAP:
|
|
|
|
signal_name = "SIGTRAP";
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
char thread_name[MAX_TASK_NAME_LEN + 1]; // one more for termination
|
2015-01-22 16:04:25 -08:00
|
|
|
if (prctl(PR_GET_NAME, reinterpret_cast<unsigned long>(thread_name), 0, 0, 0) != 0) {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
strcpy(thread_name, "<name unknown>");
|
|
|
|
} else {
|
|
|
|
// short names are null terminated by prctl, but the man page
|
|
|
|
// implies that 16 byte names are not.
|
|
|
|
thread_name[MAX_TASK_NAME_LEN] = 0;
|
|
|
|
}
|
|
|
|
|
2014-08-29 12:02:36 -07:00
|
|
|
// "info" will be null if the siginfo_t information was not available.
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
// Many signals don't have an address or a code.
|
|
|
|
char code_desc[32]; // ", code -6"
|
|
|
|
char addr_desc[32]; // ", fault addr 0x1234"
|
|
|
|
addr_desc[0] = code_desc[0] = 0;
|
2014-08-29 12:02:36 -07:00
|
|
|
if (info != nullptr) {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
// For a rethrown signal, this si_code will be right and the one debuggerd shows will
|
|
|
|
// always be SI_TKILL.
|
2014-08-26 20:48:11 -07:00
|
|
|
__libc_format_buffer(code_desc, sizeof(code_desc), ", code %d", info->si_code);
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
if (has_address) {
|
2014-08-26 20:48:11 -07:00
|
|
|
__libc_format_buffer(addr_desc, sizeof(addr_desc), ", fault addr %p", info->si_addr);
|
2012-10-02 13:53:13 -07:00
|
|
|
}
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
}
|
|
|
|
__libc_format_log(ANDROID_LOG_FATAL, "libc",
|
|
|
|
"Fatal signal %d (%s)%s%s in tid %d (%s)",
|
|
|
|
signum, signal_name, code_desc, addr_desc, gettid(), thread_name);
|
2011-07-29 12:46:34 -07:00
|
|
|
}
|
|
|
|
|
2012-10-02 13:53:13 -07:00
|
|
|
/*
|
|
|
|
* Returns true if the handler for signal "signum" has SA_SIGINFO set.
|
|
|
|
*/
|
2013-07-17 13:33:19 -07:00
|
|
|
static bool have_siginfo(int signum) {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
struct sigaction old_action, new_action;
|
|
|
|
|
|
|
|
memset(&new_action, 0, sizeof(new_action));
|
|
|
|
new_action.sa_handler = SIG_DFL;
|
|
|
|
new_action.sa_flags = SA_RESTART;
|
|
|
|
sigemptyset(&new_action.sa_mask);
|
|
|
|
|
|
|
|
if (sigaction(signum, &new_action, &old_action) < 0) {
|
|
|
|
__libc_format_log(ANDROID_LOG_WARN, "libc", "Failed testing for SA_SIGINFO: %s",
|
|
|
|
strerror(errno));
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
bool result = (old_action.sa_flags & SA_SIGINFO) != 0;
|
|
|
|
|
2014-08-29 12:02:36 -07:00
|
|
|
if (sigaction(signum, &old_action, nullptr) == -1) {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
__libc_format_log(ANDROID_LOG_WARN, "libc", "Restore failed in test for SA_SIGINFO: %s",
|
|
|
|
strerror(errno));
|
|
|
|
}
|
|
|
|
return result;
|
2012-10-02 13:53:13 -07:00
|
|
|
}
|
|
|
|
|
2014-04-25 16:02:00 -07:00
|
|
|
static void send_debuggerd_packet(siginfo_t* info) {
|
2014-07-23 13:56:23 -07:00
|
|
|
if (prctl(PR_GET_DUMPABLE, 0, 0, 0, 0) == 0) {
|
|
|
|
// process has disabled core dumps and PTRACE_ATTACH, and does not want to be dumped.
|
|
|
|
// Honor that intention by not connecting to debuggerd and asking it
|
|
|
|
// to dump our internal state.
|
|
|
|
__libc_format_log(ANDROID_LOG_INFO, "libc",
|
|
|
|
"Suppressing debuggerd output because prctl(PR_GET_DUMPABLE)==0");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2015-01-28 16:13:56 -08:00
|
|
|
// Mutex to prevent multiple crashing threads from trying to talk
|
|
|
|
// to debuggerd at the same time.
|
|
|
|
static pthread_mutex_t crash_mutex = PTHREAD_MUTEX_INITIALIZER;
|
|
|
|
int ret = pthread_mutex_trylock(&crash_mutex);
|
|
|
|
if (ret != 0) {
|
|
|
|
if (ret == EBUSY) {
|
|
|
|
__libc_format_log(ANDROID_LOG_INFO, "libc",
|
|
|
|
"Another thread has contacted debuggerd first, stop and wait for process to die.");
|
|
|
|
// This will never complete since the lock is never released.
|
|
|
|
pthread_mutex_lock(&crash_mutex);
|
|
|
|
} else {
|
|
|
|
__libc_format_log(ANDROID_LOG_INFO, "libc",
|
|
|
|
"pthread_mutex_trylock failed: %s", strerror(ret));
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2014-09-22 17:43:09 -07:00
|
|
|
int s = socket_abstract_client(DEBUGGER_SOCKET_NAME, SOCK_STREAM | SOCK_CLOEXEC);
|
2014-04-25 16:02:00 -07:00
|
|
|
if (s == -1) {
|
|
|
|
__libc_format_log(ANDROID_LOG_FATAL, "libc", "Unable to open connection to debuggerd: %s",
|
|
|
|
strerror(errno));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// debuggerd knows our pid from the credentials on the
|
|
|
|
// local socket but we need to tell it the tid of the crashing thread.
|
|
|
|
// debuggerd will be paranoid and verify that we sent a tid
|
|
|
|
// that's actually in our process.
|
|
|
|
debugger_msg_t msg;
|
|
|
|
msg.action = DEBUGGER_ACTION_CRASH;
|
|
|
|
msg.tid = gettid();
|
2014-05-14 10:02:03 -07:00
|
|
|
msg.abort_msg_address = reinterpret_cast<uintptr_t>(g_abort_message);
|
2014-08-29 12:02:36 -07:00
|
|
|
msg.original_si_code = (info != nullptr) ? info->si_code : 0;
|
2015-01-28 16:13:56 -08:00
|
|
|
ret = TEMP_FAILURE_RETRY(write(s, &msg, sizeof(msg)));
|
2014-04-25 16:02:00 -07:00
|
|
|
if (ret == sizeof(msg)) {
|
|
|
|
char debuggerd_ack;
|
|
|
|
ret = TEMP_FAILURE_RETRY(read(s, &debuggerd_ack, 1));
|
|
|
|
int saved_errno = errno;
|
|
|
|
notify_gdb_of_libraries();
|
|
|
|
errno = saved_errno;
|
|
|
|
} else {
|
|
|
|
// read or write failed -- broken connection?
|
|
|
|
__libc_format_log(ANDROID_LOG_FATAL, "libc", "Failed while talking to debuggerd: %s",
|
|
|
|
strerror(errno));
|
|
|
|
}
|
|
|
|
|
|
|
|
close(s);
|
|
|
|
}
|
|
|
|
|
2011-07-29 12:46:34 -07:00
|
|
|
/*
|
|
|
|
* Catches fatal signals so we can ask debuggerd to ptrace us before
|
|
|
|
* we crash.
|
|
|
|
*/
|
2014-04-25 16:02:00 -07:00
|
|
|
static void debuggerd_signal_handler(int signal_number, siginfo_t* info, void*) {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
// It's possible somebody cleared the SA_SIGINFO flag, which would mean
|
|
|
|
// our "info" arg holds an undefined value.
|
|
|
|
if (!have_siginfo(signal_number)) {
|
2014-08-29 12:02:36 -07:00
|
|
|
info = nullptr;
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
log_signal_summary(signal_number, info);
|
|
|
|
|
2014-04-25 16:02:00 -07:00
|
|
|
send_debuggerd_packet(info);
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
|
|
|
|
// Remove our net so we fault for real when we return.
|
|
|
|
signal(signal_number, SIG_DFL);
|
|
|
|
|
|
|
|
// These signals are not re-thrown when we resume. This means that
|
|
|
|
// crashing due to (say) SIGPIPE doesn't work the way you'd expect it
|
|
|
|
// to. We work around this by throwing them manually. We don't want
|
2014-04-25 16:02:00 -07:00
|
|
|
// to do this for *all* signals because it'll screw up the si_addr for
|
|
|
|
// faults like SIGSEGV. It does screw up the si_code, which is why we
|
|
|
|
// passed that to debuggerd above.
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
switch (signal_number) {
|
|
|
|
case SIGABRT:
|
|
|
|
case SIGFPE:
|
|
|
|
case SIGPIPE:
|
2013-10-25 17:38:02 -07:00
|
|
|
#if defined(SIGSTKFLT)
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
case SIGSTKFLT:
|
2012-07-31 12:07:22 -07:00
|
|
|
#endif
|
2014-05-16 17:34:13 -07:00
|
|
|
case SIGTRAP:
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
tgkill(getpid(), gettid(), signal_number);
|
|
|
|
break;
|
|
|
|
default: // SIGILL, SIGBUS, SIGSEGV
|
|
|
|
break;
|
|
|
|
}
|
2009-03-03 19:28:35 -08:00
|
|
|
}
|
|
|
|
|
2014-04-25 16:02:00 -07:00
|
|
|
__LIBC_HIDDEN__ void debuggerd_init() {
|
Make libc signal handler output more like debuggerd.
This has been annoying me for a while, because it's often quite misleading.
Today, for example, I saw:
Fatal signal 13 (SIGPIPE) at 0x6573 (code=0), thread 25971 (top)
where the apparent address is actually the pid of the signal source (in this
case the kernel on behalf of the thread itself).
This patch isn't as fancy as strace, but it at least means we never say
anything misleading. We could decode the si_code field like strace and
debuggerd, but I'm reluctant to do that without some way to share the code
between at least bionic and debuggerd.
Examples after:
Fatal signal 13 (SIGPIPE), code 0 in tid 9157 (top)
Fatal signal 11 (SIGSEGV), code 1, fault addr 0x0 in tid 9142 (crasher64)
Fatal signal 6 (SIGABRT), code -6 in tid 9132 (crasher64)
(Note that the code still shows as 0 for SIGPIPE in the signal handler itself
but as -6 (SI_TKILL) in debuggerd; this is actually correct --- debuggerd is
showing the re-raised signal sent at the end of the signal handler that
initially showed the correct code 0.)
Change-Id: I71cad4ab61f422a4f6687a60ac770371790278e0
2014-04-18 17:39:25 -07:00
|
|
|
struct sigaction action;
|
|
|
|
memset(&action, 0, sizeof(action));
|
|
|
|
sigemptyset(&action.sa_mask);
|
|
|
|
action.sa_sigaction = debuggerd_signal_handler;
|
|
|
|
action.sa_flags = SA_RESTART | SA_SIGINFO;
|
|
|
|
|
|
|
|
// Use the alternate signal stack if available so we can catch stack overflows.
|
|
|
|
action.sa_flags |= SA_ONSTACK;
|
|
|
|
|
2014-08-29 12:02:36 -07:00
|
|
|
sigaction(SIGABRT, &action, nullptr);
|
|
|
|
sigaction(SIGBUS, &action, nullptr);
|
|
|
|
sigaction(SIGFPE, &action, nullptr);
|
|
|
|
sigaction(SIGILL, &action, nullptr);
|
|
|
|
sigaction(SIGPIPE, &action, nullptr);
|
|
|
|
sigaction(SIGSEGV, &action, nullptr);
|
2012-07-31 12:07:22 -07:00
|
|
|
#if defined(SIGSTKFLT)
|
2014-08-29 12:02:36 -07:00
|
|
|
sigaction(SIGSTKFLT, &action, nullptr);
|
2012-07-31 12:07:22 -07:00
|
|
|
#endif
|
2014-08-29 12:02:36 -07:00
|
|
|
sigaction(SIGTRAP, &action, nullptr);
|
2009-03-03 19:28:35 -08:00
|
|
|
}
|