/*
 * Copyright (C) 2008 The Android Open Source Project
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *  * Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 *  * Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in
 *    the documentation and/or other materials provided with the
 *    distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
 * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
28
Elliott Hughes18a206c2012-10-29 17:37:13 -070029#include "linker.h"
Elliott Hughes18a206c2012-10-29 17:37:13 -070030
Elliott Hughes84114c82013-07-17 13:33:19 -070031#include <errno.h>
Elliott Hughes17e6a982014-04-18 17:39:25 -070032#include <inttypes.h>
Elliott Hughes84114c82013-07-17 13:33:19 -070033#include <signal.h>
The Android Open Source Project1dc9e472009-03-03 19:28:35 -080034#include <stdio.h>
35#include <stdlib.h>
Elliott Hughes84114c82013-07-17 13:33:19 -070036#include <sys/mman.h>
Marco Nelissen3df3e672012-03-07 09:04:18 -080037#include <sys/prctl.h>
The Android Open Source Project1dc9e472009-03-03 19:28:35 -080038#include <sys/socket.h>
David 'Digit' Turner8bff9a32010-06-10 18:29:33 -070039#include <sys/un.h>
Elliott Hughes84114c82013-07-17 13:33:19 -070040#include <unistd.h>
The Android Open Source Project1dc9e472009-03-03 19:28:35 -080041
Elliott Hughes18a206c2012-10-29 17:37:13 -070042extern "C" int tgkill(int tgid, int tid, int sig);
The Android Open Source Project1dc9e472009-03-03 19:28:35 -080043
// Name of the socket used to reach debuggerd. 64-bit (LP64) builds use a
// different name from 32-bit builds.
#if __LP64__
#define DEBUGGER_SOCKET_NAME "android:debuggerd64"
#else
#define DEBUGGER_SOCKET_NAME "android:debuggerd"
#endif
Jeff Brownb7630f02012-06-06 18:37:48 -070049
// Actions that can be requested from debuggerd. The value travels in the
// "action" field of debugger_msg_t.
enum debugger_action_t {
  DEBUGGER_ACTION_CRASH = 0,           // dump a crash
  DEBUGGER_ACTION_DUMP_TOMBSTONE = 1,  // dump a tombstone file
  DEBUGGER_ACTION_DUMP_BACKTRACE = 2,  // dump a backtrace only back to the socket
};
Jeff Brownb7630f02012-06-06 18:37:48 -070058
59/* message sent over the socket */
Elliott Hughes18a206c2012-10-29 17:37:13 -070060struct debugger_msg_t {
Elliott Hughes0d787c12013-04-04 13:46:46 -070061 // version 1 included:
62 debugger_action_t action;
63 pid_t tid;
64
65 // version 2 added:
66 uintptr_t abort_msg_address;
Elliott Hughesb7e289e2014-04-25 16:02:00 -070067
68 // version 3 added:
69 int32_t original_si_code;
Elliott Hughes18a206c2012-10-29 17:37:13 -070070};
David 'Digit' Turner7934a792009-10-16 12:13:34 -070071
// Size of the buffer PR_GET_NAME fills in; see prctl(2), specifically the
// section about PR_GET_NAME.
#define MAX_TASK_NAME_LEN 16
David 'Digit' Turner8bff9a32010-06-10 18:29:33 -070074
/*
 * Connects to a Unix-domain socket in the abstract namespace.
 *
 * name: socket name, without the leading '\0' that marks the abstract namespace.
 * type: socket type passed straight to socket() (e.g. SOCK_STREAM).
 *
 * Returns the connected file descriptor, or -1 on failure. A name that does
 * not fit in sun_path fails with errno set to EINVAL; otherwise errno is
 * whatever socket() or connect() left behind.
 */
static int socket_abstract_client(const char* name, int type) {
  sockaddr_un addr;

  // One byte of sun_path is taken by the *initial* '\0', so the name has to
  // fit in what remains.
  const size_t name_length = strlen(name);
  if (name_length + 1 > sizeof(addr.sun_path)) {
    errno = EINVAL;
    return -1;
  }

  // Zeroing the whole address also provides the leading '\0' that selects the
  // abstract namespace. The name that follows is deliberately *not*
  // '\0'-terminated ("man 7 unix" for the gory details), which is why the
  // exact length is passed to connect().
  memset(&addr, 0, sizeof(addr));
  addr.sun_family = AF_LOCAL;
  memcpy(&addr.sun_path[1], name, name_length);
  const socklen_t addr_length = offsetof(sockaddr_un, sun_path) + 1 + name_length;

  const int fd = socket(AF_LOCAL, type, 0);
  if (fd == -1) {
    return -1;
  }

  if (TEMP_FAILURE_RETRY(connect(fd, reinterpret_cast<sockaddr*>(&addr), addr_length)) == -1) {
    close(fd);
    return -1;
  }

  return fd;
}
110
Andy McFaddenec92af82011-07-29 12:46:34 -0700111/*
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700112 * Writes a summary of the signal to the log file. We do this so that, if
113 * for some reason we're not able to contact debuggerd, there is still some
114 * indication of the failure in the log.
Andy McFaddenec92af82011-07-29 12:46:34 -0700115 *
116 * We could be here as a result of native heap corruption, or while a
117 * mutex is being held, so we don't want to use any libc functions that
118 * could allocate memory or hold a lock.
119 */
Elliott Hughes84114c82013-07-17 13:33:19 -0700120static void log_signal_summary(int signum, const siginfo_t* info) {
Elliott Hughes17e6a982014-04-18 17:39:25 -0700121 const char* signal_name = "???";
122 bool has_address = false;
123 switch (signum) {
124 case SIGILL:
125 signal_name = "SIGILL";
126 has_address = true;
127 break;
128 case SIGABRT:
129 signal_name = "SIGABRT";
130 break;
131 case SIGBUS:
132 signal_name = "SIGBUS";
133 has_address = true;
134 break;
135 case SIGFPE:
136 signal_name = "SIGFPE";
137 has_address = true;
138 break;
139 case SIGSEGV:
140 signal_name = "SIGSEGV";
141 has_address = true;
142 break;
Raghu Gandhamd7daacb2012-07-31 12:07:22 -0700143#if defined(SIGSTKFLT)
Elliott Hughes17e6a982014-04-18 17:39:25 -0700144 case SIGSTKFLT:
145 signal_name = "SIGSTKFLT";
146 break;
Raghu Gandhamd7daacb2012-07-31 12:07:22 -0700147#endif
Elliott Hughes17e6a982014-04-18 17:39:25 -0700148 case SIGPIPE:
149 signal_name = "SIGPIPE";
150 break;
151 }
Andy McFaddenec92af82011-07-29 12:46:34 -0700152
Elliott Hughes17e6a982014-04-18 17:39:25 -0700153 char thread_name[MAX_TASK_NAME_LEN + 1]; // one more for termination
154 if (prctl(PR_GET_NAME, (unsigned long)thread_name, 0, 0, 0) != 0) {
155 strcpy(thread_name, "<name unknown>");
156 } else {
157 // short names are null terminated by prctl, but the man page
158 // implies that 16 byte names are not.
159 thread_name[MAX_TASK_NAME_LEN] = 0;
160 }
Elliott Hughes18a206c2012-10-29 17:37:13 -0700161
Elliott Hughes17e6a982014-04-18 17:39:25 -0700162 // "info" will be NULL if the siginfo_t information was not available.
163 // Many signals don't have an address or a code.
164 char code_desc[32]; // ", code -6"
165 char addr_desc[32]; // ", fault addr 0x1234"
166 addr_desc[0] = code_desc[0] = 0;
167 if (info != NULL) {
168 // For a rethrown signal, this si_code will be right and the one debuggerd shows will
169 // always be SI_TKILL.
170 snprintf(code_desc, sizeof(code_desc), ", code %d", info->si_code);
171 if (has_address) {
172 snprintf(addr_desc, sizeof(addr_desc), ", fault addr %p", info->si_addr);
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700173 }
Elliott Hughes17e6a982014-04-18 17:39:25 -0700174 }
175 __libc_format_log(ANDROID_LOG_FATAL, "libc",
176 "Fatal signal %d (%s)%s%s in tid %d (%s)",
177 signum, signal_name, code_desc, addr_desc, gettid(), thread_name);
Andy McFaddenec92af82011-07-29 12:46:34 -0700178}
179
180/*
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700181 * Returns true if the handler for signal "signum" has SA_SIGINFO set.
182 */
Elliott Hughes84114c82013-07-17 13:33:19 -0700183static bool have_siginfo(int signum) {
Elliott Hughes17e6a982014-04-18 17:39:25 -0700184 struct sigaction old_action, new_action;
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700185
Elliott Hughes17e6a982014-04-18 17:39:25 -0700186 memset(&new_action, 0, sizeof(new_action));
187 new_action.sa_handler = SIG_DFL;
188 new_action.sa_flags = SA_RESTART;
189 sigemptyset(&new_action.sa_mask);
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700190
Elliott Hughes17e6a982014-04-18 17:39:25 -0700191 if (sigaction(signum, &new_action, &old_action) < 0) {
192 __libc_format_log(ANDROID_LOG_WARN, "libc", "Failed testing for SA_SIGINFO: %s",
193 strerror(errno));
194 return false;
195 }
196 bool result = (old_action.sa_flags & SA_SIGINFO) != 0;
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700197
Elliott Hughes17e6a982014-04-18 17:39:25 -0700198 if (sigaction(signum, &old_action, NULL) == -1) {
199 __libc_format_log(ANDROID_LOG_WARN, "libc", "Restore failed in test for SA_SIGINFO: %s",
200 strerror(errno));
201 }
202 return result;
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700203}
204
Elliott Hughesb7e289e2014-04-25 16:02:00 -0700205static void send_debuggerd_packet(siginfo_t* info) {
206 int s = socket_abstract_client(DEBUGGER_SOCKET_NAME, SOCK_STREAM);
207 if (s == -1) {
208 __libc_format_log(ANDROID_LOG_FATAL, "libc", "Unable to open connection to debuggerd: %s",
209 strerror(errno));
210 return;
211 }
212
213 // debuggerd knows our pid from the credentials on the
214 // local socket but we need to tell it the tid of the crashing thread.
215 // debuggerd will be paranoid and verify that we sent a tid
216 // that's actually in our process.
217 debugger_msg_t msg;
218 msg.action = DEBUGGER_ACTION_CRASH;
219 msg.tid = gettid();
220 msg.abort_msg_address = reinterpret_cast<uintptr_t>(gAbortMessage);
221 msg.original_si_code = (info != NULL) ? info->si_code : 0;
222 int ret = TEMP_FAILURE_RETRY(write(s, &msg, sizeof(msg)));
223 if (ret == sizeof(msg)) {
224 char debuggerd_ack;
225 ret = TEMP_FAILURE_RETRY(read(s, &debuggerd_ack, 1));
226 int saved_errno = errno;
227 notify_gdb_of_libraries();
228 errno = saved_errno;
229 } else {
230 // read or write failed -- broken connection?
231 __libc_format_log(ANDROID_LOG_FATAL, "libc", "Failed while talking to debuggerd: %s",
232 strerror(errno));
233 }
234
235 close(s);
236}
237
Andy McFadden1db6f2d2012-10-02 13:53:13 -0700238/*
Andy McFaddenec92af82011-07-29 12:46:34 -0700239 * Catches fatal signals so we can ask debuggerd to ptrace us before
240 * we crash.
241 */
Elliott Hughesb7e289e2014-04-25 16:02:00 -0700242static void debuggerd_signal_handler(int signal_number, siginfo_t* info, void*) {
Elliott Hughes17e6a982014-04-18 17:39:25 -0700243 // It's possible somebody cleared the SA_SIGINFO flag, which would mean
244 // our "info" arg holds an undefined value.
245 if (!have_siginfo(signal_number)) {
246 info = NULL;
247 }
248
249 log_signal_summary(signal_number, info);
250
Elliott Hughesb7e289e2014-04-25 16:02:00 -0700251 send_debuggerd_packet(info);
Andy McFaddenca9a0712012-03-08 11:14:37 -0800252
Elliott Hughes17e6a982014-04-18 17:39:25 -0700253 // Remove our net so we fault for real when we return.
254 signal(signal_number, SIG_DFL);
255
256 // These signals are not re-thrown when we resume. This means that
257 // crashing due to (say) SIGPIPE doesn't work the way you'd expect it
258 // to. We work around this by throwing them manually. We don't want
Elliott Hughesb7e289e2014-04-25 16:02:00 -0700259 // to do this for *all* signals because it'll screw up the si_addr for
260 // faults like SIGSEGV. It does screw up the si_code, which is why we
261 // passed that to debuggerd above.
Elliott Hughes17e6a982014-04-18 17:39:25 -0700262 switch (signal_number) {
263 case SIGABRT:
264 case SIGFPE:
265 case SIGPIPE:
Elliott Hughes4eeb1f12013-10-25 17:38:02 -0700266#if defined(SIGSTKFLT)
Elliott Hughes17e6a982014-04-18 17:39:25 -0700267 case SIGSTKFLT:
Raghu Gandhamd7daacb2012-07-31 12:07:22 -0700268#endif
Elliott Hughes17e6a982014-04-18 17:39:25 -0700269 tgkill(getpid(), gettid(), signal_number);
270 break;
271 default: // SIGILL, SIGBUS, SIGSEGV
272 break;
273 }
The Android Open Source Project1dc9e472009-03-03 19:28:35 -0800274}
275
Elliott Hughesb7e289e2014-04-25 16:02:00 -0700276__LIBC_HIDDEN__ void debuggerd_init() {
Elliott Hughes17e6a982014-04-18 17:39:25 -0700277 struct sigaction action;
278 memset(&action, 0, sizeof(action));
279 sigemptyset(&action.sa_mask);
280 action.sa_sigaction = debuggerd_signal_handler;
281 action.sa_flags = SA_RESTART | SA_SIGINFO;
Andy McFaddenec92af82011-07-29 12:46:34 -0700282
Elliott Hughes17e6a982014-04-18 17:39:25 -0700283 // Use the alternate signal stack if available so we can catch stack overflows.
284 action.sa_flags |= SA_ONSTACK;
Elliott Hughes84114c82013-07-17 13:33:19 -0700285
Elliott Hughes17e6a982014-04-18 17:39:25 -0700286 sigaction(SIGABRT, &action, NULL);
287 sigaction(SIGBUS, &action, NULL);
288 sigaction(SIGFPE, &action, NULL);
289 sigaction(SIGILL, &action, NULL);
290 sigaction(SIGPIPE, &action, NULL);
291 sigaction(SIGSEGV, &action, NULL);
Raghu Gandhamd7daacb2012-07-31 12:07:22 -0700292#if defined(SIGSTKFLT)
Elliott Hughes17e6a982014-04-18 17:39:25 -0700293 sigaction(SIGSTKFLT, &action, NULL);
Raghu Gandhamd7daacb2012-07-31 12:07:22 -0700294#endif
Elliott Hughes17e6a982014-04-18 17:39:25 -0700295 sigaction(SIGTRAP, &action, NULL);
The Android Open Source Project1dc9e472009-03-03 19:28:35 -0800296}