blob: 33a07ad973dcf6495fef7a79d1aab55082cb0afc [file] [log] [blame]
Elliott Hughes11e45072011-08-16 17:40:46 -07001// Copyright 2011 Google Inc. All Rights Reserved.
2// Author: enh@google.com (Elliott Hughes)
3
Elliott Hughes42ee1422011-09-06 12:33:32 -07004#include "utils.h"
5
Elliott Hughes92b3b562011-09-08 16:32:26 -07006#include <pthread.h>
Elliott Hughes42ee1422011-09-06 12:33:32 -07007#include <sys/syscall.h>
8#include <sys/types.h>
9#include <unistd.h>
10
Elliott Hughes90a33692011-08-30 13:27:07 -070011#include "UniquePtr.h"
buzbeec143c552011-08-20 17:38:58 -070012#include "file.h"
Elliott Hughes11e45072011-08-16 17:40:46 -070013#include "object.h"
buzbeec143c552011-08-20 17:38:58 -070014#include "os.h"
Elliott Hughes11e45072011-08-16 17:40:46 -070015
Elliott Hughesdcc24742011-09-07 14:02:44 -070016#if defined(HAVE_PRCTL)
17#include <sys/prctl.h>
18#endif
19
Elliott Hughes11e45072011-08-16 17:40:46 -070020namespace art {
21
Elliott Hughesd92bec42011-09-02 17:04:36 -070022bool ReadFileToString(const std::string& file_name, std::string* result) {
23 UniquePtr<File> file(OS::OpenFile(file_name.c_str(), false));
24 if (file.get() == NULL) {
25 return false;
26 }
buzbeec143c552011-08-20 17:38:58 -070027
buzbeec143c552011-08-20 17:38:58 -070028 char buf[8 * KB];
29 while (true) {
30 int64_t n = file->Read(buf, sizeof(buf));
Elliott Hughesd92bec42011-09-02 17:04:36 -070031 if (n == -1) {
32 return false;
buzbeec143c552011-08-20 17:38:58 -070033 }
Elliott Hughesd92bec42011-09-02 17:04:36 -070034 if (n == 0) {
35 return true;
36 }
37 result->append(buf, n);
buzbeec143c552011-08-20 17:38:58 -070038 }
buzbeec143c552011-08-20 17:38:58 -070039}
40
Elliott Hughese27955c2011-08-26 15:21:24 -070041std::string GetIsoDate() {
42 time_t now = time(NULL);
43 struct tm tmbuf;
44 struct tm* ptm = localtime_r(&now, &tmbuf);
45 return StringPrintf("%04d-%02d-%02d %02d:%02d:%02d",
46 ptm->tm_year + 1900, ptm->tm_mon+1, ptm->tm_mday,
47 ptm->tm_hour, ptm->tm_min, ptm->tm_sec);
48}
49
Elliott Hughes5174fe62011-08-23 15:12:35 -070050std::string PrettyDescriptor(const String* java_descriptor) {
51 std::string descriptor(java_descriptor->ToModifiedUtf8());
52
Elliott Hughes11e45072011-08-16 17:40:46 -070053 // Count the number of '['s to get the dimensionality.
Elliott Hughes5174fe62011-08-23 15:12:35 -070054 const char* c = descriptor.c_str();
Elliott Hughes11e45072011-08-16 17:40:46 -070055 size_t dim = 0;
56 while (*c == '[') {
57 dim++;
58 c++;
59 }
60
61 // Reference or primitive?
62 if (*c == 'L') {
63 // "[[La/b/C;" -> "a.b.C[][]".
64 c++; // Skip the 'L'.
65 } else {
66 // "[[B" -> "byte[][]".
67 // To make life easier, we make primitives look like unqualified
68 // reference types.
69 switch (*c) {
70 case 'B': c = "byte;"; break;
71 case 'C': c = "char;"; break;
72 case 'D': c = "double;"; break;
73 case 'F': c = "float;"; break;
74 case 'I': c = "int;"; break;
75 case 'J': c = "long;"; break;
76 case 'S': c = "short;"; break;
77 case 'Z': c = "boolean;"; break;
Elliott Hughes5174fe62011-08-23 15:12:35 -070078 default: return descriptor;
Elliott Hughes11e45072011-08-16 17:40:46 -070079 }
80 }
81
82 // At this point, 'c' is a string of the form "fully/qualified/Type;"
83 // or "primitive;". Rewrite the type with '.' instead of '/':
84 std::string result;
85 const char* p = c;
86 while (*p != ';') {
87 char ch = *p++;
88 if (ch == '/') {
89 ch = '.';
90 }
91 result.push_back(ch);
92 }
93 // ...and replace the semicolon with 'dim' "[]" pairs:
94 while (dim--) {
95 result += "[]";
96 }
97 return result;
98}
99
Elliott Hughes54e7df12011-09-16 11:47:04 -0700100std::string PrettyField(const Field* f, bool with_type) {
Elliott Hughesa2501992011-08-26 19:39:54 -0700101 if (f == NULL) {
102 return "null";
103 }
Elliott Hughes54e7df12011-09-16 11:47:04 -0700104 std::string result;
105 if (with_type) {
106 result += PrettyDescriptor(f->GetType()->GetDescriptor());
107 result += ' ';
108 }
109 result += PrettyDescriptor(f->GetDeclaringClass()->GetDescriptor());
Elliott Hughesa2501992011-08-26 19:39:54 -0700110 result += '.';
111 result += f->GetName()->ToModifiedUtf8();
112 return result;
113}
114
Elliott Hughesa0b8feb2011-08-20 09:50:55 -0700115std::string PrettyMethod(const Method* m, bool with_signature) {
116 if (m == NULL) {
117 return "null";
118 }
119 Class* c = m->GetDeclaringClass();
Elliott Hughes5174fe62011-08-23 15:12:35 -0700120 std::string result(PrettyDescriptor(c->GetDescriptor()));
Elliott Hughesa0b8feb2011-08-20 09:50:55 -0700121 result += '.';
122 result += m->GetName()->ToModifiedUtf8();
123 if (with_signature) {
124 // TODO: iterate over the signature's elements and pass them all to
125 // PrettyDescriptor? We'd need to pull out the return type specially, too.
126 result += m->GetSignature()->ToModifiedUtf8();
127 }
128 return result;
129}
130
Elliott Hughes54e7df12011-09-16 11:47:04 -0700131std::string PrettyTypeOf(const Object* obj) {
Elliott Hughes11e45072011-08-16 17:40:46 -0700132 if (obj == NULL) {
133 return "null";
134 }
135 if (obj->GetClass() == NULL) {
136 return "(raw)";
137 }
Elliott Hughes5174fe62011-08-23 15:12:35 -0700138 std::string result(PrettyDescriptor(obj->GetClass()->GetDescriptor()));
Elliott Hughes11e45072011-08-16 17:40:46 -0700139 if (obj->IsClass()) {
Elliott Hughes5174fe62011-08-23 15:12:35 -0700140 result += "<" + PrettyDescriptor(obj->AsClass()->GetDescriptor()) + ">";
Elliott Hughes11e45072011-08-16 17:40:46 -0700141 }
142 return result;
143}
144
Elliott Hughes54e7df12011-09-16 11:47:04 -0700145std::string PrettyClass(const Class* c) {
146 if (c == NULL) {
147 return "null";
148 }
149 std::string result;
150 result += "java.lang.Class<";
151 result += PrettyDescriptor(c->GetDescriptor());
152 result += ">";
153 return result;
154}
155
Elliott Hughes79082e32011-08-25 12:07:32 -0700156std::string MangleForJni(const std::string& s) {
157 std::string result;
158 size_t char_count = CountModifiedUtf8Chars(s.c_str());
159 const char* cp = &s[0];
160 for (size_t i = 0; i < char_count; ++i) {
161 uint16_t ch = GetUtf16FromUtf8(&cp);
162 if (ch == '$' || ch > 127) {
163 StringAppendF(&result, "_0%04x", ch);
164 } else {
165 switch (ch) {
166 case '_':
167 result += "_1";
168 break;
169 case ';':
170 result += "_2";
171 break;
172 case '[':
173 result += "_3";
174 break;
175 case '/':
176 result += "_";
177 break;
178 default:
179 result.push_back(ch);
180 break;
181 }
182 }
183 }
184 return result;
185}
186
187std::string JniShortName(const Method* m) {
188 Class* declaring_class = m->GetDeclaringClass();
189
190 std::string class_name(declaring_class->GetDescriptor()->ToModifiedUtf8());
191 // Remove the leading 'L' and trailing ';'...
192 CHECK(class_name[0] == 'L') << class_name;
193 CHECK(class_name[class_name.size() - 1] == ';') << class_name;
194 class_name.erase(0, 1);
195 class_name.erase(class_name.size() - 1, 1);
196
197 std::string method_name(m->GetName()->ToModifiedUtf8());
198
199 std::string short_name;
200 short_name += "Java_";
201 short_name += MangleForJni(class_name);
202 short_name += "_";
203 short_name += MangleForJni(method_name);
204 return short_name;
205}
206
207std::string JniLongName(const Method* m) {
208 std::string long_name;
209 long_name += JniShortName(m);
210 long_name += "__";
211
212 std::string signature(m->GetSignature()->ToModifiedUtf8());
213 signature.erase(0, 1);
214 signature.erase(signature.begin() + signature.find(')'), signature.end());
215
216 long_name += MangleForJni(signature);
217
218 return long_name;
219}
220
Elliott Hughes64bf5a32011-09-20 14:43:12 -0700221namespace {
222
// Helper for IsValidMemberNameUtf8(), a bit vector indicating valid low ascii.
// Word (c >> 5) holds the 32 characters starting at that multiple of 0x20;
// bit (c & 0x1f) within the word is set when character c is valid.
// The table is read-only, so it is declared const.
const uint32_t DEX_MEMBER_VALID_LOW_ASCII[4] = {
  0x00000000,  // 00..1f low control characters; nothing valid
  0x03ff2010,  // 20..3f digits and symbols; valid: '0'..'9', '$', '-'
  0x87fffffe,  // 40..5f uppercase etc.; valid: 'A'..'Z', '_'
  0x07fffffe   // 60..7f lowercase etc.; valid: 'a'..'z'
};
230
231// Helper for IsValidMemberNameUtf8(); do not call directly.
232bool IsValidMemberNameUtf8Slow(const char** pUtf8Ptr) {
233 /*
234 * It's a multibyte encoded character. Decode it and analyze. We
235 * accept anything that isn't (a) an improperly encoded low value,
236 * (b) an improper surrogate pair, (c) an encoded '\0', (d) a high
237 * control character, or (e) a high space, layout, or special
238 * character (U+00a0, U+2000..U+200f, U+2028..U+202f,
239 * U+fff0..U+ffff). This is all specified in the dex format
240 * document.
241 */
242
243 uint16_t utf16 = GetUtf16FromUtf8(pUtf8Ptr);
244
245 // Perform follow-up tests based on the high 8 bits.
246 switch (utf16 >> 8) {
247 case 0x00:
248 // It's only valid if it's above the ISO-8859-1 high space (0xa0).
249 return (utf16 > 0x00a0);
250 case 0xd8:
251 case 0xd9:
252 case 0xda:
253 case 0xdb:
254 // It's a leading surrogate. Check to see that a trailing
255 // surrogate follows.
256 utf16 = GetUtf16FromUtf8(pUtf8Ptr);
257 return (utf16 >= 0xdc00) && (utf16 <= 0xdfff);
258 case 0xdc:
259 case 0xdd:
260 case 0xde:
261 case 0xdf:
262 // It's a trailing surrogate, which is not valid at this point.
263 return false;
264 case 0x20:
265 case 0xff:
266 // It's in the range that has spaces, controls, and specials.
267 switch (utf16 & 0xfff8) {
268 case 0x2000:
269 case 0x2008:
270 case 0x2028:
271 case 0xfff0:
272 case 0xfff8:
273 return false;
274 }
275 break;
276 }
277 return true;
278}
279
280/* Return whether the pointed-at modified-UTF-8 encoded character is
281 * valid as part of a member name, updating the pointer to point past
282 * the consumed character. This will consume two encoded UTF-16 code
283 * points if the character is encoded as a surrogate pair. Also, if
284 * this function returns false, then the given pointer may only have
285 * been partially advanced.
286 */
287bool IsValidMemberNameUtf8(const char** pUtf8Ptr) {
288 uint8_t c = (uint8_t) **pUtf8Ptr;
289 if (c <= 0x7f) {
290 // It's low-ascii, so check the table.
291 uint32_t wordIdx = c >> 5;
292 uint32_t bitIdx = c & 0x1f;
293 (*pUtf8Ptr)++;
294 return (DEX_MEMBER_VALID_LOW_ASCII[wordIdx] & (1 << bitIdx)) != 0;
295 }
296
297 // It's a multibyte encoded character. Call a non-inline function
298 // for the heavy lifting.
299 return IsValidMemberNameUtf8Slow(pUtf8Ptr);
300}
301
302} // namespace
303
304bool IsValidClassName(const char* s, bool isClassName, bool dot_or_slash) {
305 char separator = (dot_or_slash ? '.' : '/');
306
307 int arrayCount = 0;
308 while (*s == '[') {
309 arrayCount++;
310 s++;
311 }
312
313 if (arrayCount > 255) {
314 // Arrays may have no more than 255 dimensions.
315 return false;
316 }
317
318 if (arrayCount != 0) {
319 /*
320 * If we're looking at an array of some sort, then it doesn't
321 * matter if what is being asked for is a class name; the
322 * format looks the same as a type descriptor in that case, so
323 * treat it as such.
324 */
325 isClassName = false;
326 }
327
328 if (!isClassName) {
329 /*
330 * We are looking for a descriptor. Either validate it as a
331 * single-character primitive type, or continue on to check the
332 * embedded class name (bracketed by "L" and ";").
333 */
334 switch (*(s++)) {
335 case 'B':
336 case 'C':
337 case 'D':
338 case 'F':
339 case 'I':
340 case 'J':
341 case 'S':
342 case 'Z':
343 // These are all single-character descriptors for primitive types.
344 return (*s == '\0');
345 case 'V':
346 // Non-array void is valid, but you can't have an array of void.
347 return (arrayCount == 0) && (*s == '\0');
348 case 'L':
349 // Class name: Break out and continue below.
350 break;
351 default:
352 // Oddball descriptor character.
353 return false;
354 }
355 }
356
357 /*
358 * We just consumed the 'L' that introduces a class name as part
359 * of a type descriptor, or we are looking for an unadorned class
360 * name.
361 */
362
363 bool sepOrFirst = true; // first character or just encountered a separator.
364 for (;;) {
365 uint8_t c = (uint8_t) *s;
366 switch (c) {
367 case '\0':
368 /*
369 * Premature end for a type descriptor, but valid for
370 * a class name as long as we haven't encountered an
371 * empty component (including the degenerate case of
372 * the empty string "").
373 */
374 return isClassName && !sepOrFirst;
375 case ';':
376 /*
377 * Invalid character for a class name, but the
378 * legitimate end of a type descriptor. In the latter
379 * case, make sure that this is the end of the string
380 * and that it doesn't end with an empty component
381 * (including the degenerate case of "L;").
382 */
383 return !isClassName && !sepOrFirst && (s[1] == '\0');
384 case '/':
385 case '.':
386 if (c != separator) {
387 // The wrong separator character.
388 return false;
389 }
390 if (sepOrFirst) {
391 // Separator at start or two separators in a row.
392 return false;
393 }
394 sepOrFirst = true;
395 s++;
396 break;
397 default:
398 if (!IsValidMemberNameUtf8(&s)) {
399 return false;
400 }
401 sepOrFirst = false;
402 break;
403 }
404 }
405}
406
// Splits 's' on 'delim' and appends every non-empty piece to 'result'.
// Leading, trailing and repeated delimiters produce no empty strings, and
// anything already in 'result' is left in place.
void Split(const std::string& s, char delim, std::vector<std::string>& result) {
  const std::string::size_type length = s.size();
  std::string::size_type pos = 0;
  while (pos < length) {
    // Skip over any run of delimiters to find where the next token starts.
    const std::string::size_type token_start = s.find_first_not_of(delim, pos);
    if (token_start == std::string::npos) {
      break;  // Only delimiters remain.
    }
    // The token runs up to the next delimiter, or to the end of the string.
    std::string::size_type token_end = s.find(delim, token_start);
    if (token_end == std::string::npos) {
      token_end = length;
    }
    result.push_back(s.substr(token_start, token_end - token_start));
    pos = token_end;
  }
}
422
Elliott Hughesdcc24742011-09-07 14:02:44 -0700423void SetThreadName(const char *threadName) {
424 int hasAt = 0;
425 int hasDot = 0;
426 const char *s = threadName;
427 while (*s) {
428 if (*s == '.') {
429 hasDot = 1;
430 } else if (*s == '@') {
431 hasAt = 1;
432 }
433 s++;
434 }
435 int len = s - threadName;
436 if (len < 15 || hasAt || !hasDot) {
437 s = threadName;
438 } else {
439 s = threadName + len - 15;
440 }
441#if defined(HAVE_ANDROID_PTHREAD_SETNAME_NP)
442 /* pthread_setname_np fails rather than truncating long strings */
443 char buf[16]; // MAX_TASK_COMM_LEN=16 is hard-coded into bionic
444 strncpy(buf, s, sizeof(buf)-1);
445 buf[sizeof(buf)-1] = '\0';
446 errno = pthread_setname_np(pthread_self(), buf);
447 if (errno != 0) {
448 PLOG(WARNING) << "Unable to set the name of current thread to '" << buf << "'";
449 }
450#elif defined(HAVE_PRCTL)
451 prctl(PR_SET_NAME, (unsigned long) s, 0, 0, 0);
452#else
453#error no implementation for SetThreadName
454#endif
455}
456
Elliott Hughes11e45072011-08-16 17:40:46 -0700457} // namespace art
Elliott Hughes42ee1422011-09-06 12:33:32 -0700458
// Neither bionic nor glibc exposes gettid(2), so art::GetTid() is defined
// here on top of the raw system call.
// NOTE(review): __KERNEL__ is presumably defined around the include so that
// older kernel headers expose the _syscallN helper macros -- confirm.
#define __KERNEL__
#include <linux/unistd.h>
namespace art {
#if defined(_syscall0)
// The kernel headers provide the stub generator; let it emit GetTid().
_syscall0(pid_t, GetTid)
#else
// Otherwise issue the system call by number.
pid_t GetTid() {
  return static_cast<pid_t>(syscall(__NR_gettid));
}
#endif
}  // namespace art
#undef __KERNEL__