blob: 8494f9895e684cbe318426b7647bfbba44c72fd3 [file] [log] [blame]
/*
* Copyright (C) 2016 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#define LOG_TAG "incidentd"
#include "Section.h"
#include "protobuf.h"
#include <binder/IServiceManager.h>
#include <mutex>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <wait.h>
#include <unistd.h>
using namespace std;
const int64_t REMOTE_CALL_TIMEOUT_MS = 10 * 1000; // 10 seconds
const int64_t INCIDENT_HELPER_TIMEOUT_MS = 5 * 1000; // 5 seconds
const char* INCIDENT_HELPER = "/system/bin/incident_helper";
const uid_t IH_UID = 9999; // run incident_helper as nobody
const gid_t IH_GID = 9999;
// ================================================================================
Section::Section(int i)
:id(i)
{
}
Section::~Section()
{
}
status_t
Section::WriteHeader(ReportRequestSet* requests, size_t size) const
{
ssize_t amt;
uint8_t buf[20];
uint8_t* p = write_length_delimited_tag_header(buf, this->id, size);
return requests->write(buf, p-buf);
}
// ================================================================================
FileSection::FileSection(int id, const char* filename)
: Section(id), mFilename(filename) {
name = "cat ";
name += filename;
}
FileSection::~FileSection() {}
status_t FileSection::Execute(ReportRequestSet* requests) const {
Fpipe p2cPipe;
Fpipe c2pPipe;
FdBuffer buffer;
// initiate pipes to pass data to/from incident_helper
if (p2cPipe.init() == -1) {
return -errno;
}
if (c2pPipe.init() == -1) {
return -errno;
}
// fork a child process
pid_t pid = fork();
if (pid == -1) {
ALOGW("FileSection '%s' failed to fork", this->name.string());
return -errno;
}
// child process
if (pid == 0) {
if (setgid(IH_GID) == -1) {
ALOGW("FileSection '%s' can't change gid: %s", this->name.string(), strerror(errno));
exit(EXIT_FAILURE);
}
if (setuid(IH_UID) == -1) {
ALOGW("FileSection '%s' can't change uid: %s", this->name.string(), strerror(errno));
exit(EXIT_FAILURE);
}
if (dup2(p2cPipe.readFd(), STDIN_FILENO) != 0 || !p2cPipe.close()) {
ALOGW("FileSection '%s' failed to set up stdin: %s", this->name.string(), strerror(errno));
exit(EXIT_FAILURE);
}
if (dup2(c2pPipe.writeFd(), STDOUT_FILENO) != 1 || !c2pPipe.close()) {
ALOGW("FileSection '%s' failed to set up stdout: %s", this->name.string(), strerror(errno));
exit(EXIT_FAILURE);
}
// execute incident_helper to parse raw file data and generate protobuf
char sectionID[8]; // section id is expected to be smaller than 8 digits
sprintf(sectionID, "%d", this->id);
const char* args[]{INCIDENT_HELPER, "-s", sectionID, NULL};
execv(INCIDENT_HELPER, const_cast<char**>(args));
ALOGW("FileSection '%s' failed in child process: %s", this->name.string(), strerror(errno));
return -1;
}
// parent process
// close fds used in child process
close(p2cPipe.readFd());
close(c2pPipe.writeFd());
// read from mFilename and pump buffer to incident_helper
status_t err = NO_ERROR;
int fd = open(mFilename, O_RDONLY, 0444);
if (fd == -1) {
ALOGW("FileSection '%s' failed to open file", this->name.string());
return -errno;
}
err = buffer.readProcessedDataInStream(fd,
p2cPipe.writeFd(), c2pPipe.readFd(), INCIDENT_HELPER_TIMEOUT_MS);
if (err != NO_ERROR) {
ALOGW("FileSection '%s' failed to read data from incident helper: %s",
this->name.string(), strerror(-err));
kill(pid, SIGKILL); // kill child process if meets error
return err;
}
if (buffer.timedOut()) {
ALOGW("FileSection '%s' timed out reading from incident helper!", this->name.string());
kill(pid, SIGKILL); // kill the child process if timed out
}
// has to block here to reap child process
int status;
int w = waitpid(pid, &status, 0);
if (w < 0 || status == -1) {
ALOGW("FileSection '%s' abnormal child process: %s", this->name.string(), strerror(-err));
return -errno;
}
// write parsed data to reporter
ALOGD("section '%s' wrote %zd bytes in %d ms", this->name.string(), buffer.size(),
(int)buffer.durationMs());
WriteHeader(requests, buffer.size());
err = buffer.write(requests);
if (err != NO_ERROR) {
ALOGW("FileSection '%s' failed writing: %s", this->name.string(), strerror(-err));
return err;
}
return NO_ERROR;
}
// ================================================================================
struct WorkerThreadData : public virtual RefBase
{
const WorkerThreadSection* section;
int fds[2];
// Lock protects these fields
mutex lock;
bool workerDone;
status_t workerError;
WorkerThreadData(const WorkerThreadSection* section);
virtual ~WorkerThreadData();
int readFd() { return fds[0]; }
int writeFd() { return fds[1]; }
};
WorkerThreadData::WorkerThreadData(const WorkerThreadSection* sec)
:section(sec),
workerDone(false),
workerError(NO_ERROR)
{
fds[0] = -1;
fds[1] = -1;
}
WorkerThreadData::~WorkerThreadData()
{
}
// ================================================================================
WorkerThreadSection::WorkerThreadSection(int id)
:Section(id)
{
}
WorkerThreadSection::~WorkerThreadSection()
{
}
static void*
worker_thread_func(void* cookie)
{
WorkerThreadData* data = (WorkerThreadData*)cookie;
status_t err = data->section->BlockingCall(data->writeFd());
{
unique_lock<mutex> lock(data->lock);
data->workerDone = true;
data->workerError = err;
}
close(data->writeFd());
data->decStrong(data->section);
// data might be gone now. don't use it after this point in this thread.
return NULL;
}
status_t
WorkerThreadSection::Execute(ReportRequestSet* requests) const
{
status_t err = NO_ERROR;
pthread_t thread;
pthread_attr_t attr;
bool timedOut = false;
FdBuffer buffer;
// Data shared between this thread and the worker thread.
sp<WorkerThreadData> data = new WorkerThreadData(this);
// Create the pipe
err = pipe(data->fds);
if (err != 0) {
return -errno;
}
// The worker thread needs a reference and we can't let the count go to zero
// if that thread is slow to start.
data->incStrong(this);
// Create the thread
err = pthread_attr_init(&attr);
if (err != 0) {
return -err;
}
// TODO: Do we need to tweak thread priority?
err = pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
if (err != 0) {
pthread_attr_destroy(&attr);
return -err;
}
err = pthread_create(&thread, &attr, worker_thread_func, (void*)data.get());
if (err != 0) {
pthread_attr_destroy(&attr);
return -err;
}
pthread_attr_destroy(&attr);
// Loop reading until either the timeout or the worker side is done (i.e. eof).
err = buffer.read(data->readFd(), REMOTE_CALL_TIMEOUT_MS);
if (err != NO_ERROR) {
// TODO: Log this error into the incident report.
ALOGW("WorkerThreadSection '%s' reader failed with error '%s'", this->name.string(),
strerror(-err));
}
// Done with the read fd. The worker thread closes the write one so
// we never race and get here first.
close(data->readFd());
// If the worker side is finished, then return its error (which may overwrite
// our possible error -- but it's more interesting anyway). If not, then we timed out.
{
unique_lock<mutex> lock(data->lock);
if (!data->workerDone) {
// We timed out
timedOut = true;
} else {
if (data->workerError != NO_ERROR) {
err = data->workerError;
// TODO: Log this error into the incident report.
ALOGW("WorkerThreadSection '%s' worker failed with error '%s'", this->name.string(),
strerror(-err));
}
}
}
if (timedOut || buffer.timedOut()) {
ALOGW("WorkerThreadSection '%s' timed out", this->name.string());
return NO_ERROR;
}
if (buffer.truncated()) {
// TODO: Log this into the incident report.
}
// TODO: There was an error with the command or buffering. Report that. For now
// just exit with a log messasge.
if (err != NO_ERROR) {
ALOGW("WorkerThreadSection '%s' failed with error '%s'", this->name.string(),
strerror(-err));
return NO_ERROR;
}
// Write the data that was collected
ALOGD("section '%s' wrote %zd bytes in %d ms", name.string(), buffer.size(),
(int)buffer.durationMs());
WriteHeader(requests, buffer.size());
err = buffer.write(requests);
if (err != NO_ERROR) {
ALOGW("WorkerThreadSection '%s' failed writing: '%s'", this->name.string(), strerror(-err));
return err;
}
return NO_ERROR;
}
// ================================================================================
CommandSection::CommandSection(int id, const char* first, ...)
:Section(id)
{
va_list args;
int count = 0;
va_start(args, first);
while (va_arg(args, const char*) != NULL) {
count++;
}
va_end(args);
mCommand = (const char**)malloc(sizeof(const char*) * count);
mCommand[0] = first;
name = first;
name += " ";
va_start(args, first);
for (int i=0; i<count; i++) {
const char* arg = va_arg(args, const char*);
mCommand[i+1] = arg;
if (arg != NULL) {
name += va_arg(args, const char*);
name += " ";
}
}
va_end(args);
}
CommandSection::~CommandSection()
{
}
status_t
CommandSection::Execute(ReportRequestSet* /*requests*/) const
{
return NO_ERROR;
}
// ================================================================================
DumpsysSection::DumpsysSection(int id, const char* service, ...)
:WorkerThreadSection(id),
mService(service)
{
name = "dumpsys ";
name += service;
va_list args;
va_start(args, service);
while (true) {
const char* arg = va_arg(args, const char*);
if (arg == NULL) {
break;
}
mArgs.add(String16(arg));
name += " ";
name += arg;
}
va_end(args);
}
DumpsysSection::~DumpsysSection()
{
}
status_t
DumpsysSection::BlockingCall(int pipeWriteFd) const
{
// checkService won't wait for the service to show up like getService will.
sp<IBinder> service = defaultServiceManager()->checkService(mService);
if (service == NULL) {
// Returning an error interrupts the entire incident report, so just
// log the failure.
// TODO: have a meta record inside the report that would log this
// failure inside the report, because the fact that we can't find
// the service is good data in and of itself. This is running in
// another thread so lock that carefully...
ALOGW("DumpsysSection: Can't lookup service: %s", String8(mService).string());
return NO_ERROR;
}
service->dump(pipeWriteFd, mArgs);
return NO_ERROR;
}