2010-04-14 04:48:59 +02:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2010 The Android Open Source Project
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
2017-09-06 22:43:57 +02:00
|
|
|
#include "sigchld_handler.h"
|
2017-07-29 00:22:23 +02:00
|
|
|
|
2010-04-14 04:48:59 +02:00
|
|
|
#include <signal.h>
|
2017-04-07 01:30:22 +02:00
|
|
|
#include <string.h>
|
2023-11-03 18:33:17 +01:00
|
|
|
#include <sys/signalfd.h>
|
2010-04-14 04:48:59 +02:00
|
|
|
#include <sys/socket.h>
|
2015-03-28 07:20:44 +01:00
|
|
|
#include <sys/types.h>
|
2017-07-29 00:22:23 +02:00
|
|
|
#include <sys/wait.h>
|
2015-03-28 07:20:44 +01:00
|
|
|
#include <unistd.h>
|
|
|
|
|
2017-07-29 00:22:23 +02:00
|
|
|
#include <android-base/chrono_utils.h>
|
2022-10-21 21:44:02 +02:00
|
|
|
#include <android-base/file.h>
|
2017-04-07 01:30:22 +02:00
|
|
|
#include <android-base/logging.h>
|
2017-07-29 00:22:23 +02:00
|
|
|
#include <android-base/scopeguard.h>
|
|
|
|
#include <android-base/stringprintf.h>
|
2010-04-14 04:48:59 +02:00
|
|
|
|
2019-10-09 16:23:02 +02:00
|
|
|
#include <thread>
|
|
|
|
|
2023-11-03 18:33:17 +01:00
|
|
|
#include "epoll.h"
|
2010-04-14 04:48:59 +02:00
|
|
|
#include "init.h"
|
2015-07-31 21:45:25 +02:00
|
|
|
#include "service.h"
|
2019-06-26 19:46:20 +02:00
|
|
|
#include "service_list.h"
|
2010-04-14 04:48:59 +02:00
|
|
|
|
2017-07-29 00:22:23 +02:00
|
|
|
using android::base::boot_clock;
|
|
|
|
using android::base::make_scope_guard;
|
2022-10-21 21:44:02 +02:00
|
|
|
using android::base::ReadFileToString;
|
2019-10-09 16:23:02 +02:00
|
|
|
using android::base::StringPrintf;
|
|
|
|
using android::base::Timer;
|
2017-07-29 00:22:23 +02:00
|
|
|
|
2017-06-22 21:53:17 +02:00
|
|
|
namespace android {
|
|
|
|
namespace init {
|
|
|
|
|
2019-10-09 16:23:02 +02:00
|
|
|
static pid_t ReapOneProcess() {
|
2017-07-29 00:22:23 +02:00
|
|
|
siginfo_t siginfo = {};
|
|
|
|
// This returns a zombie pid or informs us that there are no zombies left to be reaped.
|
|
|
|
// It does NOT reap the pid; that is done below.
|
|
|
|
if (TEMP_FAILURE_RETRY(waitid(P_ALL, 0, &siginfo, WEXITED | WNOHANG | WNOWAIT)) != 0) {
|
|
|
|
PLOG(ERROR) << "waitid failed";
|
2019-10-09 16:23:02 +02:00
|
|
|
return 0;
|
2017-07-29 00:22:23 +02:00
|
|
|
}
|
|
|
|
|
2022-10-19 19:52:23 +02:00
|
|
|
const pid_t pid = siginfo.si_pid;
|
|
|
|
if (pid == 0) {
|
|
|
|
DCHECK_EQ(siginfo.si_signo, 0);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
DCHECK_EQ(siginfo.si_signo, SIGCHLD);
|
2017-07-29 00:22:23 +02:00
|
|
|
|
|
|
|
// At this point we know we have a zombie pid, so we use this scopeguard to reap the pid
|
|
|
|
// whenever the function returns from this point forward.
|
|
|
|
// We do NOT want to reap the zombie earlier as in Service::Reap(), we kill(-pid, ...) and we
|
|
|
|
// want the pid to remain valid throughout that (and potentially future) usages.
|
|
|
|
auto reaper = make_scope_guard([pid] { TEMP_FAILURE_RETRY(waitpid(pid, nullptr, WNOHANG)); });
|
|
|
|
|
|
|
|
std::string name;
|
|
|
|
std::string wait_string;
|
2017-09-13 00:58:47 +02:00
|
|
|
Service* service = nullptr;
|
|
|
|
|
2019-04-24 00:11:07 +02:00
|
|
|
if (SubcontextChildReap(pid)) {
|
2017-09-13 00:58:47 +02:00
|
|
|
name = "Subcontext";
|
2017-07-29 00:22:23 +02:00
|
|
|
} else {
|
2017-09-13 00:58:47 +02:00
|
|
|
service = ServiceList::GetInstance().FindService(pid, &Service::pid);
|
|
|
|
|
|
|
|
if (service) {
|
|
|
|
name = StringPrintf("Service '%s' (pid %d)", service->name().c_str(), pid);
|
|
|
|
if (service->flags() & SVC_EXEC) {
|
|
|
|
auto exec_duration = boot_clock::now() - service->time_started();
|
|
|
|
auto exec_duration_ms =
|
|
|
|
std::chrono::duration_cast<std::chrono::milliseconds>(exec_duration).count();
|
|
|
|
wait_string = StringPrintf(" waiting took %f seconds", exec_duration_ms / 1000.0f);
|
2019-07-31 20:35:18 +02:00
|
|
|
} else if (service->flags() & SVC_ONESHOT) {
|
|
|
|
auto exec_duration = boot_clock::now() - service->time_started();
|
|
|
|
auto exec_duration_ms =
|
|
|
|
std::chrono::duration_cast<std::chrono::milliseconds>(exec_duration)
|
|
|
|
.count();
|
|
|
|
wait_string = StringPrintf(" oneshot service took %f seconds in background",
|
|
|
|
exec_duration_ms / 1000.0f);
|
2017-09-13 00:58:47 +02:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
name = StringPrintf("Untracked pid %d", pid);
|
|
|
|
}
|
2017-07-29 00:22:23 +02:00
|
|
|
}
|
|
|
|
|
2018-04-13 19:38:57 +02:00
|
|
|
if (siginfo.si_code == CLD_EXITED) {
|
|
|
|
LOG(INFO) << name << " exited with status " << siginfo.si_status << wait_string;
|
|
|
|
} else {
|
|
|
|
LOG(INFO) << name << " received signal " << siginfo.si_status << wait_string;
|
2017-07-29 00:22:23 +02:00
|
|
|
}
|
|
|
|
|
2022-03-08 04:10:57 +01:00
|
|
|
if (!service) {
|
|
|
|
LOG(INFO) << name << " did not have an associated service entry and will not be reaped";
|
|
|
|
return pid;
|
|
|
|
}
|
2017-07-29 00:22:23 +02:00
|
|
|
|
2018-04-13 19:38:57 +02:00
|
|
|
service->Reap(siginfo);
|
2017-07-29 00:22:23 +02:00
|
|
|
|
|
|
|
if (service->flags() & SVC_TEMPORARY) {
|
2017-07-28 01:20:58 +02:00
|
|
|
ServiceList::GetInstance().RemoveService(*service);
|
2017-07-29 00:22:23 +02:00
|
|
|
}
|
|
|
|
|
2019-10-09 16:23:02 +02:00
|
|
|
return pid;
|
2017-07-29 00:22:23 +02:00
|
|
|
}
|
|
|
|
|
2023-11-20 23:38:55 +01:00
|
|
|
std::set<pid_t> ReapAnyOutstandingChildren() {
|
|
|
|
std::set<pid_t> reaped_pids;
|
|
|
|
for (;;) {
|
|
|
|
const pid_t pid = ReapOneProcess();
|
|
|
|
if (pid <= 0) {
|
|
|
|
return reaped_pids;
|
|
|
|
}
|
|
|
|
reaped_pids.emplace(pid);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void ReapAndRemove(std::vector<pid_t>& alive_pids) {
|
|
|
|
for (auto pid : ReapAnyOutstandingChildren()) {
|
|
|
|
const auto it = std::find(alive_pids.begin(), alive_pids.end(), pid);
|
|
|
|
if (it != alive_pids.end()) {
|
|
|
|
alive_pids.erase(it);
|
|
|
|
}
|
2019-10-09 16:23:02 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-11-16 20:19:08 +01:00
|
|
|
static void HandleSignal(int signal_fd) {
|
2023-11-03 18:33:17 +01:00
|
|
|
signalfd_siginfo siginfo;
|
|
|
|
ssize_t bytes_read = TEMP_FAILURE_RETRY(read(signal_fd, &siginfo, sizeof(siginfo)));
|
|
|
|
if (bytes_read != sizeof(siginfo)) {
|
|
|
|
LOG(WARNING) << "Unexpected: " << __func__ << " read " << bytes_read << " bytes instead of "
|
|
|
|
<< sizeof(siginfo);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void WaitToBeReaped(int sigchld_fd, const std::vector<pid_t>& pids,
|
|
|
|
std::chrono::milliseconds timeout) {
|
2019-10-09 16:23:02 +02:00
|
|
|
Timer t;
|
2023-11-03 18:33:17 +01:00
|
|
|
Epoll epoll;
|
|
|
|
if (sigchld_fd >= 0) {
|
2023-11-16 20:19:08 +01:00
|
|
|
if (auto result = epoll.Open(); result.ok()) {
|
|
|
|
result =
|
|
|
|
epoll.RegisterHandler(sigchld_fd, [sigchld_fd]() { HandleSignal(sigchld_fd); });
|
|
|
|
if (!result.ok()) {
|
|
|
|
LOG(WARNING) << __func__
|
|
|
|
<< " RegisterHandler() failed. Falling back to sleep_for(): "
|
|
|
|
<< result.error();
|
|
|
|
sigchld_fd = -1;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
LOG(WARNING) << __func__ << " Epoll::Open() failed. Falling back to sleep_for(): "
|
|
|
|
<< result.error();
|
|
|
|
sigchld_fd = -1;
|
|
|
|
}
|
2023-11-03 18:33:17 +01:00
|
|
|
}
|
2023-11-16 20:19:08 +01:00
|
|
|
std::vector<pid_t> alive_pids(pids);
|
|
|
|
ReapAndRemove(alive_pids);
|
2019-10-09 16:23:02 +02:00
|
|
|
while (!alive_pids.empty() && t.duration() < timeout) {
|
2023-11-03 18:33:17 +01:00
|
|
|
if (sigchld_fd >= 0) {
|
2023-11-16 20:19:08 +01:00
|
|
|
auto result = epoll.Wait(std::max(timeout - t.duration(), 0ms));
|
|
|
|
if (result.ok()) {
|
|
|
|
ReapAndRemove(alive_pids);
|
|
|
|
continue;
|
|
|
|
} else {
|
|
|
|
LOG(WARNING) << "Epoll::Wait() failed " << result.error();
|
|
|
|
}
|
2023-11-03 18:33:17 +01:00
|
|
|
}
|
2023-11-16 20:19:08 +01:00
|
|
|
std::this_thread::sleep_for(50ms);
|
|
|
|
ReapAndRemove(alive_pids);
|
2017-07-29 00:22:23 +02:00
|
|
|
}
|
2019-10-09 16:23:02 +02:00
|
|
|
LOG(INFO) << "Waiting for " << pids.size() << " pids to be reaped took " << t << " with "
|
|
|
|
<< alive_pids.size() << " of them still running";
|
2023-11-01 22:29:07 +01:00
|
|
|
for (pid_t pid : alive_pids) {
|
2022-10-21 21:44:02 +02:00
|
|
|
std::string status = "(no-such-pid)";
|
|
|
|
ReadFileToString(StringPrintf("/proc/%d/status", pid), &status);
|
2023-11-01 22:29:07 +01:00
|
|
|
LOG(INFO) << "Still running: " << pid << '\n' << status;
|
2022-10-21 21:44:02 +02:00
|
|
|
}
|
2017-07-29 00:22:23 +02:00
|
|
|
}
|
|
|
|
|
2017-06-22 21:53:17 +02:00
|
|
|
} // namespace init
|
|
|
|
} // namespace android
|