| // Copyright (c) 2013 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "base/process/kill.h" |
| |
| #include <errno.h> |
| #include <signal.h> |
| #include <sys/event.h> |
| #include <sys/types.h> |
| #include <sys/wait.h> |
| |
| #include "base/files/file_util.h" |
| #include "base/files/scoped_file.h" |
| #include "base/logging.h" |
| #include "base/posix/eintr_wrapper.h" |
| |
| namespace base { |
| |
| namespace { |
| |
// Grace period, in seconds, that EnsureProcessTerminated() passes to
// WaitForChildToDie() as the time a process gets to exit before it is killed.
const int kWaitBeforeKillSeconds = 2;
| |
| // Reap |child| process. This call blocks until completion. |
| void BlockingReap(pid_t child) { |
| const pid_t result = HANDLE_EINTR(waitpid(child, NULL, 0)); |
| if (result == -1) { |
| DPLOG(ERROR) << "waitpid(" << child << ", NULL, 0)"; |
| } |
| } |
| |
// Blocks on the kqueue |kq_fd| until it delivers an event into |event| or
// |timeout_seconds| have elapsed. kevent() is restarted after EINTR with
// whatever time is left before the deadline.
//
// Returns the result of the last kevent() call, except that an interrupted
// call is reported as 0 (no event) when no time is left to retry. On a -1
// return errno is the one set by the failing kevent() call. -1 is also
// returned, without kevent() having been called, when the initial time budget
// is not positive.
int WaitForKqueueEvent(int kq_fd, int timeout_seconds, struct kevent* event) {
  TimeDelta time_left = TimeDelta::FromSeconds(timeout_seconds);
  const TimeTicks deadline = TimeTicks::Now() + time_left;

  int rv = -1;
  while (time_left.InMilliseconds() > 0) {
    const struct timespec wait_spec = time_left.ToTimeSpec();
    rv = kevent(kq_fd, NULL, 0, event, 1, &wait_spec);
    if (rv != -1 || errno != EINTR)
      break;

    // Interrupted by a signal: treat it as "no event yet" and go around again
    // with the time that remains until the deadline.
    rv = 0;
    time_left = deadline - TimeTicks::Now();
  }
  return rv;
}

// Gives |child| up to |timeout| seconds to exit, reaping it when it does. A
// child that has not exited by then is sent SIGKILL and reaped.
//
// Strategy: a kqueue is the preferred way to watch for the exit, because
// kevent can block on it with a timeout. When the kqueue reports the exit,
// waitpid collects the child. If no exit notification arrives in time, or the
// kqueue cannot be created or misbehaves, the child is killed and reaped
// instead.
//
// |child| may be in any of these states on entry: running; terminated but not
// yet reaped; or (apparently, and unfortunately) terminated and already
// reaped. Callers normally ask the process to exit before calling this
// function, but that is not required.
//
// For a process that is terminating but unreaped there can be a window in
// which kqueue no longer recognizes it, yet it is not a zombie that a
// non-blocking (WNOHANG) waitpid can reap. That window is detected when
// registering with the kqueue fails with ESRCH while a WNOHANG waitpid
// reports the child as still running. The child is then known to be dying, so
// it is killed (for good measure) and collected with a blocking wait rather
// than left behind as a zombie.
//
// If the kqueue is unusable altogether, as it might be under an EMFILE
// condition ("too many open files", i.e. out of file descriptors), the child
// is forcibly killed and reaped without any delay. This closes off another
// way for zombies to accumulate.
//
// Known problems: this function can seemingly be called for a child that has
// not only terminated but already been reaped, in which case its pid may have
// been reclaimed and may refer to a different process. It can also seemingly
// be called for a process that is not a child at all: kqueue works for such a
// process but waitpid does not, and killing a non-child might not be the best
// approach.
void WaitForChildToDie(pid_t child, int timeout) {
  DCHECK_GT(child, 0);
  DCHECK_GT(timeout, 0);

  // DO NOT ADD EARLY RETURNS TO THIS FUNCTION unless |child| is known to have
  // been reaped at that point. Whatever goes wrong with kqueue, kevent, or
  // any other call, control must still reach the kill-and-reap fallback at
  // the bottom. Breaking this rule brings zombies back.

  // |kq| intentionally lives until the end of the function.
  ScopedFD kq(HANDLE_EINTR(kqueue()));
  if (kq.is_valid()) {
    // Ask the kqueue to report the exit of |child|.
    struct kevent registration = {0};
    EV_SET(&registration, child, EVFILT_PROC, EV_ADD, NOTE_EXIT, 0, NULL);
    const int setup_rv =
        HANDLE_EINTR(kevent(kq.get(), &registration, 1, NULL, 0, NULL));

    if (setup_rv != -1) {
      // Registered successfully: wait for the exit notification or for the
      // timeout, whichever comes first.
      struct kevent event = {0};
      const int wait_rv = WaitForKqueueEvent(kq.get(), timeout, &event);

      if (wait_rv == 1) {
        const bool is_exit_of_child =
            (event.fflags & NOTE_EXIT) &&
            (event.ident == static_cast<uintptr_t>(child));
        if (is_exit_of_child) {
          // The process is dead or dying, so this blocks briefly, if at all.
          BlockingReap(child);
          return;
        }
        DLOG(ERROR) << "kevent (wait " << child
                    << "): unexpected event: fflags=" << event.fflags
                    << ", ident=" << event.ident;
      } else if (wait_rv == -1) {
        DPLOG(ERROR) << "kevent (wait " << child << ")";
      } else if (wait_rv > 1) {
        DLOG(ERROR) << "kevent (wait " << child << "): unexpected result "
                    << wait_rv;
      }
      // A |wait_rv| of 0 means the timeout expired without an exit event.
    } else if (errno == ESRCH) {
      // kqueue cannot find the process, so one of these holds:
      //  1. The process has died but has not yet been reaped.
      //  2. The process has died and has already been reaped.
      //  3. The process is in the middle of dying: no longer kqueueable, but
      //     perhaps not waitable yet either. Mark calls this case the
      //     "zombie death race".
      //
      // A non-blocking waitpid tells them apart. A positive result is case 1
      // (the child was just reaped) and -1 is taken to be case 2 (already
      // reaped); nothing is left to do in either case.
      if (HANDLE_EINTR(waitpid(child, NULL, WNOHANG)) != 0)
        return;

      // waitpid returned 0, which is case 3. The process will become waitable
      // in short order, so drop out of the kqueue code to kill it (for good
      // measure) and reap it.
    } else {
      DPLOG(ERROR) << "kevent (setup " << child << ")";
    }
  } else {
    DPLOG(ERROR) << "kqueue()";
  }

  // Last resort. The child is either still alive or very freshly dead; send
  // SIGKILL to be sure. This is safe for a freshly dead child too: it is a
  // zombie (or about to become one), and kill returns 0 even when the signal
  // is not delivered to a live process.
  const int kill_rv = kill(child, SIGKILL);
  if (kill_rv != -1) {
    // The child is definitely on its way out now, so the blocking reap will
    // not have to wait long, if at all.
    BlockingReap(child);
  } else {
    DPLOG(ERROR) << "kill(" << child << ", SIGKILL)";
  }
}
| |
| } // namespace |
| |
| void EnsureProcessTerminated(Process process) { |
| WaitForChildToDie(process.Pid(), kWaitBeforeKillSeconds); |
| } |
| |
| } // namespace base |