/* * Copyright (C) 2008 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ // sys/mount.h has to come before linux/fs.h due to redefinition of MS_RDONLY, MS_BIND, etc #include <sys/mount.h> #include <linux/fs.h> #include <grp.h> #include <paths.h> #include <signal.h> #include <stdlib.h> #include <sys/types.h> #include <sys/wait.h> #include <unistd.h> #include "cutils/fs.h" #include "cutils/multiuser.h" #include "cutils/sched_policy.h" #include "debugger.h" #include "jni_internal.h" #include "JNIHelp.h" #include "ScopedLocalRef.h" #include "ScopedPrimitiveArray.h" #include "ScopedUtfChars.h" #include "thread.h" #if defined(HAVE_PRCTL) #include <sys/prctl.h> #endif #include <selinux/android.h> #if defined(__linux__) #include <sys/personality.h> #include <sys/utsname.h> #include <sys/capability.h> #endif namespace art { static pid_t gSystemServerPid = 0; // Must match values in dalvik.system.Zygote. enum MountExternalKind { MOUNT_EXTERNAL_NONE = 0, MOUNT_EXTERNAL_SINGLEUSER = 1, MOUNT_EXTERNAL_MULTIUSER = 2, MOUNT_EXTERNAL_MULTIUSER_ALL = 3, }; // This signal handler is for zygote mode, since the zygote must reap its children static void SigChldHandler(int /*signal_number*/) { pid_t pid; int status; while ((pid = waitpid(-1, &status, WNOHANG)) > 0) { // Log process-death status that we care about. In general it is // not safe to call LOG(...) from a signal handler because of // possible reentrancy. However, we know a priori that the // current implementation of LOG() is safe to call from a SIGCHLD // handler in the zygote process. If the LOG() implementation // changes its locking strategy or its use of syscalls within the // lazy-init critical section, its use here may become unsafe. if (WIFEXITED(status)) { if (WEXITSTATUS(status)) { LOG(INFO) << "Process " << pid << " exited cleanly (" << WEXITSTATUS(status) << ")"; } else if (false) { LOG(INFO) << "Process " << pid << " exited cleanly (" << WEXITSTATUS(status) << ")"; } } else if (WIFSIGNALED(status)) { if (WTERMSIG(status) != SIGKILL) { LOG(INFO) << "Process " << pid << " terminated by signal (" << WTERMSIG(status) << ")"; } else if (false) { LOG(INFO) << "Process " << pid << " terminated by signal (" << WTERMSIG(status) << ")"; } #ifdef WCOREDUMP if (WCOREDUMP(status)) { LOG(INFO) << "Process " << pid << " dumped core"; } #endif /* ifdef WCOREDUMP */ } // If the just-crashed process is the system_server, bring down zygote // so that it is restarted by init and system server will be restarted // from there. if (pid == gSystemServerPid) { LOG(ERROR) << "Exit zygote because system server (" << pid << ") has terminated"; kill(getpid(), SIGKILL); } } if (pid < 0) { PLOG(WARNING) << "Zygote SIGCHLD error in waitpid"; } } // Configures the SIGCHLD handler for the zygote process. This is configured // very late, because earlier in the runtime we may fork() and exec() // other processes, and we want to waitpid() for those rather than // have them be harvested immediately. // // This ends up being called repeatedly before each fork(), but there's // no real harm in that. static void SetSigChldHandler() { struct sigaction sa; memset(&sa, 0, sizeof(sa)); sa.sa_handler = SigChldHandler; int err = sigaction(SIGCHLD, &sa, NULL); if (err < 0) { PLOG(WARNING) << "Error setting SIGCHLD handler"; } } // Sets the SIGCHLD handler back to default behavior in zygote children. static void UnsetSigChldHandler() { struct sigaction sa; memset(&sa, 0, sizeof(sa)); sa.sa_handler = SIG_DFL; int err = sigaction(SIGCHLD, &sa, NULL); if (err < 0) { PLOG(WARNING) << "Error unsetting SIGCHLD handler"; } } // Calls POSIX setgroups() using the int[] object as an argument. // A NULL argument is tolerated. static void SetGids(JNIEnv* env, jintArray javaGids) { if (javaGids == NULL) { return; } COMPILE_ASSERT(sizeof(gid_t) == sizeof(jint), sizeof_gid_and_jint_are_differerent); ScopedIntArrayRO gids(env, javaGids); CHECK(gids.get() != NULL); int rc = setgroups(gids.size(), reinterpret_cast<const gid_t*>(&gids[0])); if (rc == -1) { PLOG(FATAL) << "setgroups failed"; } } // Sets the resource limits via setrlimit(2) for the values in the // two-dimensional array of integers that's passed in. The second dimension // contains a tuple of length 3: (resource, rlim_cur, rlim_max). NULL is // treated as an empty array. static void SetRLimits(JNIEnv* env, jobjectArray javaRlimits) { if (javaRlimits == NULL) { return; } rlimit rlim; memset(&rlim, 0, sizeof(rlim)); for (int i = 0; i < env->GetArrayLength(javaRlimits); ++i) { ScopedLocalRef<jobject> javaRlimitObject(env, env->GetObjectArrayElement(javaRlimits, i)); ScopedIntArrayRO javaRlimit(env, reinterpret_cast<jintArray>(javaRlimitObject.get())); if (javaRlimit.size() != 3) { LOG(FATAL) << "rlimits array must have a second dimension of size 3"; } rlim.rlim_cur = javaRlimit[1]; rlim.rlim_max = javaRlimit[2]; int rc = setrlimit(javaRlimit[0], &rlim); if (rc == -1) { PLOG(FATAL) << "setrlimit(" << javaRlimit[0] << ", " << "{" << rlim.rlim_cur << ", " << rlim.rlim_max << "}) failed"; } } } #if defined(HAVE_ANDROID_OS) // The debug malloc library needs to know whether it's the zygote or a child. extern "C" int gMallocLeakZygoteChild; static void EnableDebugger() { // To let a non-privileged gdbserver attach to this // process, we must set our dumpable flag. if (prctl(PR_SET_DUMPABLE, 1, 0, 0, 0) == -1) { PLOG(ERROR) << "prctl(PR_SET_DUMPABLE) failed for pid " << getpid(); } // We don't want core dumps, though, so set the core dump size to 0. rlimit rl; rl.rlim_cur = 0; rl.rlim_max = RLIM_INFINITY; if (setrlimit(RLIMIT_CORE, &rl) == -1) { PLOG(ERROR) << "setrlimit(RLIMIT_CORE) failed for pid " << getpid(); } } static void EnableKeepCapabilities() { int rc = prctl(PR_SET_KEEPCAPS, 1, 0, 0, 0); if (rc == -1) { PLOG(FATAL) << "prctl(PR_SET_KEEPCAPS) failed"; } } static void DropCapabilitiesBoundingSet() { for (int i = 0; prctl(PR_CAPBSET_READ, i, 0, 0, 0) >= 0; i++) { if (i == CAP_NET_RAW) { // Don't break /system/bin/ping continue; } int rc = prctl(PR_CAPBSET_DROP, i, 0, 0, 0); if (rc == -1) { if (errno == EINVAL) { PLOG(ERROR) << "prctl(PR_CAPBSET_DROP) failed with EINVAL. Please verify " << "your kernel is compiled with file capabilities support"; } else { PLOG(FATAL) << "prctl(PR_CAPBSET_DROP) failed"; } } } } static void SetCapabilities(int64_t permitted, int64_t effective) { __user_cap_header_struct capheader; __user_cap_data_struct capdata; memset(&capheader, 0, sizeof(capheader)); memset(&capdata, 0, sizeof(capdata)); capheader.version = _LINUX_CAPABILITY_VERSION; capheader.pid = 0; capdata.effective = effective; capdata.permitted = permitted; if (capset(&capheader, &capdata) != 0) { PLOG(FATAL) << "capset(" << permitted << ", " << effective << ") failed"; } } static void SetSchedulerPolicy() { errno = -set_sched_policy(0, SP_DEFAULT); if (errno != 0) { PLOG(FATAL) << "set_sched_policy(0, SP_DEFAULT) failed"; } } #else static int gMallocLeakZygoteChild = 0; static void EnableDebugger() {} static void EnableKeepCapabilities() {} static void DropCapabilitiesBoundingSet() {} static void SetCapabilities(int64_t, int64_t) {} static void SetSchedulerPolicy() {} #endif static void EnableDebugFeatures(uint32_t debug_flags) { // Must match values in dalvik.system.Zygote. enum { DEBUG_ENABLE_DEBUGGER = 1, DEBUG_ENABLE_CHECKJNI = 1 << 1, DEBUG_ENABLE_ASSERT = 1 << 2, DEBUG_ENABLE_SAFEMODE = 1 << 3, DEBUG_ENABLE_JNI_LOGGING = 1 << 4, }; if ((debug_flags & DEBUG_ENABLE_CHECKJNI) != 0) { Runtime* runtime = Runtime::Current(); JavaVMExt* vm = runtime->GetJavaVM(); if (!vm->check_jni) { LOG(DEBUG) << "Late-enabling -Xcheck:jni"; vm->SetCheckJniEnabled(true); // There's only one thread running at this point, so only one JNIEnv to fix up. Thread::Current()->GetJniEnv()->SetCheckJniEnabled(true); } else { LOG(DEBUG) << "Not late-enabling -Xcheck:jni (already on)"; } debug_flags &= ~DEBUG_ENABLE_CHECKJNI; } if ((debug_flags & DEBUG_ENABLE_JNI_LOGGING) != 0) { gLogVerbosity.third_party_jni = true; debug_flags &= ~DEBUG_ENABLE_JNI_LOGGING; } Dbg::SetJdwpAllowed((debug_flags & DEBUG_ENABLE_DEBUGGER) != 0); if ((debug_flags & DEBUG_ENABLE_DEBUGGER) != 0) { EnableDebugger(); } debug_flags &= ~DEBUG_ENABLE_DEBUGGER; // These two are for backwards compatibility with Dalvik. debug_flags &= ~DEBUG_ENABLE_ASSERT; debug_flags &= ~DEBUG_ENABLE_SAFEMODE; if (debug_flags != 0) { LOG(ERROR) << StringPrintf("Unknown bits set in debug_flags: %#x", debug_flags); } } // Create a private mount namespace and bind mount appropriate emulated // storage for the given user. static bool MountEmulatedStorage(uid_t uid, jint mount_mode) { if (mount_mode == MOUNT_EXTERNAL_NONE) { return true; } // See storage config details at http://source.android.com/tech/storage/ userid_t user_id = multiuser_get_user_id(uid); // Create a second private mount namespace for our process if (unshare(CLONE_NEWNS) == -1) { PLOG(WARNING) << "Failed to unshare()"; return false; } // Create bind mounts to expose external storage if (mount_mode == MOUNT_EXTERNAL_MULTIUSER || mount_mode == MOUNT_EXTERNAL_MULTIUSER_ALL) { // These paths must already be created by init.rc const char* source = getenv("EMULATED_STORAGE_SOURCE"); const char* target = getenv("EMULATED_STORAGE_TARGET"); const char* legacy = getenv("EXTERNAL_STORAGE"); if (source == NULL || target == NULL || legacy == NULL) { LOG(WARNING) << "Storage environment undefined; unable to provide external storage"; return false; } // Prepare source paths // /mnt/shell/emulated/0 std::string source_user(StringPrintf("%s/%d", source, user_id)); // /storage/emulated/0 std::string target_user(StringPrintf("%s/%d", target, user_id)); if (fs_prepare_dir(source_user.c_str(), 0000, 0, 0) == -1 || fs_prepare_dir(target_user.c_str(), 0000, 0, 0) == -1) { return false; } if (mount_mode == MOUNT_EXTERNAL_MULTIUSER_ALL) { // Mount entire external storage tree for all users if (mount(source, target, NULL, MS_BIND, NULL) == -1) { PLOG(WARNING) << "Failed to mount " << source << " to " << target; return false; } } else { // Only mount user-specific external storage if (mount(source_user.c_str(), target_user.c_str(), NULL, MS_BIND, NULL) == -1) { PLOG(WARNING) << "Failed to mount " << source_user << " to " << target_user; return false; } } if (fs_prepare_dir(legacy, 0000, 0, 0) == -1) { return false; } // Finally, mount user-specific path into place for legacy users if (mount(target_user.c_str(), legacy, NULL, MS_BIND | MS_REC, NULL) == -1) { PLOG(WARNING) << "Failed to mount " << target_user << " to " << legacy; return false; } } else { LOG(WARNING) << "Mount mode " << mount_mode << " unsupported"; return false; } return true; } #if defined(__linux__) static bool NeedsNoRandomizeWorkaround() { #if !defined(__arm__) return false; #else int major; int minor; struct utsname uts; if (uname(&uts) == -1) { return false; } if (sscanf(uts.release, "%d.%d", &major, &minor) != 2) { return false; } // Kernels before 3.4.* need the workaround. return (major < 3) || ((major == 3) && (minor < 4)); #endif } #endif // Utility routine to fork zygote and specialize the child process. static pid_t ForkAndSpecializeCommon(JNIEnv* env, uid_t uid, gid_t gid, jintArray javaGids, jint debug_flags, jobjectArray javaRlimits, jlong permittedCapabilities, jlong effectiveCapabilities, jint mount_external, jstring java_se_info, jstring java_se_name, bool is_system_server) { Runtime* runtime = Runtime::Current(); CHECK(runtime->IsZygote()) << "runtime instance not started with -Xzygote"; if (!runtime->PreZygoteFork()) { LOG(FATAL) << "pre-fork heap failed"; } SetSigChldHandler(); // Grab thread before fork potentially makes Thread::pthread_key_self_ unusable. Thread* self = Thread::Current(); // dvmDumpLoaderStats("zygote"); // TODO: ? pid_t pid = fork(); if (pid == 0) { // The child process. gMallocLeakZygoteChild = 1; // Keep capabilities across UID change, unless we're staying root. if (uid != 0) { EnableKeepCapabilities(); } DropCapabilitiesBoundingSet(); if (!MountEmulatedStorage(uid, mount_external)) { PLOG(WARNING) << "Failed to mount emulated storage"; if (errno == ENOTCONN || errno == EROFS) { // When device is actively encrypting, we get ENOTCONN here // since FUSE was mounted before the framework restarted. // When encrypted device is booting, we get EROFS since // FUSE hasn't been created yet by init. // In either case, continue without external storage. } else { LOG(FATAL) << "Cannot continue without emulated storage"; } } SetGids(env, javaGids); SetRLimits(env, javaRlimits); int rc = setresgid(gid, gid, gid); if (rc == -1) { PLOG(FATAL) << "setresgid(" << gid << ") failed"; } rc = setresuid(uid, uid, uid); if (rc == -1) { PLOG(FATAL) << "setresuid(" << uid << ") failed"; } #if defined(__linux__) if (NeedsNoRandomizeWorkaround()) { // Work around ARM kernel ASLR lossage (http://b/5817320). int old_personality = personality(0xffffffff); int new_personality = personality(old_personality | ADDR_NO_RANDOMIZE); if (new_personality == -1) { PLOG(WARNING) << "personality(" << new_personality << ") failed"; } } #endif SetCapabilities(permittedCapabilities, effectiveCapabilities); SetSchedulerPolicy(); #if defined(HAVE_ANDROID_OS) { // NOLINT(whitespace/braces) const char* se_info_c_str = NULL; UniquePtr<ScopedUtfChars> se_info; if (java_se_info != NULL) { se_info.reset(new ScopedUtfChars(env, java_se_info)); se_info_c_str = se_info->c_str(); CHECK(se_info_c_str != NULL); } const char* se_name_c_str = NULL; UniquePtr<ScopedUtfChars> se_name; if (java_se_name != NULL) { se_name.reset(new ScopedUtfChars(env, java_se_name)); se_name_c_str = se_name->c_str(); CHECK(se_name_c_str != NULL); } rc = selinux_android_setcontext(uid, is_system_server, se_info_c_str, se_name_c_str); if (rc == -1) { PLOG(FATAL) << "selinux_android_setcontext(" << uid << ", " << (is_system_server ? "true" : "false") << ", " << "\"" << se_info_c_str << "\", \"" << se_name_c_str << "\") failed"; } } #else UNUSED(is_system_server); UNUSED(java_se_info); UNUSED(java_se_name); #endif // Our system thread ID, etc, has changed so reset Thread state. self->InitAfterFork(); EnableDebugFeatures(debug_flags); UnsetSigChldHandler(); runtime->DidForkFromZygote(); } else if (pid > 0) { // the parent process } return pid; } static jint Zygote_nativeForkAndSpecialize(JNIEnv* env, jclass, jint uid, jint gid, jintArray gids, jint debug_flags, jobjectArray rlimits, jint mount_external, jstring se_info, jstring se_name) { return ForkAndSpecializeCommon(env, uid, gid, gids, debug_flags, rlimits, 0, 0, mount_external, se_info, se_name, false); } static jint Zygote_nativeForkSystemServer(JNIEnv* env, jclass, uid_t uid, gid_t gid, jintArray gids, jint debug_flags, jobjectArray rlimits, jlong permittedCapabilities, jlong effectiveCapabilities) { pid_t pid = ForkAndSpecializeCommon(env, uid, gid, gids, debug_flags, rlimits, permittedCapabilities, effectiveCapabilities, MOUNT_EXTERNAL_NONE, NULL, NULL, true); if (pid > 0) { // The zygote process checks whether the child process has died or not. LOG(INFO) << "System server process " << pid << " has been created"; gSystemServerPid = pid; // There is a slight window that the system server process has crashed // but it went unnoticed because we haven't published its pid yet. So // we recheck here just to make sure that all is well. int status; if (waitpid(pid, &status, WNOHANG) == pid) { LOG(FATAL) << "System server process " << pid << " has died. Restarting Zygote!"; } } return pid; } static JNINativeMethod gMethods[] = { NATIVE_METHOD(Zygote, nativeForkAndSpecialize, "(II[II[[IILjava/lang/String;Ljava/lang/String;)I"), NATIVE_METHOD(Zygote, nativeForkSystemServer, "(II[II[[IJJ)I"), }; void register_dalvik_system_Zygote(JNIEnv* env) { REGISTER_NATIVE_METHODS("dalvik/system/Zygote"); } } // namespace art