| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 1 | /* | 
|  | 2 | * Copyright (C) 2019 The Android Open Source Project | 
|  | 3 | * | 
|  | 4 | * Licensed under the Apache License, Version 2.0 (the "License"); | 
|  | 5 | * you may not use this file except in compliance with the License. | 
|  | 6 | * You may obtain a copy of the License at | 
|  | 7 | * | 
|  | 8 | *      http://www.apache.org/licenses/LICENSE-2.0 | 
|  | 9 | * | 
|  | 10 | * Unless required by applicable law or agreed to in writing, software | 
|  | 11 | * distributed under the License is distributed on an "AS IS" BASIS, | 
|  | 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
|  | 13 | * See the License for the specific language governing permissions and | 
|  | 14 | * limitations under the License. | 
|  | 15 | */ | 
|  | 16 |  | 
|  | 17 | #include "mount_namespace.h" | 
|  | 18 |  | 
|  | 19 | #include <sys/mount.h> | 
|  | 20 |  | 
|  | 21 | #include <string> | 
|  | 22 | #include <vector> | 
|  | 23 |  | 
|  | 24 | #include <android-base/file.h> | 
|  | 25 | #include <android-base/logging.h> | 
|  | 26 | #include <android-base/properties.h> | 
| Jooyung Han | 5bb9d21 | 2019-11-25 13:50:44 +0900 | [diff] [blame] | 27 | #include <android-base/result.h> | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 28 | #include <android-base/unique_fd.h> | 
|  | 29 |  | 
|  | 30 | #include "util.h" | 
|  | 31 |  | 
|  | 32 | namespace android { | 
|  | 33 | namespace init { | 
|  | 34 | namespace { | 
|  | 35 |  | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 36 | static bool BindMount(const std::string& source, const std::string& mount_point) { | 
|  | 37 | if (mount(source.c_str(), mount_point.c_str(), nullptr, MS_BIND | MS_REC, nullptr) == -1) { | 
| Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 38 | PLOG(ERROR) << "Failed to bind mount " << source; | 
|  | 39 | return false; | 
|  | 40 | } | 
|  | 41 | return true; | 
|  | 42 | } | 
|  | 43 |  | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 44 | static bool ChangeMount(const std::string& mount_point, unsigned long mountflags) { | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 45 | if (mount(nullptr, mount_point.c_str(), nullptr, mountflags, nullptr) == -1) { | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 46 | PLOG(ERROR) << "Failed to remount " << mount_point << " as " << std::hex << mountflags; | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 47 | return false; | 
|  | 48 | } | 
|  | 49 | return true; | 
|  | 50 | } | 
|  | 51 |  | 
|  | 52 | static int OpenMountNamespace() { | 
|  | 53 | int fd = open("/proc/self/ns/mnt", O_RDONLY | O_CLOEXEC); | 
|  | 54 | if (fd < 0) { | 
|  | 55 | PLOG(ERROR) << "Cannot open fd for current mount namespace"; | 
|  | 56 | } | 
|  | 57 | return fd; | 
|  | 58 | } | 
|  | 59 |  | 
|  | 60 | static std::string GetMountNamespaceId() { | 
|  | 61 | std::string ret; | 
|  | 62 | if (!android::base::Readlink("/proc/self/ns/mnt", &ret)) { | 
|  | 63 | PLOG(ERROR) << "Failed to read namespace ID"; | 
|  | 64 | return ""; | 
|  | 65 | } | 
|  | 66 | return ret; | 
|  | 67 | } | 
|  | 68 |  | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 69 | static android::base::unique_fd bootstrap_ns_fd; | 
|  | 70 | static android::base::unique_fd default_ns_fd; | 
|  | 71 |  | 
|  | 72 | static std::string bootstrap_ns_id; | 
|  | 73 | static std::string default_ns_id; | 
|  | 74 |  | 
|  | 75 | }  // namespace | 
|  | 76 |  | 
| Jooyung Han | 566c652 | 2023-08-09 07:05:31 +0000 | [diff] [blame] | 77 | // In case we have two sets of APEXes (non-updatable, updatable), we need two separate mount | 
|  | 78 | // namespaces. | 
|  | 79 | bool NeedsTwoMountNamespaces() { | 
|  | 80 | if (IsRecoveryMode()) return false; | 
|  | 81 | // In microdroid, there's only one set of APEXes in built-in directories include block devices. | 
|  | 82 | if (IsMicrodroid()) return false; | 
|  | 83 | return true; | 
|  | 84 | } | 
|  | 85 |  | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 86 | bool SetupMountNamespaces() { | 
|  | 87 | // Set the propagation type of / as shared so that any mounting event (e.g. | 
|  | 88 | // /data) is by default visible to all processes. When private mounting is | 
|  | 89 | // needed for /foo/bar, then we will make /foo/bar as a mount point (by | 
|  | 90 | // bind-mounting by to itself) and set the propagation type of the mount | 
|  | 91 | // point to private. | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 92 | if (!ChangeMount("/", MS_SHARED | MS_REC)) return false; | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 93 |  | 
| Jiyong Park | 7b4801a | 2019-02-25 16:41:38 +0900 | [diff] [blame] | 94 | // /apex is a private mountpoint to give different sets of APEXes for | 
| Jiyong Park | dcbaf9f | 2019-02-22 22:15:25 +0900 | [diff] [blame] | 95 | // the bootstrap and default mount namespaces. The processes running with | 
|  | 96 | // the bootstrap namespace get APEXes from the read-only partition. | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 97 | if (!(ChangeMount("/apex", MS_PRIVATE))) return false; | 
| Jiyong Park | dcbaf9f | 2019-02-22 22:15:25 +0900 | [diff] [blame] | 98 |  | 
| Kiyoung Kim | 99df54b | 2019-11-22 16:14:10 +0900 | [diff] [blame] | 99 | // /linkerconfig is a private mountpoint to give a different linker configuration | 
|  | 100 | // based on the mount namespace. Subdirectory will be bind-mounted based on current mount | 
|  | 101 | // namespace | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 102 | if (!(ChangeMount("/linkerconfig", MS_PRIVATE))) return false; | 
| Kiyoung Kim | 99df54b | 2019-11-22 16:14:10 +0900 | [diff] [blame] | 103 |  | 
| Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 104 | // The two mount namespaces present challenges for scoped storage, because | 
|  | 105 | // vold, which is responsible for most of the mounting, lives in the | 
|  | 106 | // bootstrap mount namespace, whereas most other daemons and all apps live | 
|  | 107 | // in the default namespace.  Scoped storage has a need for a | 
|  | 108 | // /mnt/installer view that is a slave bind mount of /mnt/user - in other | 
|  | 109 | // words, all mounts under /mnt/user should automatically show up under | 
|  | 110 | // /mnt/installer. However, additional mounts done under /mnt/installer | 
|  | 111 | // should not propagate back to /mnt/user. In a single mount namespace | 
|  | 112 | // this is easy to achieve, by simply marking the /mnt/installer a slave | 
|  | 113 | // bind mount. Unfortunately, if /mnt/installer is only created and | 
|  | 114 | // bind mounted after the two namespaces are created below, we end up | 
|  | 115 | // with the following situation: | 
|  | 116 | // /mnt/user and /mnt/installer share the same peer group in both the | 
|  | 117 | // bootstrap and default namespaces. Marking /mnt/installer slave in either | 
|  | 118 | // namespace means that it won't propagate events to the /mnt/installer in | 
|  | 119 | // the other namespace, which is still something we require - vold is the | 
|  | 120 | // one doing the mounting under /mnt/installer, and those mounts should | 
|  | 121 | // show up in the default namespace as well. | 
|  | 122 | // | 
|  | 123 | // The simplest solution is to do the bind mount before the two namespaces | 
|  | 124 | // are created: the effect is that in both namespaces, /mnt/installer is a | 
|  | 125 | // slave to the /mnt/user mount, and at the same time /mnt/installer in the | 
|  | 126 | // bootstrap namespace shares a peer group with /mnt/installer in the | 
|  | 127 | // default namespace. | 
| Ricky Wai | a4c163d | 2020-04-21 12:16:43 +0100 | [diff] [blame] | 128 | // /mnt/androidwritable is similar to /mnt/installer but serves for | 
|  | 129 | // MOUNT_EXTERNAL_ANDROID_WRITABLE apps. | 
| Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 130 | if (!mkdir_recursive("/mnt/user", 0755)) return false; | 
|  | 131 | if (!mkdir_recursive("/mnt/installer", 0755)) return false; | 
| Ricky Wai | a4c163d | 2020-04-21 12:16:43 +0100 | [diff] [blame] | 132 | if (!mkdir_recursive("/mnt/androidwritable", 0755)) return false; | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 133 | if (!(BindMount("/mnt/user", "/mnt/installer"))) return false; | 
|  | 134 | if (!(BindMount("/mnt/user", "/mnt/androidwritable"))) return false; | 
| Ricky Wai | a4c163d | 2020-04-21 12:16:43 +0100 | [diff] [blame] | 135 | // First, make /mnt/installer and /mnt/androidwritable a slave bind mount | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 136 | if (!(ChangeMount("/mnt/installer", MS_SLAVE))) return false; | 
|  | 137 | if (!(ChangeMount("/mnt/androidwritable", MS_SLAVE))) return false; | 
| Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 138 | // Then, make it shared again - effectively creating a new peer group, that | 
|  | 139 | // will be inherited by new mount namespaces. | 
| Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 140 | if (!(ChangeMount("/mnt/installer", MS_SHARED))) return false; | 
|  | 141 | if (!(ChangeMount("/mnt/androidwritable", MS_SHARED))) return false; | 
| Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 142 |  | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 143 | bootstrap_ns_fd.reset(OpenMountNamespace()); | 
|  | 144 | bootstrap_ns_id = GetMountNamespaceId(); | 
|  | 145 |  | 
| Jiyong Park | 7b4801a | 2019-02-25 16:41:38 +0900 | [diff] [blame] | 146 | // When APEXes are updatable (e.g. not-flattened), we create separate mount | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 147 | // namespaces for processes that are started before and after the APEX is | 
| Jiyong Park | 7b4801a | 2019-02-25 16:41:38 +0900 | [diff] [blame] | 148 | // activated by apexd. In the namespace for pre-apexd processes, small | 
|  | 149 | // number of essential APEXes (e.g. com.android.runtime) are activated. | 
|  | 150 | // In the namespace for post-apexd processes, all APEXes are activated. | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 151 | bool success = true; | 
| Jooyung Han | 653b063 | 2021-07-29 17:11:23 +0900 | [diff] [blame] | 152 | if (NeedsTwoMountNamespaces()) { | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 153 | // Creating a new namespace by cloning, saving, and switching back to | 
|  | 154 | // the original namespace. | 
|  | 155 | if (unshare(CLONE_NEWNS) == -1) { | 
|  | 156 | PLOG(ERROR) << "Cannot create mount namespace"; | 
|  | 157 | return false; | 
|  | 158 | } | 
|  | 159 | default_ns_fd.reset(OpenMountNamespace()); | 
|  | 160 | default_ns_id = GetMountNamespaceId(); | 
|  | 161 |  | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 162 | if (setns(bootstrap_ns_fd.get(), CLONE_NEWNS) == -1) { | 
|  | 163 | PLOG(ERROR) << "Cannot switch back to bootstrap mount namespace"; | 
|  | 164 | return false; | 
|  | 165 | } | 
| Jooyung Han | 566c652 | 2023-08-09 07:05:31 +0000 | [diff] [blame] | 166 |  | 
|  | 167 | // Some components (e.g. servicemanager) need to access bootstrap | 
|  | 168 | // APEXes from the default mount namespace. To achieve that, we bind-mount | 
|  | 169 | // /apex to /bootstrap-apex in the bootstrap mount namespace. Since /bootstrap-apex | 
|  | 170 | // is "shared", the mounts are visible in the default mount namespace as well. | 
|  | 171 | // | 
|  | 172 | // The end result will look like: | 
|  | 173 | //   in the bootstrap mount namespace: | 
|  | 174 | //     /apex  (== /bootstrap-apex) | 
|  | 175 | //       {bootstrap APEXes from the read-only partition} | 
|  | 176 | // | 
|  | 177 | //   in the default mount namespace: | 
|  | 178 | //     /bootstrap-apex | 
|  | 179 | //       {bootstrap APEXes from the read-only partition} | 
|  | 180 | //     /apex | 
|  | 181 | //       {APEXes, can be from /data partition} | 
|  | 182 | if (!(BindMount("/bootstrap-apex", "/apex"))) return false; | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 183 | } else { | 
|  | 184 | // Otherwise, default == bootstrap | 
|  | 185 | default_ns_fd.reset(OpenMountNamespace()); | 
|  | 186 | default_ns_id = GetMountNamespaceId(); | 
|  | 187 | } | 
| Shikha Malhotra | 720694d | 2021-07-30 12:35:27 +0000 | [diff] [blame] | 188 |  | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 189 | LOG(INFO) << "SetupMountNamespaces done"; | 
|  | 190 | return success; | 
|  | 191 | } | 
|  | 192 |  | 
| Jooyung Han | 5eb441c | 2022-07-23 01:41:18 +0900 | [diff] [blame] | 193 | // Switch the mount namespace of the current process from bootstrap to default OR from default to | 
|  | 194 | // bootstrap. If the current mount namespace is neither bootstrap nor default, keep it that way. | 
| Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 195 | Result<void> SwitchToMountNamespaceIfNeeded(MountNamespace target_mount_namespace) { | 
| Jooyung Han | 918971c | 2023-06-23 14:16:31 +0900 | [diff] [blame] | 196 | if (IsRecoveryMode()) { | 
| Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 197 | // we don't have multiple namespaces in recovery mode or if apex is not updatable | 
|  | 198 | return {}; | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 199 | } | 
| Jooyung Han | 5eb441c | 2022-07-23 01:41:18 +0900 | [diff] [blame] | 200 |  | 
|  | 201 | const std::string current_namespace_id = GetMountNamespaceId(); | 
|  | 202 | MountNamespace current_mount_namespace; | 
|  | 203 | if (current_namespace_id == bootstrap_ns_id) { | 
|  | 204 | current_mount_namespace = NS_BOOTSTRAP; | 
|  | 205 | } else if (current_namespace_id == default_ns_id) { | 
|  | 206 | current_mount_namespace = NS_DEFAULT; | 
|  | 207 | } else { | 
|  | 208 | // services with `namespace mnt` start in its own mount namespace. So we need to keep it. | 
|  | 209 | return {}; | 
|  | 210 | } | 
|  | 211 |  | 
|  | 212 | // We're already in the target mount namespace. | 
|  | 213 | if (current_mount_namespace == target_mount_namespace) { | 
|  | 214 | return {}; | 
|  | 215 | } | 
|  | 216 |  | 
| Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 217 | const auto& ns_fd = target_mount_namespace == NS_BOOTSTRAP ? bootstrap_ns_fd : default_ns_fd; | 
|  | 218 | const auto& ns_name = target_mount_namespace == NS_BOOTSTRAP ? "bootstrap" : "default"; | 
| Jooyung Han | 5eb441c | 2022-07-23 01:41:18 +0900 | [diff] [blame] | 219 | if (ns_fd.get() != -1) { | 
| Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 220 | if (setns(ns_fd.get(), CLONE_NEWNS) == -1) { | 
|  | 221 | return ErrnoError() << "Failed to switch to " << ns_name << " mount namespace."; | 
| Kiyoung Kim | e4d3f21 | 2019-12-16 14:31:04 +0900 | [diff] [blame] | 222 | } | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 223 | } | 
| Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 224 | return {}; | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 225 | } | 
|  | 226 |  | 
| Kiyoung Kim | 0cbee0d | 2021-03-02 16:45:27 +0900 | [diff] [blame] | 227 | base::Result<MountNamespace> GetCurrentMountNamespace() { | 
|  | 228 | std::string current_namespace_id = GetMountNamespaceId(); | 
|  | 229 | if (current_namespace_id == "") { | 
|  | 230 | return Error() << "Failed to get current mount namespace ID"; | 
|  | 231 | } | 
|  | 232 |  | 
|  | 233 | if (current_namespace_id == bootstrap_ns_id) { | 
|  | 234 | return NS_BOOTSTRAP; | 
|  | 235 | } else if (current_namespace_id == default_ns_id) { | 
|  | 236 | return NS_DEFAULT; | 
|  | 237 | } | 
|  | 238 |  | 
|  | 239 | return Error() << "Failed to find current mount namespace"; | 
|  | 240 | } | 
|  | 241 |  | 
| Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 242 | }  // namespace init | 
|  | 243 | }  // namespace android |