Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2019 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #include "mount_namespace.h" |
| 18 | |
| 19 | #include <sys/mount.h> |
| 20 | |
| 21 | #include <string> |
| 22 | #include <vector> |
| 23 | |
| 24 | #include <android-base/file.h> |
| 25 | #include <android-base/logging.h> |
| 26 | #include <android-base/properties.h> |
Jooyung Han | 5bb9d21 | 2019-11-25 13:50:44 +0900 | [diff] [blame] | 27 | #include <android-base/result.h> |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 28 | #include <android-base/unique_fd.h> |
| 29 | |
| 30 | #include "util.h" |
| 31 | |
| 32 | namespace android { |
| 33 | namespace init { |
| 34 | namespace { |
| 35 | |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 36 | static bool BindMount(const std::string& source, const std::string& mount_point) { |
| 37 | if (mount(source.c_str(), mount_point.c_str(), nullptr, MS_BIND | MS_REC, nullptr) == -1) { |
Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 38 | PLOG(ERROR) << "Failed to bind mount " << source; |
| 39 | return false; |
| 40 | } |
| 41 | return true; |
| 42 | } |
| 43 | |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 44 | static bool ChangeMount(const std::string& mount_point, unsigned long mountflags) { |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 45 | if (mount(nullptr, mount_point.c_str(), nullptr, mountflags, nullptr) == -1) { |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 46 | PLOG(ERROR) << "Failed to remount " << mount_point << " as " << std::hex << mountflags; |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 47 | return false; |
| 48 | } |
| 49 | return true; |
| 50 | } |
| 51 | |
| 52 | static int OpenMountNamespace() { |
| 53 | int fd = open("/proc/self/ns/mnt", O_RDONLY | O_CLOEXEC); |
| 54 | if (fd < 0) { |
| 55 | PLOG(ERROR) << "Cannot open fd for current mount namespace"; |
| 56 | } |
| 57 | return fd; |
| 58 | } |
| 59 | |
| 60 | static std::string GetMountNamespaceId() { |
| 61 | std::string ret; |
| 62 | if (!android::base::Readlink("/proc/self/ns/mnt", &ret)) { |
| 63 | PLOG(ERROR) << "Failed to read namespace ID"; |
| 64 | return ""; |
| 65 | } |
| 66 | return ret; |
| 67 | } |
| 68 | |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 69 | static android::base::unique_fd bootstrap_ns_fd; |
| 70 | static android::base::unique_fd default_ns_fd; |
| 71 | |
| 72 | static std::string bootstrap_ns_id; |
| 73 | static std::string default_ns_id; |
| 74 | |
| 75 | } // namespace |
| 76 | |
Jooyung Han | 201801c | 2023-07-20 17:25:47 +0900 | [diff] [blame^] | 77 | // In case we have two sets of APEXes (non-updatable, updatable), we need two separate mount |
| 78 | // namespaces. |
| 79 | bool NeedsTwoMountNamespaces() { |
| 80 | if (IsRecoveryMode()) return false; |
| 81 | // In microdroid, there's only one set of APEXes in built-in directories include block devices. |
| 82 | if (IsMicrodroid()) return false; |
| 83 | return true; |
| 84 | } |
| 85 | |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 86 | bool SetupMountNamespaces() { |
| 87 | // Set the propagation type of / as shared so that any mounting event (e.g. |
| 88 | // /data) is by default visible to all processes. When private mounting is |
| 89 | // needed for /foo/bar, then we will make /foo/bar as a mount point (by |
| 90 | // bind-mounting by to itself) and set the propagation type of the mount |
| 91 | // point to private. |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 92 | if (!ChangeMount("/", MS_SHARED | MS_REC)) return false; |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 93 | |
Jiyong Park | 7b4801a | 2019-02-25 16:41:38 +0900 | [diff] [blame] | 94 | // /apex is a private mountpoint to give different sets of APEXes for |
Jiyong Park | dcbaf9f | 2019-02-22 22:15:25 +0900 | [diff] [blame] | 95 | // the bootstrap and default mount namespaces. The processes running with |
| 96 | // the bootstrap namespace get APEXes from the read-only partition. |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 97 | if (!(ChangeMount("/apex", MS_PRIVATE))) return false; |
Jiyong Park | dcbaf9f | 2019-02-22 22:15:25 +0900 | [diff] [blame] | 98 | |
Jooyung Han | 201801c | 2023-07-20 17:25:47 +0900 | [diff] [blame^] | 99 | // However, some components (e.g. servicemanager) need to access bootstrap |
| 100 | // APEXes from the default mount namespace. To achieve that, we bind-mount |
| 101 | // /apex with /bootstrap-apex (not private) in the bootstrap mount namespace. |
| 102 | // Bootstrap APEXes are mounted in /apex and also visible in /bootstrap-apex. |
| 103 | // In the default mount namespace, we detach /bootstrap-apex from /apex and |
| 104 | // bootstrap APEXes are still be visible in /bootstrap-apex. |
| 105 | // |
| 106 | // The end result will look like: |
| 107 | // in the bootstrap mount namespace: |
| 108 | // /apex (== /bootstrap-apex) |
| 109 | // {bootstrap APEXes from the read-only partition} |
| 110 | // |
| 111 | // in the default mount namespace: |
| 112 | // /bootstrap-apex |
| 113 | // {bootstrap APEXes from the read-only partition} |
| 114 | // /apex |
| 115 | // {APEXes, can be from /data partition} |
| 116 | if (NeedsTwoMountNamespaces()) { |
| 117 | if (!(BindMount("/bootstrap-apex", "/apex"))) return false; |
| 118 | } |
| 119 | |
Kiyoung Kim | 99df54b | 2019-11-22 16:14:10 +0900 | [diff] [blame] | 120 | // /linkerconfig is a private mountpoint to give a different linker configuration |
| 121 | // based on the mount namespace. Subdirectory will be bind-mounted based on current mount |
| 122 | // namespace |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 123 | if (!(ChangeMount("/linkerconfig", MS_PRIVATE))) return false; |
Kiyoung Kim | 99df54b | 2019-11-22 16:14:10 +0900 | [diff] [blame] | 124 | |
Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 125 | // The two mount namespaces present challenges for scoped storage, because |
| 126 | // vold, which is responsible for most of the mounting, lives in the |
| 127 | // bootstrap mount namespace, whereas most other daemons and all apps live |
| 128 | // in the default namespace. Scoped storage has a need for a |
| 129 | // /mnt/installer view that is a slave bind mount of /mnt/user - in other |
| 130 | // words, all mounts under /mnt/user should automatically show up under |
| 131 | // /mnt/installer. However, additional mounts done under /mnt/installer |
| 132 | // should not propagate back to /mnt/user. In a single mount namespace |
| 133 | // this is easy to achieve, by simply marking the /mnt/installer a slave |
| 134 | // bind mount. Unfortunately, if /mnt/installer is only created and |
| 135 | // bind mounted after the two namespaces are created below, we end up |
| 136 | // with the following situation: |
| 137 | // /mnt/user and /mnt/installer share the same peer group in both the |
| 138 | // bootstrap and default namespaces. Marking /mnt/installer slave in either |
| 139 | // namespace means that it won't propagate events to the /mnt/installer in |
| 140 | // the other namespace, which is still something we require - vold is the |
| 141 | // one doing the mounting under /mnt/installer, and those mounts should |
| 142 | // show up in the default namespace as well. |
| 143 | // |
| 144 | // The simplest solution is to do the bind mount before the two namespaces |
| 145 | // are created: the effect is that in both namespaces, /mnt/installer is a |
| 146 | // slave to the /mnt/user mount, and at the same time /mnt/installer in the |
| 147 | // bootstrap namespace shares a peer group with /mnt/installer in the |
| 148 | // default namespace. |
Ricky Wai | a4c163d | 2020-04-21 12:16:43 +0100 | [diff] [blame] | 149 | // /mnt/androidwritable is similar to /mnt/installer but serves for |
| 150 | // MOUNT_EXTERNAL_ANDROID_WRITABLE apps. |
Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 151 | if (!mkdir_recursive("/mnt/user", 0755)) return false; |
| 152 | if (!mkdir_recursive("/mnt/installer", 0755)) return false; |
Ricky Wai | a4c163d | 2020-04-21 12:16:43 +0100 | [diff] [blame] | 153 | if (!mkdir_recursive("/mnt/androidwritable", 0755)) return false; |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 154 | if (!(BindMount("/mnt/user", "/mnt/installer"))) return false; |
| 155 | if (!(BindMount("/mnt/user", "/mnt/androidwritable"))) return false; |
Ricky Wai | a4c163d | 2020-04-21 12:16:43 +0100 | [diff] [blame] | 156 | // First, make /mnt/installer and /mnt/androidwritable a slave bind mount |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 157 | if (!(ChangeMount("/mnt/installer", MS_SLAVE))) return false; |
| 158 | if (!(ChangeMount("/mnt/androidwritable", MS_SLAVE))) return false; |
Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 159 | // Then, make it shared again - effectively creating a new peer group, that |
| 160 | // will be inherited by new mount namespaces. |
Elliott Hughes | e79b8c2 | 2020-07-28 11:09:03 -0700 | [diff] [blame] | 161 | if (!(ChangeMount("/mnt/installer", MS_SHARED))) return false; |
| 162 | if (!(ChangeMount("/mnt/androidwritable", MS_SHARED))) return false; |
Martijn Coenen | c70c066 | 2020-01-10 15:42:15 +0100 | [diff] [blame] | 163 | |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 164 | bootstrap_ns_fd.reset(OpenMountNamespace()); |
| 165 | bootstrap_ns_id = GetMountNamespaceId(); |
| 166 | |
Jiyong Park | 7b4801a | 2019-02-25 16:41:38 +0900 | [diff] [blame] | 167 | // When APEXes are updatable (e.g. not-flattened), we create separate mount |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 168 | // namespaces for processes that are started before and after the APEX is |
Jiyong Park | 7b4801a | 2019-02-25 16:41:38 +0900 | [diff] [blame] | 169 | // activated by apexd. In the namespace for pre-apexd processes, small |
| 170 | // number of essential APEXes (e.g. com.android.runtime) are activated. |
| 171 | // In the namespace for post-apexd processes, all APEXes are activated. |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 172 | bool success = true; |
Jooyung Han | 653b063 | 2021-07-29 17:11:23 +0900 | [diff] [blame] | 173 | if (NeedsTwoMountNamespaces()) { |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 174 | // Creating a new namespace by cloning, saving, and switching back to |
| 175 | // the original namespace. |
| 176 | if (unshare(CLONE_NEWNS) == -1) { |
| 177 | PLOG(ERROR) << "Cannot create mount namespace"; |
| 178 | return false; |
| 179 | } |
| 180 | default_ns_fd.reset(OpenMountNamespace()); |
| 181 | default_ns_id = GetMountNamespaceId(); |
| 182 | |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 183 | if (setns(bootstrap_ns_fd.get(), CLONE_NEWNS) == -1) { |
| 184 | PLOG(ERROR) << "Cannot switch back to bootstrap mount namespace"; |
| 185 | return false; |
| 186 | } |
| 187 | } else { |
| 188 | // Otherwise, default == bootstrap |
| 189 | default_ns_fd.reset(OpenMountNamespace()); |
| 190 | default_ns_id = GetMountNamespaceId(); |
| 191 | } |
Shikha Malhotra | 720694d | 2021-07-30 12:35:27 +0000 | [diff] [blame] | 192 | |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 193 | LOG(INFO) << "SetupMountNamespaces done"; |
| 194 | return success; |
| 195 | } |
| 196 | |
Jooyung Han | 5eb441c | 2022-07-23 01:41:18 +0900 | [diff] [blame] | 197 | // Switch the mount namespace of the current process from bootstrap to default OR from default to |
| 198 | // bootstrap. If the current mount namespace is neither bootstrap nor default, keep it that way. |
Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 199 | Result<void> SwitchToMountNamespaceIfNeeded(MountNamespace target_mount_namespace) { |
Jooyung Han | 918971c | 2023-06-23 14:16:31 +0900 | [diff] [blame] | 200 | if (IsRecoveryMode()) { |
Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 201 | // we don't have multiple namespaces in recovery mode or if apex is not updatable |
| 202 | return {}; |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 203 | } |
Jooyung Han | 5eb441c | 2022-07-23 01:41:18 +0900 | [diff] [blame] | 204 | |
| 205 | const std::string current_namespace_id = GetMountNamespaceId(); |
| 206 | MountNamespace current_mount_namespace; |
| 207 | if (current_namespace_id == bootstrap_ns_id) { |
| 208 | current_mount_namespace = NS_BOOTSTRAP; |
| 209 | } else if (current_namespace_id == default_ns_id) { |
| 210 | current_mount_namespace = NS_DEFAULT; |
| 211 | } else { |
| 212 | // services with `namespace mnt` start in its own mount namespace. So we need to keep it. |
| 213 | return {}; |
| 214 | } |
| 215 | |
| 216 | // We're already in the target mount namespace. |
| 217 | if (current_mount_namespace == target_mount_namespace) { |
| 218 | return {}; |
| 219 | } |
| 220 | |
Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 221 | const auto& ns_fd = target_mount_namespace == NS_BOOTSTRAP ? bootstrap_ns_fd : default_ns_fd; |
| 222 | const auto& ns_name = target_mount_namespace == NS_BOOTSTRAP ? "bootstrap" : "default"; |
Jooyung Han | 5eb441c | 2022-07-23 01:41:18 +0900 | [diff] [blame] | 223 | if (ns_fd.get() != -1) { |
Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 224 | if (setns(ns_fd.get(), CLONE_NEWNS) == -1) { |
| 225 | return ErrnoError() << "Failed to switch to " << ns_name << " mount namespace."; |
Kiyoung Kim | e4d3f21 | 2019-12-16 14:31:04 +0900 | [diff] [blame] | 226 | } |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 227 | } |
Jooyung Han | 4f23d5a | 2020-06-09 13:44:17 +0900 | [diff] [blame] | 228 | return {}; |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 229 | } |
| 230 | |
Kiyoung Kim | 0cbee0d | 2021-03-02 16:45:27 +0900 | [diff] [blame] | 231 | base::Result<MountNamespace> GetCurrentMountNamespace() { |
| 232 | std::string current_namespace_id = GetMountNamespaceId(); |
| 233 | if (current_namespace_id == "") { |
| 234 | return Error() << "Failed to get current mount namespace ID"; |
| 235 | } |
| 236 | |
| 237 | if (current_namespace_id == bootstrap_ns_id) { |
| 238 | return NS_BOOTSTRAP; |
| 239 | } else if (current_namespace_id == default_ns_id) { |
| 240 | return NS_DEFAULT; |
| 241 | } |
| 242 | |
| 243 | return Error() << "Failed to find current mount namespace"; |
| 244 | } |
| 245 | |
Jiyong Park | 6866041 | 2019-01-16 23:00:59 +0900 | [diff] [blame] | 246 | } // namespace init |
| 247 | } // namespace android |