/*
 * Copyright (C) 2015 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include <iostream>
#include <limits>
#include <string>

#include "util/Util.h"
#include "xml/XmlPullParser.h"
#include "xml/XmlUtil.h"

using ::android::InputStream;
using ::android::StringPiece;

namespace aapt {
namespace xml {

// Separator handed to XML_ParserCreateNS(). SplitName() looks for this
// character to split an expanded name into its namespace URI and local name.
constexpr char kXmlNamespaceSep = 1;

Adam Lesinskiefeb7af2017-08-02 14:57:43 -070032XmlPullParser::XmlPullParser(InputStream* in) : in_(in), empty_(), depth_(0) {
Adam Lesinskice5e56e2016-10-21 17:56:45 -070033 parser_ = XML_ParserCreateNS(nullptr, kXmlNamespaceSep);
34 XML_SetUserData(parser_, this);
35 XML_SetElementHandler(parser_, StartElementHandler, EndElementHandler);
36 XML_SetNamespaceDeclHandler(parser_, StartNamespaceHandler,
37 EndNamespaceHandler);
38 XML_SetCharacterDataHandler(parser_, CharacterDataHandler);
39 XML_SetCommentHandler(parser_, CommentDataHandler);
Ryan Mitchellcb76d732018-06-05 10:15:04 -070040 XML_SetCdataSectionHandler(parser_, StartCdataSectionHandler, EndCdataSectionHandler);
Adam Lesinskice5e56e2016-10-21 17:56:45 -070041 event_queue_.push(EventData{Event::kStartDocument, 0, depth_++});
Adam Lesinski6f6ceb72014-11-14 14:48:12 -080042}
43
Adam Lesinskiefeb7af2017-08-02 14:57:43 -070044XmlPullParser::~XmlPullParser() {
45 XML_ParserFree(parser_);
46}
Adam Lesinski6f6ceb72014-11-14 14:48:12 -080047
Adam Lesinskice5e56e2016-10-21 17:56:45 -070048XmlPullParser::Event XmlPullParser::Next() {
49 const Event currentEvent = event();
Adam Lesinskiefeb7af2017-08-02 14:57:43 -070050 if (currentEvent == Event::kBadDocument || currentEvent == Event::kEndDocument) {
Adam Lesinskice5e56e2016-10-21 17:56:45 -070051 return currentEvent;
52 }
53
54 event_queue_.pop();
55 while (event_queue_.empty()) {
Adam Lesinskiefeb7af2017-08-02 14:57:43 -070056 const char* buffer = nullptr;
57 size_t buffer_size = 0;
58 bool done = false;
59 if (!in_->Next(reinterpret_cast<const void**>(&buffer), &buffer_size)) {
60 if (in_->HadError()) {
61 error_ = in_->GetError();
62 event_queue_.push(EventData{Event::kBadDocument});
63 break;
64 }
Adam Lesinskice5e56e2016-10-21 17:56:45 -070065
Adam Lesinskiefeb7af2017-08-02 14:57:43 -070066 done = true;
Adam Lesinski6f6ceb72014-11-14 14:48:12 -080067 }
68
Adam Lesinskiefeb7af2017-08-02 14:57:43 -070069 if (XML_Parse(parser_, buffer, buffer_size, done) == XML_STATUS_ERROR) {
Adam Lesinskice5e56e2016-10-21 17:56:45 -070070 error_ = XML_ErrorString(XML_GetErrorCode(parser_));
71 event_queue_.push(EventData{Event::kBadDocument});
Adam Lesinskiefeb7af2017-08-02 14:57:43 -070072 break;
Adam Lesinski6f6ceb72014-11-14 14:48:12 -080073 }
74
Adam Lesinskice5e56e2016-10-21 17:56:45 -070075 if (done) {
76 event_queue_.push(EventData{Event::kEndDocument, 0, 0});
Adam Lesinski24aad162015-04-24 19:19:30 -070077 }
Adam Lesinskice5e56e2016-10-21 17:56:45 -070078 }
Adam Lesinski24aad162015-04-24 19:19:30 -070079
Adam Lesinskice5e56e2016-10-21 17:56:45 -070080 Event next_event = event();
Adam Lesinski6f6ceb72014-11-14 14:48:12 -080081
Adam Lesinskice5e56e2016-10-21 17:56:45 -070082 // Record namespace prefixes and package names so that we can do our own
83 // handling of references that use namespace aliases.
84 if (next_event == Event::kStartNamespace ||
85 next_event == Event::kEndNamespace) {
Ryan Mitchell4382e442021-07-14 12:53:01 -070086 std::optional<ExtractedPackage> result = ExtractPackageFromNamespace(namespace_uri());
Adam Lesinskice5e56e2016-10-21 17:56:45 -070087 if (next_event == Event::kStartNamespace) {
88 if (result) {
89 package_aliases_.emplace_back(
90 PackageDecl{namespace_prefix(), std::move(result.value())});
91 }
92 } else {
93 if (result) {
94 package_aliases_.pop_back();
95 }
Adam Lesinski6f6ceb72014-11-14 14:48:12 -080096 }
Adam Lesinskice5e56e2016-10-21 17:56:45 -070097 }
98
99 return next_event;
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800100}
101
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700102XmlPullParser::Event XmlPullParser::event() const {
103 return event_queue_.front().event;
104}
105
106const std::string& XmlPullParser::error() const { return error_; }
107
108const std::string& XmlPullParser::comment() const {
109 return event_queue_.front().data1;
110}
111
112size_t XmlPullParser::line_number() const {
113 return event_queue_.front().line_number;
114}
115
116size_t XmlPullParser::depth() const { return event_queue_.front().depth; }
117
118const std::string& XmlPullParser::text() const {
119 if (event() != Event::kText) {
120 return empty_;
121 }
122 return event_queue_.front().data1;
123}
124
125const std::string& XmlPullParser::namespace_prefix() const {
126 const Event current_event = event();
127 if (current_event != Event::kStartNamespace &&
128 current_event != Event::kEndNamespace) {
129 return empty_;
130 }
131 return event_queue_.front().data1;
132}
133
134const std::string& XmlPullParser::namespace_uri() const {
135 const Event current_event = event();
136 if (current_event != Event::kStartNamespace &&
137 current_event != Event::kEndNamespace) {
138 return empty_;
139 }
140 return event_queue_.front().data2;
141}
142
Yurii Zubrytskyia5775142022-11-02 17:49:49 -0700143std::optional<ExtractedPackage> XmlPullParser::TransformPackageAlias(StringPiece alias) const {
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700144 if (alias.empty()) {
Adam Lesinski1ef0fa92017-08-15 21:32:49 -0700145 return ExtractedPackage{{}, false /*private*/};
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700146 }
147
148 const auto end_iter = package_aliases_.rend();
149 for (auto iter = package_aliases_.rbegin(); iter != end_iter; ++iter) {
150 if (alias == iter->prefix) {
151 if (iter->package.package.empty()) {
Adam Lesinski1ef0fa92017-08-15 21:32:49 -0700152 return ExtractedPackage{{}, iter->package.private_namespace};
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700153 }
154 return iter->package;
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800155 }
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700156 }
157 return {};
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800158}
159
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700160const std::string& XmlPullParser::element_namespace() const {
161 const Event current_event = event();
162 if (current_event != Event::kStartElement &&
163 current_event != Event::kEndElement) {
164 return empty_;
165 }
166 return event_queue_.front().data1;
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800167}
168
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700169const std::string& XmlPullParser::element_name() const {
170 const Event current_event = event();
171 if (current_event != Event::kStartElement &&
172 current_event != Event::kEndElement) {
173 return empty_;
174 }
175 return event_queue_.front().data2;
Adam Lesinski24aad162015-04-24 19:19:30 -0700176}
177
Ryan Mitchell326e35ff2021-04-12 07:50:42 -0700178const std::vector<XmlPullParser::PackageDecl>& XmlPullParser::package_decls() const {
179 return package_aliases_;
180}
181
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700182XmlPullParser::const_iterator XmlPullParser::begin_attributes() const {
183 return event_queue_.front().attributes.begin();
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800184}
185
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700186XmlPullParser::const_iterator XmlPullParser::end_attributes() const {
187 return event_queue_.front().attributes.end();
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800188}
189
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700190size_t XmlPullParser::attribute_count() const {
191 if (event() != Event::kStartElement) {
192 return 0;
193 }
194 return event_queue_.front().attributes.size();
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800195}
196
197/**
198 * Extracts the namespace and name of an expanded element or attribute name.
199 */
Adam Lesinskid5083f62017-01-16 15:07:21 -0800200static void SplitName(const char* name, std::string* out_ns, std::string* out_name) {
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700201 const char* p = name;
202 while (*p != 0 && *p != kXmlNamespaceSep) {
203 p++;
204 }
205
206 if (*p == 0) {
Adam Lesinskid5083f62017-01-16 15:07:21 -0800207 out_ns->clear();
208 out_name->assign(name);
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700209 } else {
Adam Lesinskid5083f62017-01-16 15:07:21 -0800210 out_ns->assign(name, (p - name));
211 out_name->assign(p + 1);
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700212 }
213}
214
215void XMLCALL XmlPullParser::StartNamespaceHandler(void* user_data,
216 const char* prefix,
217 const char* uri) {
218 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
219 std::string namespace_uri = uri != nullptr ? uri : std::string();
220 parser->namespace_uris_.push(namespace_uri);
221 parser->event_queue_.push(
222 EventData{Event::kStartNamespace,
223 XML_GetCurrentLineNumber(parser->parser_), parser->depth_++,
224 prefix != nullptr ? prefix : std::string(), namespace_uri});
225}
226
227void XMLCALL XmlPullParser::StartElementHandler(void* user_data,
228 const char* name,
229 const char** attrs) {
230 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
231
232 EventData data = {Event::kStartElement,
233 XML_GetCurrentLineNumber(parser->parser_),
234 parser->depth_++};
Adam Lesinskid5083f62017-01-16 15:07:21 -0800235 SplitName(name, &data.data1, &data.data2);
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700236
237 while (*attrs) {
238 Attribute attribute;
Adam Lesinskid5083f62017-01-16 15:07:21 -0800239 SplitName(*attrs++, &attribute.namespace_uri, &attribute.name);
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700240 attribute.value = *attrs++;
241
242 // Insert in sorted order.
243 auto iter = std::lower_bound(data.attributes.begin(), data.attributes.end(),
244 attribute);
245 data.attributes.insert(iter, std::move(attribute));
246 }
247
248 // Move the structure into the queue (no copy).
249 parser->event_queue_.push(std::move(data));
250}
251
252void XMLCALL XmlPullParser::CharacterDataHandler(void* user_data, const char* s,
253 int len) {
254 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
255
Adam Lesinskid5083f62017-01-16 15:07:21 -0800256 parser->event_queue_.push(EventData{Event::kText, XML_GetCurrentLineNumber(parser->parser_),
257 parser->depth_, std::string(s, len)});
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700258}
259
260void XMLCALL XmlPullParser::EndElementHandler(void* user_data,
261 const char* name) {
262 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
263
264 EventData data = {Event::kEndElement,
265 XML_GetCurrentLineNumber(parser->parser_),
266 --(parser->depth_)};
Adam Lesinskid5083f62017-01-16 15:07:21 -0800267 SplitName(name, &data.data1, &data.data2);
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700268
269 // Move the data into the queue (no copy).
270 parser->event_queue_.push(std::move(data));
271}
272
273void XMLCALL XmlPullParser::EndNamespaceHandler(void* user_data,
274 const char* prefix) {
275 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
276
277 parser->event_queue_.push(
278 EventData{Event::kEndNamespace, XML_GetCurrentLineNumber(parser->parser_),
279 --(parser->depth_), prefix != nullptr ? prefix : std::string(),
280 parser->namespace_uris_.top()});
281 parser->namespace_uris_.pop();
282}
283
284void XMLCALL XmlPullParser::CommentDataHandler(void* user_data,
285 const char* comment) {
286 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
287
288 parser->event_queue_.push(EventData{Event::kComment,
289 XML_GetCurrentLineNumber(parser->parser_),
290 parser->depth_, comment});
291}
292
Ryan Mitchellcb76d732018-06-05 10:15:04 -0700293void XMLCALL XmlPullParser::StartCdataSectionHandler(void* user_data) {
294 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
295
296 parser->event_queue_.push(EventData{Event::kCdataStart,
297 XML_GetCurrentLineNumber(parser->parser_),
298 parser->depth_ });
299}
300
301void XMLCALL XmlPullParser::EndCdataSectionHandler(void* user_data) {
302 XmlPullParser* parser = reinterpret_cast<XmlPullParser*>(user_data);
303
304 parser->event_queue_.push(EventData{Event::kCdataEnd,
305 XML_GetCurrentLineNumber(parser->parser_),
306 parser->depth_ });
307}
308
Yurii Zubrytskyia5775142022-11-02 17:49:49 -0700309std::optional<StringPiece> FindAttribute(const XmlPullParser* parser, StringPiece name) {
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700310 auto iter = parser->FindAttribute("", name);
311 if (iter != parser->end_attributes()) {
312 return StringPiece(util::TrimWhitespace(iter->value));
313 }
314 return {};
315}
316
Yurii Zubrytskyia5775142022-11-02 17:49:49 -0700317std::optional<StringPiece> FindNonEmptyAttribute(const XmlPullParser* parser, StringPiece name) {
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700318 auto iter = parser->FindAttribute("", name);
319 if (iter != parser->end_attributes()) {
320 StringPiece trimmed = util::TrimWhitespace(iter->value);
321 if (!trimmed.empty()) {
322 return trimmed;
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800323 }
Adam Lesinskice5e56e2016-10-21 17:56:45 -0700324 }
325 return {};
Adam Lesinski6f6ceb72014-11-14 14:48:12 -0800326}
327
}  // namespace xml
}  // namespace aapt