Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2010 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #define LOG_TAG "Tokenizer" |
| 18 | |
Mathias Agopian | 22dbf39 | 2017-02-28 15:06:51 -0800 | [diff] [blame] | 19 | #include <utils/Tokenizer.h> |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 20 | #include <fcntl.h> |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 21 | #include <sys/stat.h> |
Steven Moreland | 066e625 | 2023-10-07 00:29:44 +0000 | [diff] [blame] | 22 | #include <log/log.h> |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 23 | |
Steven Moreland | 377adea | 2022-10-08 05:06:52 +0000 | [diff] [blame] | 24 | #ifndef DEBUG_TOKENIZER |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 25 | // Enables debug output for the tokenizer. |
| 26 | #define DEBUG_TOKENIZER 0 |
Steven Moreland | 377adea | 2022-10-08 05:06:52 +0000 | [diff] [blame] | 27 | #endif |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 28 | |
| 29 | namespace android { |
| 30 | |
// Reports whether |ch| appears in the NUL-terminated |delimiters| string.
// Because the lookup is done with strchr(), the terminating NUL counts as part
// of the string, so ch == '\0' is also reported as a delimiter.
static inline bool isDelimiter(char ch, const char* delimiters) {
    const char* const match = strchr(delimiters, ch);
    return match != nullptr;
}
| 34 | |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 35 | Tokenizer::Tokenizer(const String8& filename, FileMap* fileMap, char* buffer, |
| 36 | bool ownBuffer, size_t length) : |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 37 | mFilename(filename), mFileMap(fileMap), |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 38 | mBuffer(buffer), mOwnBuffer(ownBuffer), mLength(length), |
| 39 | mCurrent(buffer), mLineNumber(1) { |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 40 | } |
| 41 | |
| 42 | Tokenizer::~Tokenizer() { |
Narayan Kamath | 6832a7a | 2015-02-23 15:43:35 +0000 | [diff] [blame] | 43 | delete mFileMap; |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 44 | if (mOwnBuffer) { |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 45 | delete[] mBuffer; |
Jeff Brown | d36ec3a | 2010-11-19 13:13:07 -0800 | [diff] [blame] | 46 | } |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 47 | } |
| 48 | |
| 49 | status_t Tokenizer::open(const String8& filename, Tokenizer** outTokenizer) { |
Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 50 | *outTokenizer = nullptr; |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 51 | |
Elliott Hughes | 643268f | 2018-10-08 11:10:11 -0700 | [diff] [blame] | 52 | int result = OK; |
Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 53 | int fd = ::open(filename.c_str(), O_RDONLY); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 54 | if (fd < 0) { |
| 55 | result = -errno; |
Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 56 | ALOGE("Error opening file '%s': %s", filename.c_str(), strerror(errno)); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 57 | } else { |
Jeff Brown | d36ec3a | 2010-11-19 13:13:07 -0800 | [diff] [blame] | 58 | struct stat stat; |
| 59 | if (fstat(fd, &stat)) { |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 60 | result = -errno; |
Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 61 | ALOGE("Error getting size of file '%s': %s", filename.c_str(), strerror(errno)); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 62 | } else { |
| 63 | size_t length = size_t(stat.st_size); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 64 | |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 65 | FileMap* fileMap = new FileMap(); |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 66 | bool ownBuffer = false; |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 67 | char* buffer; |
Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 68 | if (fileMap->create(nullptr, fd, 0, length, true)) { |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 69 | fileMap->advise(FileMap::SEQUENTIAL); |
| 70 | buffer = static_cast<char*>(fileMap->getDataPtr()); |
| 71 | } else { |
Narayan Kamath | 6832a7a | 2015-02-23 15:43:35 +0000 | [diff] [blame] | 72 | delete fileMap; |
Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 73 | fileMap = nullptr; |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 74 | |
| 75 | // Fall back to reading into a buffer since we can't mmap files in sysfs. |
| 76 | // The length we obtained from stat is wrong too (it will always be 4096) |
| 77 | // so we must trust that read will read the entire file. |
| 78 | buffer = new char[length]; |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 79 | ownBuffer = true; |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 80 | ssize_t nrd = read(fd, buffer, length); |
| 81 | if (nrd < 0) { |
| 82 | result = -errno; |
Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 83 | ALOGE("Error reading file '%s': %s", filename.c_str(), strerror(errno)); |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 84 | delete[] buffer; |
Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 85 | buffer = nullptr; |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 86 | } else { |
| 87 | length = size_t(nrd); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 88 | } |
| 89 | } |
Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 90 | |
| 91 | if (!result) { |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 92 | *outTokenizer = new Tokenizer(filename, fileMap, buffer, ownBuffer, length); |
Jeff Brown | d36ec3a | 2010-11-19 13:13:07 -0800 | [diff] [blame] | 93 | } |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 94 | } |
| 95 | close(fd); |
| 96 | } |
| 97 | return result; |
| 98 | } |
| 99 | |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 100 | status_t Tokenizer::fromContents(const String8& filename, |
| 101 | const char* contents, Tokenizer** outTokenizer) { |
Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 102 | *outTokenizer = new Tokenizer(filename, nullptr, |
Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 103 | const_cast<char*>(contents), false, strlen(contents)); |
| 104 | return OK; |
| 105 | } |
| 106 | |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 107 | String8 Tokenizer::getLocation() const { |
| 108 | String8 result; |
Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 109 | result.appendFormat("%s:%d", mFilename.c_str(), mLineNumber); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 110 | return result; |
| 111 | } |
| 112 | |
| 113 | String8 Tokenizer::peekRemainderOfLine() const { |
| 114 | const char* end = getEnd(); |
| 115 | const char* eol = mCurrent; |
| 116 | while (eol != end) { |
| 117 | char ch = *eol; |
| 118 | if (ch == '\n') { |
| 119 | break; |
| 120 | } |
| 121 | eol += 1; |
| 122 | } |
| 123 | return String8(mCurrent, eol - mCurrent); |
| 124 | } |
| 125 | |
| 126 | String8 Tokenizer::nextToken(const char* delimiters) { |
| 127 | #if DEBUG_TOKENIZER |
Steve Block | eb09533 | 2011-12-20 16:23:08 +0000 | [diff] [blame] | 128 | ALOGD("nextToken"); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 129 | #endif |
| 130 | const char* end = getEnd(); |
| 131 | const char* tokenStart = mCurrent; |
| 132 | while (mCurrent != end) { |
| 133 | char ch = *mCurrent; |
| 134 | if (ch == '\n' || isDelimiter(ch, delimiters)) { |
| 135 | break; |
| 136 | } |
| 137 | mCurrent += 1; |
| 138 | } |
| 139 | return String8(tokenStart, mCurrent - tokenStart); |
| 140 | } |
| 141 | |
| 142 | void Tokenizer::nextLine() { |
| 143 | #if DEBUG_TOKENIZER |
Steve Block | eb09533 | 2011-12-20 16:23:08 +0000 | [diff] [blame] | 144 | ALOGD("nextLine"); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 145 | #endif |
| 146 | const char* end = getEnd(); |
| 147 | while (mCurrent != end) { |
| 148 | char ch = *(mCurrent++); |
| 149 | if (ch == '\n') { |
| 150 | mLineNumber += 1; |
| 151 | break; |
| 152 | } |
| 153 | } |
| 154 | } |
| 155 | |
| 156 | void Tokenizer::skipDelimiters(const char* delimiters) { |
| 157 | #if DEBUG_TOKENIZER |
Steve Block | eb09533 | 2011-12-20 16:23:08 +0000 | [diff] [blame] | 158 | ALOGD("skipDelimiters"); |
Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 159 | #endif |
| 160 | const char* end = getEnd(); |
| 161 | while (mCurrent != end) { |
| 162 | char ch = *mCurrent; |
| 163 | if (ch == '\n' || !isDelimiter(ch, delimiters)) { |
| 164 | break; |
| 165 | } |
| 166 | mCurrent += 1; |
| 167 | } |
| 168 | } |
| 169 | |
| 170 | } // namespace android |