| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 1 | /* | 
|  | 2 | * Copyright (C) 2010 The Android Open Source Project | 
|  | 3 | * | 
|  | 4 | * Licensed under the Apache License, Version 2.0 (the "License"); | 
|  | 5 | * you may not use this file except in compliance with the License. | 
|  | 6 | * You may obtain a copy of the License at | 
|  | 7 | * | 
|  | 8 | *      http://www.apache.org/licenses/LICENSE-2.0 | 
|  | 9 | * | 
|  | 10 | * Unless required by applicable law or agreed to in writing, software | 
|  | 11 | * distributed under the License is distributed on an "AS IS" BASIS, | 
|  | 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
|  | 13 | * See the License for the specific language governing permissions and | 
|  | 14 | * limitations under the License. | 
|  | 15 | */ | 
|  | 16 |  | 
|  | 17 | #define LOG_TAG "Tokenizer" | 
|  | 18 |  | 
| Mathias Agopian | 22dbf39 | 2017-02-28 15:06:51 -0800 | [diff] [blame] | 19 | #include <utils/Tokenizer.h> | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 20 | #include <fcntl.h> | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 21 | #include <sys/stat.h> | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 22 | #include <utils/Log.h> | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 23 |  | 
| Steven Moreland | 377adea | 2022-10-08 05:06:52 +0000 | [diff] [blame] | 24 | #ifndef DEBUG_TOKENIZER | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 25 | // Enables debug output for the tokenizer. | 
|  | 26 | #define DEBUG_TOKENIZER 0 | 
| Steven Moreland | 377adea | 2022-10-08 05:06:52 +0000 | [diff] [blame] | 27 | #endif | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 28 |  | 
|  | 29 | namespace android { | 
|  | 30 |  | 
// Returns true when `ch` occurs in the NUL-terminated set `delimiters`.
//
// The lookup is done with strchr(), which treats the terminating NUL as part
// of the searched string; consequently ch == '\0' is reported as a delimiter
// for every set, including the empty one.
static inline bool isDelimiter(char ch, const char* delimiters) {
    const char* const match = strchr(delimiters, ch);
    return match != nullptr;
}
|  | 34 |  | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 35 | Tokenizer::Tokenizer(const String8& filename, FileMap* fileMap, char* buffer, | 
|  | 36 | bool ownBuffer, size_t length) : | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 37 | mFilename(filename), mFileMap(fileMap), | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 38 | mBuffer(buffer), mOwnBuffer(ownBuffer), mLength(length), | 
|  | 39 | mCurrent(buffer), mLineNumber(1) { | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 40 | } | 
|  | 41 |  | 
|  | 42 | Tokenizer::~Tokenizer() { | 
| Narayan Kamath | 6832a7a | 2015-02-23 15:43:35 +0000 | [diff] [blame] | 43 | delete mFileMap; | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 44 | if (mOwnBuffer) { | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 45 | delete[] mBuffer; | 
| Jeff Brown | d36ec3a | 2010-11-19 13:13:07 -0800 | [diff] [blame] | 46 | } | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 47 | } | 
|  | 48 |  | 
|  | 49 | status_t Tokenizer::open(const String8& filename, Tokenizer** outTokenizer) { | 
| Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 50 | *outTokenizer = nullptr; | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 51 |  | 
| Elliott Hughes | 643268f | 2018-10-08 11:10:11 -0700 | [diff] [blame] | 52 | int result = OK; | 
| Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 53 | int fd = ::open(filename.c_str(), O_RDONLY); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 54 | if (fd < 0) { | 
|  | 55 | result = -errno; | 
| Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 56 | ALOGE("Error opening file '%s': %s", filename.c_str(), strerror(errno)); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 57 | } else { | 
| Jeff Brown | d36ec3a | 2010-11-19 13:13:07 -0800 | [diff] [blame] | 58 | struct stat stat; | 
|  | 59 | if (fstat(fd, &stat)) { | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 60 | result = -errno; | 
| Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 61 | ALOGE("Error getting size of file '%s': %s", filename.c_str(), strerror(errno)); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 62 | } else { | 
|  | 63 | size_t length = size_t(stat.st_size); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 64 |  | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 65 | FileMap* fileMap = new FileMap(); | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 66 | bool ownBuffer = false; | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 67 | char* buffer; | 
| Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 68 | if (fileMap->create(nullptr, fd, 0, length, true)) { | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 69 | fileMap->advise(FileMap::SEQUENTIAL); | 
|  | 70 | buffer = static_cast<char*>(fileMap->getDataPtr()); | 
|  | 71 | } else { | 
| Narayan Kamath | 6832a7a | 2015-02-23 15:43:35 +0000 | [diff] [blame] | 72 | delete fileMap; | 
| Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 73 | fileMap = nullptr; | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 74 |  | 
|  | 75 | // Fall back to reading into a buffer since we can't mmap files in sysfs. | 
|  | 76 | // The length we obtained from stat is wrong too (it will always be 4096) | 
|  | 77 | // so we must trust that read will read the entire file. | 
|  | 78 | buffer = new char[length]; | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 79 | ownBuffer = true; | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 80 | ssize_t nrd = read(fd, buffer, length); | 
|  | 81 | if (nrd < 0) { | 
|  | 82 | result = -errno; | 
| Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 83 | ALOGE("Error reading file '%s': %s", filename.c_str(), strerror(errno)); | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 84 | delete[] buffer; | 
| Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 85 | buffer = nullptr; | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 86 | } else { | 
|  | 87 | length = size_t(nrd); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 88 | } | 
|  | 89 | } | 
| Jeff Brown | 1d618d6 | 2010-12-02 13:50:46 -0800 | [diff] [blame] | 90 |  | 
|  | 91 | if (!result) { | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 92 | *outTokenizer = new Tokenizer(filename, fileMap, buffer, ownBuffer, length); | 
| Jeff Brown | d36ec3a | 2010-11-19 13:13:07 -0800 | [diff] [blame] | 93 | } | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 94 | } | 
|  | 95 | close(fd); | 
|  | 96 | } | 
|  | 97 | return result; | 
|  | 98 | } | 
|  | 99 |  | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 100 | status_t Tokenizer::fromContents(const String8& filename, | 
|  | 101 | const char* contents, Tokenizer** outTokenizer) { | 
| Yi Kong | e1731a4 | 2018-07-16 18:11:34 -0700 | [diff] [blame] | 102 | *outTokenizer = new Tokenizer(filename, nullptr, | 
| Jeff Brown | 2c1627d | 2012-04-17 18:19:50 -0700 | [diff] [blame] | 103 | const_cast<char*>(contents), false, strlen(contents)); | 
|  | 104 | return OK; | 
|  | 105 | } | 
|  | 106 |  | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 107 | String8 Tokenizer::getLocation() const { | 
|  | 108 | String8 result; | 
| Tomasz Wasilczyk | 18b7461 | 2023-08-10 23:29:50 +0000 | [diff] [blame] | 109 | result.appendFormat("%s:%d", mFilename.c_str(), mLineNumber); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 110 | return result; | 
|  | 111 | } | 
|  | 112 |  | 
|  | 113 | String8 Tokenizer::peekRemainderOfLine() const { | 
|  | 114 | const char* end = getEnd(); | 
|  | 115 | const char* eol = mCurrent; | 
|  | 116 | while (eol != end) { | 
|  | 117 | char ch = *eol; | 
|  | 118 | if (ch == '\n') { | 
|  | 119 | break; | 
|  | 120 | } | 
|  | 121 | eol += 1; | 
|  | 122 | } | 
|  | 123 | return String8(mCurrent, eol - mCurrent); | 
|  | 124 | } | 
|  | 125 |  | 
|  | 126 | String8 Tokenizer::nextToken(const char* delimiters) { | 
|  | 127 | #if DEBUG_TOKENIZER | 
| Steve Block | eb09533 | 2011-12-20 16:23:08 +0000 | [diff] [blame] | 128 | ALOGD("nextToken"); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 129 | #endif | 
|  | 130 | const char* end = getEnd(); | 
|  | 131 | const char* tokenStart = mCurrent; | 
|  | 132 | while (mCurrent != end) { | 
|  | 133 | char ch = *mCurrent; | 
|  | 134 | if (ch == '\n' || isDelimiter(ch, delimiters)) { | 
|  | 135 | break; | 
|  | 136 | } | 
|  | 137 | mCurrent += 1; | 
|  | 138 | } | 
|  | 139 | return String8(tokenStart, mCurrent - tokenStart); | 
|  | 140 | } | 
|  | 141 |  | 
|  | 142 | void Tokenizer::nextLine() { | 
|  | 143 | #if DEBUG_TOKENIZER | 
| Steve Block | eb09533 | 2011-12-20 16:23:08 +0000 | [diff] [blame] | 144 | ALOGD("nextLine"); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 145 | #endif | 
|  | 146 | const char* end = getEnd(); | 
|  | 147 | while (mCurrent != end) { | 
|  | 148 | char ch = *(mCurrent++); | 
|  | 149 | if (ch == '\n') { | 
|  | 150 | mLineNumber += 1; | 
|  | 151 | break; | 
|  | 152 | } | 
|  | 153 | } | 
|  | 154 | } | 
|  | 155 |  | 
|  | 156 | void Tokenizer::skipDelimiters(const char* delimiters) { | 
|  | 157 | #if DEBUG_TOKENIZER | 
| Steve Block | eb09533 | 2011-12-20 16:23:08 +0000 | [diff] [blame] | 158 | ALOGD("skipDelimiters"); | 
| Jeff Brown | 647925d | 2010-11-10 16:03:06 -0800 | [diff] [blame] | 159 | #endif | 
|  | 160 | const char* end = getEnd(); | 
|  | 161 | while (mCurrent != end) { | 
|  | 162 | char ch = *mCurrent; | 
|  | 163 | if (ch == '\n' || !isDelimiter(ch, delimiters)) { | 
|  | 164 | break; | 
|  | 165 | } | 
|  | 166 | mCurrent += 1; | 
|  | 167 | } | 
|  | 168 | } | 
|  | 169 |  | 
|  | 170 | } // namespace android |