/*
**
** Copyright 2010, The Android Open Source Project
**
** Licensed under the Apache License, Version 2.0 (the "License");
** you may not use this file except in compliance with the License.
** You may obtain a copy of the License at
**
**     http://www.apache.org/licenses/LICENSE-2.0
**
** Unless required by applicable law or agreed to in writing, software
** distributed under the License is distributed on an "AS IS" BASIS,
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
** See the License for the specific language governing permissions and
** limitations under the License.
*/

| 18 | #ifndef LATINIME_DEFINES_H |
| 19 | #define LATINIME_DEFINES_H |
| 20 | |
// Logging setup.
// The profiler helpers below call LOGI directly, so the logging macros have to
// be in scope before them whenever profiling or debugging is enabled. In every
// other build LOGE/LOGI expand to nothing.
#if defined(FLAG_DO_PROFILE) || defined(FLAG_DBG)
// LOG_TAG is set up ahead of the include so that the logging header sees it.
// NOTE(review): confirm how <cutils/log.h> treats an undefined LOG_TAG.
#ifndef LOG_TAG
#define LOG_TAG "LatinIME: "
#endif
#include <cutils/log.h>
#else // FLAG_DO_PROFILE || FLAG_DBG
#define LOGE(fmt, ...)
#define LOGI(fmt, ...)
#endif // FLAG_DO_PROFILE || FLAG_DBG

#ifdef FLAG_DO_PROFILE
// Profiler
// Slots 0 .. PROF_BUF_SIZE - 2 are available to callers; the last slot is used
// by PROF_OPEN / PROF_CLOSE to measure the total time.
#include <time.h>
#define PROF_BUF_SIZE 100
// Accumulated clock() ticks per slot.
static double profile_buf[PROF_BUF_SIZE];
// clock() value stored by the most recent PROF_START of each slot.
static double profile_old[PROF_BUF_SIZE];
// Number of PROF_COUNT / PROF_START invocations per slot.
static unsigned int profile_counter[PROF_BUF_SIZE];

#define PROF_RESET prof_reset()
#define PROF_COUNT(prof_buf_id) (++profile_counter[(prof_buf_id)])
#define PROF_OPEN do { PROF_RESET; PROF_START(PROF_BUF_SIZE - 1); } while (0)
#define PROF_START(prof_buf_id) do { \
        PROF_COUNT(prof_buf_id); profile_old[(prof_buf_id)] = (clock()); } while (0)
#define PROF_CLOSE do { PROF_END(PROF_BUF_SIZE - 1); PROF_OUTALL; } while (0)
#define PROF_END(prof_buf_id) \
        (profile_buf[(prof_buf_id)] += ((clock()) - profile_old[(prof_buf_id)]))
#define PROF_CLOCKOUT(prof_buf_id) \
        LOGI("%s : clock is %f", __FUNCTION__, (clock() - profile_old[(prof_buf_id)]))
// Alternate spelling; the non-profiling stubs below provide it too, so code
// using either name builds in both configurations.
#define PROF_CLOCK_OUT(prof_buf_id) PROF_CLOCKOUT(prof_buf_id)
#define PROF_OUTALL do { LOGI("--- %s ---", __FUNCTION__); prof_out(); } while (0)

// Clears every accumulated time, start stamp and call counter.
static void prof_reset(void) {
    for (int i = 0; i < PROF_BUF_SIZE; ++i) {
        profile_buf[i] = 0;
        profile_old[i] = 0;
        profile_counter[i] = 0;
    }
}

// Logs the total time held in the last slot, then one line for every other
// slot that accumulated time: its share of the summed slot time, its time in
// milliseconds and its call count.
static void prof_out(void) {
    // PROF_OPEN starts the last slot exactly once after a reset; any other
    // count means PROF_OPEN / PROF_CLOSE were not paired.
    if (profile_counter[PROF_BUF_SIZE - 1] != 1) {
        LOGI("Error: You must call PROF_OPEN before PROF_CLOSE.");
    }
    LOGI("Total time is %6.3f ms.",
            profile_buf[PROF_BUF_SIZE - 1] * 1000 / (double)CLOCKS_PER_SEC);
    double all = 0;
    for (int i = 0; i < PROF_BUF_SIZE - 1; ++i) {
        all += profile_buf[i];
    }
    // Keep the percentage computation below away from a division by zero.
    if (all == 0) all = 1;
    for (int i = 0; i < PROF_BUF_SIZE - 1; ++i) {
        if (profile_buf[i] != 0) {
            // %u: the call counter is an unsigned int.
            LOGI("(%d): Used %4.2f%%, %8.4f ms. Called %u times.",
                    i, (profile_buf[i] * 100 / all),
                    profile_buf[i] * 1000 / (double)CLOCKS_PER_SEC, profile_counter[i]);
        }
    }
}

#else // FLAG_DO_PROFILE
// Profiling disabled: every profiler macro expands to nothing.
#define PROF_BUF_SIZE 0
#define PROF_RESET
#define PROF_COUNT(prof_buf_id)
#define PROF_OPEN
#define PROF_START(prof_buf_id)
#define PROF_CLOSE
#define PROF_END(prof_buf_id)
#define PROF_CLOCK_OUT(prof_buf_id)
#define PROF_CLOCKOUT(prof_buf_id)
#define PROF_OUTALL

#endif // FLAG_DO_PROFILE

// Debug switches. They are only ever enabled in FLAG_DBG builds.
#ifdef FLAG_DBG
#define DEBUG_DICT true
#define DEBUG_DICT_FULL false
#define DEBUG_SHOW_FOUND_WORD DEBUG_DICT_FULL
#define DEBUG_NODE DEBUG_DICT_FULL
#define DEBUG_TRACE DEBUG_DICT_FULL
#define DEBUG_PROXIMITY_INFO true

#else // FLAG_DBG
#define DEBUG_DICT false
#define DEBUG_DICT_FULL false
#define DEBUG_SHOW_FOUND_WORD false
#define DEBUG_NODE false
#define DEBUG_TRACE false
#define DEBUG_PROXIMITY_INFO false

#endif // FLAG_DBG

// Largest values representable in a 16-bit unsigned / 32-bit signed integer.
// Written as plain literals so the macros are safe inside any expression.
#ifndef U_SHORT_MAX
#define U_SHORT_MAX 65535 // ((1 << 16) - 1)
#endif
#ifndef S_INT_MAX
#define S_INT_MAX 2147483647 // ((1 << 31) - 1)
#endif

// Define this to use mmap() for dictionary loading. Undefine to use malloc() instead of mmap().
// We measured and compared performance of both, and found mmap() is fairly good in terms of
// loading time, and acceptable even for several initial lookups which involve page faults.
#define USE_MMAP_FOR_DICTIONARY

// 22-bit address = ~4MB dictionary size limit, which on average would be about 200k-300k words
#define ADDRESS_MASK 0x3FFFFF

// The bit that decides if an address follows in the next 22 bits
#define FLAG_ADDRESS_MASK 0x40
// The bit that decides if this is a terminal node for a word. The node could still have children,
// if the word has other endings.
#define FLAG_TERMINAL_MASK 0x80

#define FLAG_BIGRAM_READ 0x80
#define FLAG_BIGRAM_CHILDEXIST 0x40
#define FLAG_BIGRAM_CONTINUED 0x80
#define FLAG_BIGRAM_FREQ 0x7F

#define DICTIONARY_VERSION_MIN 200
#define DICTIONARY_HEADER_SIZE 2
// Parenthesized so the negative literal stays intact inside larger expressions.
#define NOT_VALID_WORD (-99)

#define KEYCODE_SPACE ' '

// Switches for the individual kinds of correction suggestions; all enabled.
#define SUGGEST_WORDS_WITH_MISSING_CHARACTER true
#define SUGGEST_WORDS_WITH_MISSING_SPACE_CHARACTER true
#define SUGGEST_WORDS_WITH_EXCESSIVE_CHARACTER true
#define SUGGEST_WORDS_WITH_TRANSPOSED_CHARACTERS true
#define SUGGEST_WORDS_WITH_SPACE_PROXIMITY true

// The following "rate"s are used as a multiplier before dividing by 100, so they are in percent.
#define WORDS_WITH_MISSING_CHARACTER_DEMOTION_RATE 80
#define WORDS_WITH_MISSING_CHARACTER_DEMOTION_START_POS_10X 12
#define WORDS_WITH_MISSING_SPACE_CHARACTER_DEMOTION_RATE 67
#define WORDS_WITH_EXCESSIVE_CHARACTER_DEMOTION_RATE 75
#define WORDS_WITH_EXCESSIVE_CHARACTER_OUT_OF_PROXIMITY_DEMOTION_RATE 75
#define WORDS_WITH_TRANSPOSED_CHARACTERS_DEMOTION_RATE 60
#define FULL_MATCHED_WORDS_PROMOTION_RATE 120
#define WORDS_WITH_PROXIMITY_CHARACTER_DEMOTION_RATE 90

// This should be greater than or equal to MAX_WORD_LENGTH defined in BinaryDictionary.java
// This is only used for the size of array. Not to be used in c functions.
#define MAX_WORD_LENGTH_INTERNAL 48

#define MAX_DEPTH_MULTIPLIER 3

// TODO: Reduce this constant if possible; check the maximum number of umlauts in the same German
// word in the dictionary
#define DEFAULT_MAX_UMLAUT_SEARCH_DEPTH 5

// Minimum suggest depth for one word for all cases except for missing space suggestions.
#define MIN_SUGGEST_DEPTH 1
#define MIN_USER_TYPED_LENGTH_FOR_MISSING_SPACE_SUGGESTION 3
#define MIN_USER_TYPED_LENGTH_FOR_EXCESSIVE_CHARACTER_SUGGESTION 3

// The size of next letters frequency array. Zero will disable the feature.
#define NEXT_LETTERS_SIZE 0

// Yields the smaller of a and b (b when they compare equal).
// Each argument may be evaluated twice, so do not pass expressions with side
// effects such as i++ or function calls that must run only once.
#define min(a, b) ((a) < (b) ? (a) : (b))

satok | e808e43 | 2010-12-02 14:53:24 +0900 | [diff] [blame] | 174 | #endif // LATINIME_DEFINES_H |