blob: 2fbe83e867e59b0142b3b81b5ba87fb1f08e48ee [file] [log] [blame]
/*
 * Copyright (C) 2009, The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
The Android Open Source Project923bf412009-03-13 15:11:42 -070016
satoke808e432010-12-02 14:53:24 +090017#define LOG_TAG "LatinIME: dictionary.cpp"
18
Ken Wakasa77e8e812012-08-02 19:48:08 +090019#include <stdint.h>
20
21#include "bigram_dictionary.h"
Jean Chalard46a1eec2012-02-27 19:48:47 +090022#include "binary_format.h"
Ken Wakasa3b088a22012-05-16 23:05:32 +090023#include "defines.h"
The Android Open Source Project923bf412009-03-13 15:11:42 -070024#include "dictionary.h"
Satoshi Kataokae9f3e182012-08-09 23:23:08 +090025#include "dic_traverse_wrapper.h"
Satoshi Kataokadeb09872012-07-03 17:45:50 +090026#include "gesture_decoder_wrapper.h"
Ken Wakasa77e8e812012-08-02 19:48:08 +090027#include "unigram_dictionary.h"
satokd4952c82010-12-01 19:09:29 +090028
The Android Open Source Project923bf412009-03-13 15:11:42 -070029namespace latinime {
30
satok8fbd5522011-02-22 17:28:55 +090031// TODO: Change the type of all keyCodes to uint32_t
Ken Wakasae90b3332011-01-07 15:01:51 +090032Dictionary::Dictionary(void *dict, int dictSize, int mmapFd, int dictBufAdjust,
Ken Wakasa162c2112012-08-24 14:51:15 +090033 int typedLetterMultiplier, int fullWordMultiplier, int maxWordLength, int maxWords,
34 int maxPredictions)
35 : mDict(static_cast<unsigned char *>(dict)),
36 mOffsetDict((static_cast<unsigned char *>(dict)) + BinaryFormat::getHeaderSize(mDict)),
37 mDictSize(dictSize), mMmapFd(mmapFd), mDictBufAdjust(dictBufAdjust),
38 mUnigramDictionary(new UnigramDictionary(mOffsetDict, typedLetterMultiplier,
39 fullWordMultiplier, maxWordLength, maxWords, BinaryFormat::getFlags(mDict))),
40 mBigramDictionary(new BigramDictionary(mOffsetDict, maxWordLength, maxPredictions)),
41 mGestureDecoder(new GestureDecoderWrapper(maxWordLength, maxWords)) {
satok662fe692010-12-08 17:05:39 +090042 if (DEBUG_DICT) {
43 if (MAX_WORD_LENGTH_INTERNAL < maxWordLength) {
satok9fb6f472012-01-13 18:01:22 +090044 AKLOGI("Max word length (%d) is greater than %d",
satok662fe692010-12-08 17:05:39 +090045 maxWordLength, MAX_WORD_LENGTH_INTERNAL);
satok9fb6f472012-01-13 18:01:22 +090046 AKLOGI("IN NATIVE SUGGEST Version: %d", (mDict[0] & 0xFF));
satok662fe692010-12-08 17:05:39 +090047 }
satok715514d2010-12-02 20:19:59 +090048 }
The Android Open Source Project923bf412009-03-13 15:11:42 -070049}
50
satok662fe692010-12-08 17:05:39 +090051Dictionary::~Dictionary() {
satok30088252010-12-01 21:22:15 +090052 delete mUnigramDictionary;
53 delete mBigramDictionary;
Ken Wakasa8658e552012-06-30 08:53:33 +090054 delete mGestureDecoder;
The Android Open Source Project923bf412009-03-13 15:11:42 -070055}
satoke808e432010-12-02 14:53:24 +090056
Satoshi Kataoka91278112012-08-08 21:23:25 +090057int Dictionary::getSuggestions(ProximityInfo *proximityInfo, void *traverseSession,
58 int *xcoordinates, int *ycoordinates, int *times, int *pointerIds,
59 int *codes, int codesSize, int *prevWordChars,
Ken Wakasa77e8e812012-08-02 19:48:08 +090060 int prevWordLength, int commitPoint, bool isGesture,
61 bool useFullEditDistance, unsigned short *outWords,
Satoshi Kataokaf6be15c2012-08-15 16:57:32 +090062 int *frequencies, int *spaceIndices, int *outputTypes) const {
Ken Wakasa77e8e812012-08-02 19:48:08 +090063 int result = 0;
64 if (isGesture) {
Satoshi Kataokae9f3e182012-08-09 23:23:08 +090065 DicTraverseWrapper::initDicTraverseSession(
66 traverseSession, this, prevWordChars, prevWordLength);
Satoshi Kataoka91278112012-08-08 21:23:25 +090067 result = mGestureDecoder->getSuggestions(proximityInfo, traverseSession,
68 xcoordinates, ycoordinates, times, pointerIds, codes, codesSize, commitPoint,
Ken Wakasa77e8e812012-08-02 19:48:08 +090069 outWords, frequencies, spaceIndices, outputTypes);
Satoshi Kataoka586b0ca2012-08-06 11:20:54 +090070 if (DEBUG_DICT) {
71 DUMP_RESULT(outWords, frequencies, 18 /* MAX_WORDS */, MAX_WORD_LENGTH_INTERNAL);
72 }
Ken Wakasa77e8e812012-08-02 19:48:08 +090073 return result;
74 } else {
75 std::map<int, int> bigramMap;
76 uint8_t bigramFilter[BIGRAM_FILTER_BYTE_SIZE];
77 mBigramDictionary->fillBigramAddressToFrequencyMapAndFilter(prevWordChars,
78 prevWordLength, &bigramMap, bigramFilter);
79 result = mUnigramDictionary->getSuggestions(proximityInfo, xcoordinates,
80 ycoordinates, codes, codesSize, &bigramMap, bigramFilter,
81 useFullEditDistance, outWords, frequencies, outputTypes);
82 return result;
83 }
84}
85
86int Dictionary::getBigrams(const int32_t *word, int length, int *codes, int codesSize,
87 unsigned short *outWords, int *frequencies, int *outputTypes) const {
88 if (length <= 0) return 0;
89 return mBigramDictionary->getBigrams(word, length, codes, codesSize, outWords, frequencies,
90 outputTypes);
91}
92
satokb1ed1d42012-06-14 16:35:23 -070093int Dictionary::getFrequency(const int32_t *word, int length) const {
Satoshi Kataoka2f854e12012-05-29 15:58:13 +090094 return mUnigramDictionary->getFrequency(word, length);
satoke808e432010-12-02 14:53:24 +090095}
96
Tom Ouyang4d289d32012-04-26 23:50:21 -070097bool Dictionary::isValidBigram(const int32_t *word1, int length1, const int32_t *word2,
satokb1ed1d42012-06-14 16:35:23 -070098 int length2) const {
Tom Ouyang4d289d32012-04-26 23:50:21 -070099 return mBigramDictionary->isValidBigram(word1, length1, word2, length2);
100}
The Android Open Source Project923bf412009-03-13 15:11:42 -0700101} // namespace latinime