blob: 8210aa0ff6d6c738b1c069671a458769be951be9 [file] [log] [blame]
/*
 * Copyright (C) 2009, The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
The Android Open Source Project923bf412009-03-13 15:11:42 -070016
satoke808e432010-12-02 14:53:24 +090017#define LOG_TAG "LatinIME: dictionary.cpp"
18
Ken Wakasa77e8e812012-08-02 19:48:08 +090019#include <stdint.h>
20
21#include "bigram_dictionary.h"
Jean Chalard46a1eec2012-02-27 19:48:47 +090022#include "binary_format.h"
Ken Wakasa3b088a22012-05-16 23:05:32 +090023#include "defines.h"
The Android Open Source Project923bf412009-03-13 15:11:42 -070024#include "dictionary.h"
Satoshi Kataokae9f3e182012-08-09 23:23:08 +090025#include "dic_traverse_wrapper.h"
Satoshi Kataokadeb09872012-07-03 17:45:50 +090026#include "gesture_decoder_wrapper.h"
Ken Wakasa77e8e812012-08-02 19:48:08 +090027#include "unigram_dictionary.h"
satokd4952c82010-12-01 19:09:29 +090028
The Android Open Source Project923bf412009-03-13 15:11:42 -070029namespace latinime {
30
Ken Wakasafe9ec6b2012-11-16 19:28:56 +090031Dictionary::Dictionary(void *dict, int dictSize, int mmapFd, int dictBufAdjust, int maxWordLength,
32 int maxWords, int maxPredictions)
Ken Wakasa162c2112012-08-24 14:51:15 +090033 : mDict(static_cast<unsigned char *>(dict)),
34 mOffsetDict((static_cast<unsigned char *>(dict)) + BinaryFormat::getHeaderSize(mDict)),
35 mDictSize(dictSize), mMmapFd(mmapFd), mDictBufAdjust(dictBufAdjust),
Ken Wakasafe9ec6b2012-11-16 19:28:56 +090036 mUnigramDictionary(new UnigramDictionary(mOffsetDict, maxWordLength, maxWords,
37 BinaryFormat::getFlags(mDict))),
Ken Wakasa162c2112012-08-24 14:51:15 +090038 mBigramDictionary(new BigramDictionary(mOffsetDict, maxWordLength, maxPredictions)),
39 mGestureDecoder(new GestureDecoderWrapper(maxWordLength, maxWords)) {
satok662fe692010-12-08 17:05:39 +090040 if (DEBUG_DICT) {
41 if (MAX_WORD_LENGTH_INTERNAL < maxWordLength) {
satok9fb6f472012-01-13 18:01:22 +090042 AKLOGI("Max word length (%d) is greater than %d",
satok662fe692010-12-08 17:05:39 +090043 maxWordLength, MAX_WORD_LENGTH_INTERNAL);
satok9fb6f472012-01-13 18:01:22 +090044 AKLOGI("IN NATIVE SUGGEST Version: %d", (mDict[0] & 0xFF));
satok662fe692010-12-08 17:05:39 +090045 }
satok715514d2010-12-02 20:19:59 +090046 }
The Android Open Source Project923bf412009-03-13 15:11:42 -070047}
48
satok662fe692010-12-08 17:05:39 +090049Dictionary::~Dictionary() {
satok30088252010-12-01 21:22:15 +090050 delete mUnigramDictionary;
51 delete mBigramDictionary;
Ken Wakasa8658e552012-06-30 08:53:33 +090052 delete mGestureDecoder;
The Android Open Source Project923bf412009-03-13 15:11:42 -070053}
satoke808e432010-12-02 14:53:24 +090054
Satoshi Kataoka91278112012-08-08 21:23:25 +090055int Dictionary::getSuggestions(ProximityInfo *proximityInfo, void *traverseSession,
Ken Wakasa1e614932012-10-29 18:06:22 +090056 int *xcoordinates, int *ycoordinates, int *times, int *pointerIds, int *codes,
57 int codesSize, int *prevWordChars, int prevWordLength, int commitPoint, bool isGesture,
58 bool useFullEditDistance, int *outWords, int *frequencies, int *spaceIndices,
59 int *outputTypes) const {
Ken Wakasa77e8e812012-08-02 19:48:08 +090060 int result = 0;
61 if (isGesture) {
Satoshi Kataokae9f3e182012-08-09 23:23:08 +090062 DicTraverseWrapper::initDicTraverseSession(
63 traverseSession, this, prevWordChars, prevWordLength);
Satoshi Kataoka91278112012-08-08 21:23:25 +090064 result = mGestureDecoder->getSuggestions(proximityInfo, traverseSession,
65 xcoordinates, ycoordinates, times, pointerIds, codes, codesSize, commitPoint,
Ken Wakasa77e8e812012-08-02 19:48:08 +090066 outWords, frequencies, spaceIndices, outputTypes);
Satoshi Kataoka586b0ca2012-08-06 11:20:54 +090067 if (DEBUG_DICT) {
68 DUMP_RESULT(outWords, frequencies, 18 /* MAX_WORDS */, MAX_WORD_LENGTH_INTERNAL);
69 }
Ken Wakasa77e8e812012-08-02 19:48:08 +090070 return result;
71 } else {
72 std::map<int, int> bigramMap;
73 uint8_t bigramFilter[BIGRAM_FILTER_BYTE_SIZE];
74 mBigramDictionary->fillBigramAddressToFrequencyMapAndFilter(prevWordChars,
75 prevWordLength, &bigramMap, bigramFilter);
76 result = mUnigramDictionary->getSuggestions(proximityInfo, xcoordinates,
77 ycoordinates, codes, codesSize, &bigramMap, bigramFilter,
78 useFullEditDistance, outWords, frequencies, outputTypes);
79 return result;
80 }
81}
82
Ken Wakasaaa5a3e82012-12-03 19:54:30 +090083int Dictionary::getBigrams(const int *word, int length, int *codes, int codesSize,
Ken Wakasa1e614932012-10-29 18:06:22 +090084 int *outWords, int *frequencies, int *outputTypes) const {
Ken Wakasa77e8e812012-08-02 19:48:08 +090085 if (length <= 0) return 0;
86 return mBigramDictionary->getBigrams(word, length, codes, codesSize, outWords, frequencies,
87 outputTypes);
88}
89
Ken Wakasaaa5a3e82012-12-03 19:54:30 +090090int Dictionary::getFrequency(const int *word, int length) const {
Satoshi Kataoka2f854e12012-05-29 15:58:13 +090091 return mUnigramDictionary->getFrequency(word, length);
satoke808e432010-12-02 14:53:24 +090092}
93
Ken Wakasaaa5a3e82012-12-03 19:54:30 +090094bool Dictionary::isValidBigram(const int *word1, int length1, const int *word2, int length2) const {
Tom Ouyang4d289d32012-04-26 23:50:21 -070095 return mBigramDictionary->isValidBigram(word1, length1, word2, length2);
96}
The Android Open Source Project923bf412009-03-13 15:11:42 -070097} // namespace latinime