/*
 * Copyright (C) 2009 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#ifndef LATINIME_DICTIONARY_H
18#define LATINIME_DICTIONARY_H
19
Jean Chalard1ff8dc42012-05-02 16:00:24 +090020#include <map>
21
satok30088252010-12-01 21:22:15 +090022#include "bigram_dictionary.h"
satokd24df432011-07-14 15:43:42 +090023#include "char_utils.h"
satoke808e432010-12-02 14:53:24 +090024#include "defines.h"
Ken Wakasa8658e552012-06-30 08:53:33 +090025#include "incremental_decoder_interface.h"
satok8fbd5522011-02-22 17:28:55 +090026#include "proximity_info.h"
satok30088252010-12-01 21:22:15 +090027#include "unigram_dictionary.h"
satoka7e5a5a2011-12-15 16:49:12 +090028#include "words_priority_queue_pool.h"
satok30088252010-12-01 21:22:15 +090029
The Android Open Source Project923bf412009-03-13 15:11:42 -070030namespace latinime {
31
32class Dictionary {
Ken Wakasae12e9b52012-01-06 12:24:38 +090033 public:
Ken Wakasae90b3332011-01-07 15:01:51 +090034 Dictionary(void *dict, int dictSize, int mmapFd, int dictBufAdjust, int typedLetterMultipler,
Jean Chalardb7d7c5a2012-07-11 11:31:48 +090035 int fullWordMultiplier, int maxWordLength, int maxWords, int maxPredictions);
satok1147c7b2011-12-14 15:04:58 +090036
satok8fbd5522011-02-22 17:28:55 +090037 int getSuggestions(ProximityInfo *proximityInfo, int *xcoordinates, int *ycoordinates,
Satoshi Kataoka73680092012-06-25 17:44:54 +090038 int *times, int *pointerIds, int *codes, int codesSize, int *prevWordChars,
Jean Chalard05efe572012-06-27 17:31:09 +090039 int prevWordLength, int commitPoint, bool isGesture,
Satoshi Kataoka73680092012-06-25 17:44:54 +090040 bool useFullEditDistance, unsigned short *outWords,
Jean Chalard6931df92012-07-12 12:55:48 +090041 int *frequencies, int *spaceIndices, int *outputTypes) {
Satoshi Kataoka73680092012-06-25 17:44:54 +090042 int result = 0;
Satoshi Kataoka91eb4d82012-06-26 16:39:07 +090043 if (isGesture) {
44 mGestureDecoder->setPrevWord(prevWordChars, prevWordLength);
45 result = mGestureDecoder->getSuggestions(proximityInfo, xcoordinates, ycoordinates,
Jean Chalard05efe572012-06-27 17:31:09 +090046 times, pointerIds, codes, codesSize, commitPoint,
Jean Chalard6931df92012-07-12 12:55:48 +090047 outWords, frequencies, spaceIndices, outputTypes);
Satoshi Kataokadeb09872012-07-03 17:45:50 +090048 return result;
Satoshi Kataoka91eb4d82012-06-26 16:39:07 +090049 } else {
50 std::map<int, int> bigramMap;
51 uint8_t bigramFilter[BIGRAM_FILTER_BYTE_SIZE];
52 mBigramDictionary->fillBigramAddressToFrequencyMapAndFilter(prevWordChars,
53 prevWordLength, &bigramMap, bigramFilter);
54 result = mUnigramDictionary->getSuggestions(proximityInfo, xcoordinates,
55 ycoordinates, codes, codesSize, &bigramMap, bigramFilter,
Jean Chalard6931df92012-07-12 12:55:48 +090056 useFullEditDistance, outWords, frequencies, outputTypes);
Satoshi Kataokadeb09872012-07-03 17:45:50 +090057 return result;
Satoshi Kataoka91eb4d82012-06-26 16:39:07 +090058 }
satok30088252010-12-01 21:22:15 +090059 }
60
Jean Chalard522a04e2012-04-23 15:37:07 +090061 int getBigrams(const int32_t *word, int length, int *codes, int codesSize,
Jean Chalard6931df92012-07-12 12:55:48 +090062 unsigned short *outWords, int *frequencies, int *outputTypes) const {
Jean Chalard3b576312012-07-11 16:47:22 +090063 if (length <= 0) return 0;
Jean Chalard6931df92012-07-12 12:55:48 +090064 return mBigramDictionary->getBigrams(word, length, codes, codesSize, outWords, frequencies,
65 outputTypes);
satok30088252010-12-01 21:22:15 +090066 }
satok8fbd5522011-02-22 17:28:55 +090067
satokb1ed1d42012-06-14 16:35:23 -070068 int getFrequency(const int32_t *word, int length) const;
69 bool isValidBigram(const int32_t *word1, int length1, const int32_t *word2, int length2) const;
70 void *getDict() const { return (void *)mDict; }
71 int getDictSize() const { return mDictSize; }
72 int getMmapFd() const { return mMmapFd; }
73 int getDictBufAdjust() const { return mDictBufAdjust; }
The Android Open Source Project923bf412009-03-13 15:11:42 -070074 ~Dictionary();
Amith Yamasanicc3e5c72009-03-31 10:51:17 -070075
satoke808e432010-12-02 14:53:24 +090076 // public static utility methods
77 // static inline methods should be defined in the header file
satok18c28f42010-12-02 18:11:54 +090078 static int wideStrLen(unsigned short *str);
Jean Chalard581335c2011-06-17 12:45:17 +090079
Ken Wakasae12e9b52012-01-06 12:24:38 +090080 private:
satok1bc038c2012-06-14 11:25:50 -070081 DISALLOW_IMPLICIT_CONSTRUCTORS(Dictionary);
Ken Wakasae90b3332011-01-07 15:01:51 +090082 const unsigned char *mDict;
83
84 // Used only for the mmap version of dictionary loading, but we use these as dummy variables
85 // also for the malloc version.
86 const int mDictSize;
87 const int mMmapFd;
88 const int mDictBufAdjust;
89
satok1bc038c2012-06-14 11:25:50 -070090 const UnigramDictionary *mUnigramDictionary;
satokb1ed1d42012-06-14 16:35:23 -070091 const BigramDictionary *mBigramDictionary;
Ken Wakasa8658e552012-06-30 08:53:33 +090092 IncrementalDecoderInterface *mGestureDecoder;
The Android Open Source Project923bf412009-03-13 15:11:42 -070093};
94
// public static utility methods
// static inline methods should be defined in the header file
satok18c28f42010-12-02 18:11:54 +090097inline int Dictionary::wideStrLen(unsigned short *str) {
98 if (!str) return 0;
99 unsigned short *end = str;
100 while (*end)
101 end++;
102 return end - str;
103}
Ken Wakasace9e52a2011-06-18 13:09:55 +0900104} // namespace latinime
105
The Android Open Source Project923bf412009-03-13 15:11:42 -0700106#endif // LATINIME_DICTIONARY_H