| Index: third_party/prediction/suggest/policyimpl/dictionary/structure/pt_common/patricia_trie_reading_utils.h
|
| diff --git a/third_party/prediction/suggest/policyimpl/dictionary/structure/pt_common/patricia_trie_reading_utils.h b/third_party/prediction/suggest/policyimpl/dictionary/structure/pt_common/patricia_trie_reading_utils.h
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..81286e098cd6c6c3523501243d72302acafb99e3
|
| --- /dev/null
|
| +++ b/third_party/prediction/suggest/policyimpl/dictionary/structure/pt_common/patricia_trie_reading_utils.h
|
| @@ -0,0 +1,154 @@
|
| +/*
|
| + * Copyright (C) 2013, The Android Open Source Project
|
| + *
|
| + * Licensed under the Apache License, Version 2.0 (the "License");
|
| + * you may not use this file except in compliance with the License.
|
| + * You may obtain a copy of the License at
|
| + *
|
| + * http://www.apache.org/licenses/LICENSE-2.0
|
| + *
|
| + * Unless required by applicable law or agreed to in writing, software
|
| + * distributed under the License is distributed on an "AS IS" BASIS,
|
| + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
| + * See the License for the specific language governing permissions and
|
| + * limitations under the License.
|
| + */
|
| +
|
| +#ifndef LATINIME_PATRICIA_TRIE_READING_UTILS_H
|
| +#define LATINIME_PATRICIA_TRIE_READING_UTILS_H
|
| +
|
| +#include <cstdint>
|
| +
|
| +#include "third_party/prediction/defines.h"
|
| +
|
| +namespace latinime {
|
| +
|
| +class DictionaryShortcutsStructurePolicy;
|
| +class DictionaryBigramsStructurePolicy;
|
| +
|
| +class PatriciaTrieReadingUtils {
|
| + public:
|
| + typedef uint8_t NodeFlags;
|
| +
|
| + static int getPtNodeArraySizeAndAdvancePosition(const uint8_t* const buffer,
|
| + int* const pos);
|
| +
|
| + static NodeFlags getFlagsAndAdvancePosition(const uint8_t* const buffer,
|
| + int* const pos);
|
| +
|
| + static int getCodePointAndAdvancePosition(const uint8_t* const buffer,
|
| + int* const pos);
|
| +
|
| + // Returns the number of read characters.
|
| + static int getCharsAndAdvancePosition(const uint8_t* const buffer,
|
| + const NodeFlags flags,
|
| + const int maxLength,
|
| + int* const outBuffer,
|
| + int* const pos);
|
| +
|
| + // Returns the number of skipped characters.
|
| + static int skipCharacters(const uint8_t* const buffer,
|
| + const NodeFlags flags,
|
| + const int maxLength,
|
| + int* const pos);
|
| +
|
| + static int readProbabilityAndAdvancePosition(const uint8_t* const buffer,
|
| + int* const pos);
|
| +
|
| + static int readChildrenPositionAndAdvancePosition(const uint8_t* const buffer,
|
| + const NodeFlags flags,
|
| + int* const pos);
|
| +
|
| + /**
|
| + * Node Flags
|
| + */
|
| + static AK_FORCE_INLINE bool isBlacklisted(const NodeFlags flags) {
|
| + return (flags & FLAG_IS_BLACKLISTED) != 0;
|
| + }
|
| +
|
| + static AK_FORCE_INLINE bool isNotAWord(const NodeFlags flags) {
|
| + return (flags & FLAG_IS_NOT_A_WORD) != 0;
|
| + }
|
| +
|
| + static AK_FORCE_INLINE bool isTerminal(const NodeFlags flags) {
|
| + return (flags & FLAG_IS_TERMINAL) != 0;
|
| + }
|
| +
|
| + static AK_FORCE_INLINE bool hasShortcutTargets(const NodeFlags flags) {
|
| + return (flags & FLAG_HAS_SHORTCUT_TARGETS) != 0;
|
| + }
|
| +
|
| + static AK_FORCE_INLINE bool hasBigrams(const NodeFlags flags) {
|
| + return (flags & FLAG_HAS_BIGRAMS) != 0;
|
| + }
|
| +
|
| + static AK_FORCE_INLINE bool hasMultipleChars(const NodeFlags flags) {
|
| + return (flags & FLAG_HAS_MULTIPLE_CHARS) != 0;
|
| + }
|
| +
|
| + static AK_FORCE_INLINE bool hasChildrenInFlags(const NodeFlags flags) {
|
| + return FLAG_CHILDREN_POSITION_TYPE_NOPOSITION !=
|
| + (MASK_CHILDREN_POSITION_TYPE & flags);
|
| + }
|
| +
|
| + static AK_FORCE_INLINE NodeFlags
|
| + createAndGetFlags(const bool isBlacklisted,
|
| + const bool isNotAWord,
|
| + const bool isTerminal,
|
| + const bool hasShortcutTargets,
|
| + const bool hasBigrams,
|
| + const bool hasMultipleChars,
|
| + const int childrenPositionFieldSize) {
|
| + NodeFlags nodeFlags = 0;
|
| + nodeFlags = isBlacklisted ? (nodeFlags | FLAG_IS_BLACKLISTED) : nodeFlags;
|
| + nodeFlags = isNotAWord ? (nodeFlags | FLAG_IS_NOT_A_WORD) : nodeFlags;
|
| + nodeFlags = isTerminal ? (nodeFlags | FLAG_IS_TERMINAL) : nodeFlags;
|
| + nodeFlags = hasShortcutTargets ? (nodeFlags | FLAG_HAS_SHORTCUT_TARGETS)
|
| + : nodeFlags;
|
| + nodeFlags = hasBigrams ? (nodeFlags | FLAG_HAS_BIGRAMS) : nodeFlags;
|
| + nodeFlags =
|
| + hasMultipleChars ? (nodeFlags | FLAG_HAS_MULTIPLE_CHARS) : nodeFlags;
|
| + if (childrenPositionFieldSize == 1) {
|
| + nodeFlags |= FLAG_CHILDREN_POSITION_TYPE_ONEBYTE;
|
| + } else if (childrenPositionFieldSize == 2) {
|
| + nodeFlags |= FLAG_CHILDREN_POSITION_TYPE_TWOBYTES;
|
| + } else if (childrenPositionFieldSize == 3) {
|
| + nodeFlags |= FLAG_CHILDREN_POSITION_TYPE_THREEBYTES;
|
| + } else {
|
| + nodeFlags |= FLAG_CHILDREN_POSITION_TYPE_NOPOSITION;
|
| + }
|
| + return nodeFlags;
|
| + }
|
| +
|
| + static void readPtNodeInfo(
|
| + const uint8_t* const dictBuf,
|
| + const int ptNodePos,
|
| + const DictionaryShortcutsStructurePolicy* const shortcutPolicy,
|
| + const DictionaryBigramsStructurePolicy* const bigramPolicy,
|
| + NodeFlags* const outFlags,
|
| + int* const outCodePointCount,
|
| + int* const outCodePoint,
|
| + int* const outProbability,
|
| + int* const outChildrenPos,
|
| + int* const outShortcutPos,
|
| + int* const outBigramPos,
|
| + int* const outSiblingPos);
|
| +
|
| + private:
|
| + DISALLOW_IMPLICIT_CONSTRUCTORS(PatriciaTrieReadingUtils);
|
| +
|
| + static const NodeFlags MASK_CHILDREN_POSITION_TYPE;
|
| + static const NodeFlags FLAG_CHILDREN_POSITION_TYPE_NOPOSITION;
|
| + static const NodeFlags FLAG_CHILDREN_POSITION_TYPE_ONEBYTE;
|
| + static const NodeFlags FLAG_CHILDREN_POSITION_TYPE_TWOBYTES;
|
| + static const NodeFlags FLAG_CHILDREN_POSITION_TYPE_THREEBYTES;
|
| +
|
| + static const NodeFlags FLAG_HAS_MULTIPLE_CHARS;
|
| + static const NodeFlags FLAG_IS_TERMINAL;
|
| + static const NodeFlags FLAG_HAS_SHORTCUT_TARGETS;
|
| + static const NodeFlags FLAG_HAS_BIGRAMS;
|
| + static const NodeFlags FLAG_IS_NOT_A_WORD;
|
| + static const NodeFlags FLAG_IS_BLACKLISTED;
|
| +};
|
| +} // namespace latinime
|
| +#endif /* LATINIME_PATRICIA_TRIE_NODE_READING_UTILS_H */
|
|
|