Index: third_party/android_prediction/suggest/policyimpl/dictionary/structure/v4/ver4_dict_buffers.cpp |
diff --git a/third_party/android_prediction/suggest/policyimpl/dictionary/structure/v4/ver4_dict_buffers.cpp b/third_party/android_prediction/suggest/policyimpl/dictionary/structure/v4/ver4_dict_buffers.cpp |
new file mode 100644 |
index 0000000000000000000000000000000000000000..d62b04fd039cb9ece4d4e4b8f6487f342d2aaee6 |
--- /dev/null |
+++ b/third_party/android_prediction/suggest/policyimpl/dictionary/structure/v4/ver4_dict_buffers.cpp |
@@ -0,0 +1,214 @@ |
+/* |
+ * Copyright (C) 2013 The Android Open Source Project |
+ * |
+ * Licensed under the Apache License, Version 2.0 (the "License"); |
+ * you may not use this file except in compliance with the License. |
+ * You may obtain a copy of the License at |
+ * |
+ * http://www.apache.org/licenses/LICENSE-2.0 |
+ * |
+ * Unless required by applicable law or agreed to in writing, software |
+ * distributed under the License is distributed on an "AS IS" BASIS, |
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
+ * See the License for the specific language governing permissions and |
+ * limitations under the License. |
+ */ |
+ |
+#include "third_party/android_prediction/suggest/policyimpl/dictionary/structure/v4/ver4_dict_buffers.h" |
+ |
+#include <cerrno> |
+#include <cstring> |
+#include <fcntl.h> |
+#include <sys/stat.h> |
+#include <sys/types.h> |
+#include <vector> |
+ |
+#include "third_party/android_prediction/suggest/policyimpl/dictionary/utils/byte_array_utils.h" |
+#include "third_party/android_prediction/suggest/policyimpl/dictionary/utils/dict_file_writing_utils.h" |
+#include "third_party/android_prediction/suggest/policyimpl/dictionary/utils/file_utils.h" |
+#include "third_party/android_prediction/utils/byte_array_view.h" |
+ |
+namespace latinime { |
+ |
+/* static */ Ver4DictBuffers::Ver4DictBuffersPtr Ver4DictBuffers::openVer4DictBuffers( |
+ const char *const dictPath, MmappedBuffer::MmappedBufferPtr &&headerBuffer, |
+ const FormatUtils::FORMAT_VERSION formatVersion) { |
+ if (!headerBuffer) { |
+ ASSERT(false); |
+ AKLOGE("The header buffer must be valid to open ver4 dict buffers."); |
+ return Ver4DictBuffersPtr(nullptr); |
+ } |
+ // TODO: take only dictDirPath, and open both header and trie files in the constructor below |
+ const bool isUpdatable = headerBuffer->isUpdatable(); |
+ MmappedBuffer::MmappedBufferPtr bodyBuffer = MmappedBuffer::openBuffer(dictPath, |
+ Ver4DictConstants::BODY_FILE_EXTENSION, isUpdatable); |
+ if (!bodyBuffer) { |
+ return Ver4DictBuffersPtr(nullptr); |
+ } |
+ std::vector<uint8_t *> buffers; |
+ std::vector<int> bufferSizes; |
+ const ReadWriteByteArrayView buffer = bodyBuffer->getReadWriteByteArrayView(); |
+ int position = 0; |
+ while (position < static_cast<int>(buffer.size())) { |
+ const int bufferSize = ByteArrayUtils::readUint32AndAdvancePosition( |
+ buffer.data(), &position); |
+ const ReadWriteByteArrayView subBuffer = buffer.subView(position, bufferSize); |
+ buffers.push_back(subBuffer.data()); |
+ bufferSizes.push_back(subBuffer.size()); |
+ position += bufferSize; |
+ if (bufferSize < 0 || position < 0 || position > static_cast<int>(buffer.size())) { |
+ AKLOGE("The dict body file is corrupted."); |
+ return Ver4DictBuffersPtr(nullptr); |
+ } |
+ } |
+ if (buffers.size() != Ver4DictConstants::NUM_OF_CONTENT_BUFFERS_IN_BODY_FILE) { |
+ AKLOGE("The dict body file is corrupted."); |
+ return Ver4DictBuffersPtr(nullptr); |
+ } |
+ return Ver4DictBuffersPtr(new Ver4DictBuffers(std::move(headerBuffer), std::move(bodyBuffer), |
+ formatVersion, buffers, bufferSizes)); |
+} |
+ |
+bool Ver4DictBuffers::flushHeaderAndDictBuffers(const char *const dictDirPath, |
+ const BufferWithExtendableBuffer *const headerBuffer) const { |
+ // Create temporary directory. |
+ const int tmpDirPathBufSize = FileUtils::getFilePathWithSuffixBufSize(dictDirPath, |
+ DictFileWritingUtils::TEMP_FILE_SUFFIX_FOR_WRITING_DICT_FILE); |
+ char tmpDirPath[tmpDirPathBufSize]; |
+ FileUtils::getFilePathWithSuffix(dictDirPath, |
+ DictFileWritingUtils::TEMP_FILE_SUFFIX_FOR_WRITING_DICT_FILE, tmpDirPathBufSize, |
+ tmpDirPath); |
+ if (FileUtils::existsDir(tmpDirPath)) { |
+ if (!FileUtils::removeDirAndFiles(tmpDirPath)) { |
+ AKLOGE("Existing directory %s cannot be removed.", tmpDirPath); |
+ ASSERT(false); |
+ return false; |
+ } |
+ } |
+ umask(S_IWGRP | S_IWOTH); |
+ if (mkdir(tmpDirPath, S_IRWXU) == -1) { |
+ AKLOGE("Cannot create directory: %s. errno: %d.", tmpDirPath, errno); |
+ return false; |
+ } |
+ // Get dictionary base path. |
+ const int dictNameBufSize = strlen(dictDirPath) + 1 /* terminator */; |
+ char dictName[dictNameBufSize]; |
+ FileUtils::getBasename(dictDirPath, dictNameBufSize, dictName); |
+ const int dictPathBufSize = FileUtils::getFilePathBufSize(tmpDirPath, dictName); |
+ char dictPath[dictPathBufSize]; |
+ FileUtils::getFilePath(tmpDirPath, dictName, dictPathBufSize, dictPath); |
+ |
+ // Write header file. |
+ if (!DictFileWritingUtils::flushBufferToFileWithSuffix(dictPath, |
+ Ver4DictConstants::HEADER_FILE_EXTENSION, headerBuffer)) { |
+ AKLOGE("Dictionary header file %s%s cannot be written.", tmpDirPath, |
+ Ver4DictConstants::HEADER_FILE_EXTENSION); |
+ return false; |
+ } |
+ |
+ // Write body file. |
+ const int bodyFilePathBufSize = FileUtils::getFilePathWithSuffixBufSize(dictPath, |
+ Ver4DictConstants::BODY_FILE_EXTENSION); |
+ char bodyFilePath[bodyFilePathBufSize]; |
+ FileUtils::getFilePathWithSuffix(dictPath, Ver4DictConstants::BODY_FILE_EXTENSION, |
+ bodyFilePathBufSize, bodyFilePath); |
+ |
+ const int fd = open(bodyFilePath, O_WRONLY | O_CREAT | O_EXCL, S_IRUSR | S_IWUSR); |
+ if (fd == -1) { |
+ AKLOGE("File %s cannot be opened. errno: %d", bodyFilePath, errno); |
+ ASSERT(false); |
+ return false; |
+ } |
+ FILE *const file = fdopen(fd, "wb"); |
+ if (!file) { |
+ AKLOGE("fdopen failed for the file %s. errno: %d", bodyFilePath, errno); |
+ ASSERT(false); |
+ return false; |
+ } |
+ |
+ if (!flushDictBuffers(file)) { |
+ fclose(file); |
+ return false; |
+ } |
+ fclose(file); |
+ // Remove existing dictionary. |
+ if (!FileUtils::removeDirAndFiles(dictDirPath)) { |
+ AKLOGE("Existing directory %s cannot be removed.", dictDirPath); |
+ ASSERT(false); |
+ return false; |
+ } |
+ // Rename temporary directory. |
+ if (rename(tmpDirPath, dictDirPath) != 0) { |
+ AKLOGE("%s cannot be renamed to %s", tmpDirPath, dictDirPath); |
+ ASSERT(false); |
+ return false; |
+ } |
+ return true; |
+} |
+ |
+bool Ver4DictBuffers::flushDictBuffers(FILE *const file) const { |
+ // Write trie. |
+ if (!DictFileWritingUtils::writeBufferToFileTail(file, &mExpandableTrieBuffer)) { |
+ AKLOGE("Trie cannot be written."); |
+ return false; |
+ } |
+ // Write terminal position lookup table. |
+ if (!mTerminalPositionLookupTable.flushToFile(file)) { |
+ AKLOGE("Terminal position lookup table cannot be written."); |
+ return false; |
+ } |
+ // Write language model content. |
+ if (!mLanguageModelDictContent.save(file)) { |
+ AKLOGE("Language model dict content cannot be written."); |
+ return false; |
+ } |
+ // Write bigram dict content. |
+ if (!mBigramDictContent.flushToFile(file)) { |
+ AKLOGE("Bigram dict content cannot be written."); |
+ return false; |
+ } |
+ // Write shortcut dict content. |
+ if (!mShortcutDictContent.flushToFile(file)) { |
+ AKLOGE("Shortcut dict content cannot be written."); |
+ return false; |
+ } |
+ return true; |
+} |
+ |
+Ver4DictBuffers::Ver4DictBuffers(MmappedBuffer::MmappedBufferPtr &&headerBuffer, |
+ MmappedBuffer::MmappedBufferPtr &&bodyBuffer, |
+ const FormatUtils::FORMAT_VERSION formatVersion, |
+ const std::vector<uint8_t *> &contentBuffers, const std::vector<int> &contentBufferSizes) |
+ : mHeaderBuffer(std::move(headerBuffer)), mDictBuffer(std::move(bodyBuffer)), |
+ mHeaderPolicy(mHeaderBuffer->getReadOnlyByteArrayView().data(), formatVersion), |
+ mExpandableHeaderBuffer(mHeaderBuffer->getReadWriteByteArrayView(), |
+ BufferWithExtendableBuffer::DEFAULT_MAX_ADDITIONAL_BUFFER_SIZE), |
+ mExpandableTrieBuffer( |
+ ReadWriteByteArrayView(contentBuffers[Ver4DictConstants::TRIE_BUFFER_INDEX], |
+ contentBufferSizes[Ver4DictConstants::TRIE_BUFFER_INDEX]), |
+ BufferWithExtendableBuffer::DEFAULT_MAX_ADDITIONAL_BUFFER_SIZE), |
+ mTerminalPositionLookupTable( |
+ contentBuffers[Ver4DictConstants::TERMINAL_ADDRESS_LOOKUP_TABLE_BUFFER_INDEX], |
+ contentBufferSizes[ |
+ Ver4DictConstants::TERMINAL_ADDRESS_LOOKUP_TABLE_BUFFER_INDEX]), |
+ mLanguageModelDictContent( |
+ ReadWriteByteArrayView( |
+ contentBuffers[Ver4DictConstants::LANGUAGE_MODEL_BUFFER_INDEX], |
+ contentBufferSizes[Ver4DictConstants::LANGUAGE_MODEL_BUFFER_INDEX]), |
+ mHeaderPolicy.hasHistoricalInfoOfWords()), |
+ mBigramDictContent(&contentBuffers[Ver4DictConstants::BIGRAM_BUFFERS_INDEX], |
+ &contentBufferSizes[Ver4DictConstants::BIGRAM_BUFFERS_INDEX], |
+ mHeaderPolicy.hasHistoricalInfoOfWords()), |
+ mShortcutDictContent(&contentBuffers[Ver4DictConstants::SHORTCUT_BUFFERS_INDEX], |
+ &contentBufferSizes[Ver4DictConstants::SHORTCUT_BUFFERS_INDEX]), |
+ mIsUpdatable(mDictBuffer->isUpdatable()) {} |
+ |
+Ver4DictBuffers::Ver4DictBuffers(const HeaderPolicy *const headerPolicy, const int maxTrieSize) |
+ : mHeaderBuffer(nullptr), mDictBuffer(nullptr), mHeaderPolicy(headerPolicy), |
+ mExpandableHeaderBuffer(Ver4DictConstants::MAX_DICTIONARY_SIZE), |
+ mExpandableTrieBuffer(maxTrieSize), mTerminalPositionLookupTable(), |
+ mLanguageModelDictContent(headerPolicy->hasHistoricalInfoOfWords()), |
+ mBigramDictContent(headerPolicy->hasHistoricalInfoOfWords()), mShortcutDictContent(), |
+ mIsUpdatable(true) {} |
+ |
+} // namespace latinime |