summaryrefslogtreecommitdiffstats
path: root/src/storage
diff options
context:
space:
mode:
authorPeng Wu <alexepico@gmail.com>2025-11-13 11:53:30 +0800
committerPeng Wu <alexepico@gmail.com>2025-11-13 11:53:30 +0800
commit303d175f391aa159ab54ef345fc98b69c9b03d6b (patch)
tree2afac93aa7770a30254ed2b0e388bc1da9f41816 /src/storage
parent8aa630a81e9efcc37a31cb98f22ead3215e93c60 (diff)
downloadlibpinyin-303d175f391aa159ab54ef345fc98b69c9b03d6b.tar.gz
libpinyin-303d175f391aa159ab54ef345fc98b69c9b03d6b.tar.xz
libpinyin-303d175f391aa159ab54ef345fc98b69c9b03d6b.zip
Write chewing_large_table2_tkrzwdb.h
Diffstat (limited to 'src/storage')
-rw-r--r--src/storage/chewing_large_table2_tkrzwdb.h133
1 files changed, 133 insertions, 0 deletions
diff --git a/src/storage/chewing_large_table2_tkrzwdb.h b/src/storage/chewing_large_table2_tkrzwdb.h
new file mode 100644
index 0000000..dc97d81
--- /dev/null
+++ b/src/storage/chewing_large_table2_tkrzwdb.h
@@ -0,0 +1,133 @@
+/*
+ * libpinyin
+ * Library to deal with pinyin.
+ *
+ * Copyright (C) 2025 Peng Wu <alexepico@gmail.com>
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program. If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#ifndef CHEWING_LARGE_TABLE2_TKRZWDB_H
+#define CHEWING_LARGE_TABLE2_TKRZWDB_H
+
+#include "novel_types.h"
+#include "memory_chunk.h"
+#include <stdio.h>
+#include <tkrzw_dbm.h>
+#include "table_info.h"
+
+namespace pinyin{
+
+template<int phrase_length>
+class ChewingTableEntry; /* forward declaration only; the template is not defined in this header. */
+
+/**
+ * ChewingLargeTable2 (tkrzw flavour):
+ *
+ * Interface of the chewing key index table whose storage handle is a
+ * tkrzw::DBM.  This header only declares the interface; every member
+ * function except the destructor is defined outside this header.
+ *
+ * The object holds raw pointers (m_db, m_entries) and its destructor
+ * calls reset(), so an implicit copy would leave two objects referring
+ * to the same handles.  Copying is therefore disabled.
+ * NOTE(review): reset() is assumed to release m_db and m_entries --
+ * confirm against the implementation file.
+ */
+class ChewingLargeTable2{
+private:
+    /* member variables. */
+    /* handle of the underlying tkrzw database. */
+    tkrzw::DBM * m_db;
+
+protected:
+    /* Array of ChewingTableEntry. */
+    GPtrArray * m_entries;
+
+    /* set up m_entries. (presumably allocates it -- confirm) */
+    void init_entries();
+
+    /* tear down m_entries. (presumably frees it -- confirm) */
+    void fini_entries();
+
+    /* invoked by the destructor. */
+    void reset();
+
+protected:
+    /*
+     * Each *_internal operation comes as a pair: a template taking the
+     * phrase length at compile time, and an overload taking it as a
+     * run-time argument.
+     * NOTE(review): the run-time overload presumably dispatches to the
+     * matching template instantiation -- confirm.
+     */
+    template<int phrase_length>
+    int search_internal(/* in */ const ChewingKey index[],
+                        /* in */ const ChewingKey keys[],
+                        /* out */ PhraseIndexRanges ranges) const;
+
+    int search_internal(int phrase_length,
+                        /* in */ const ChewingKey index[],
+                        /* in */ const ChewingKey keys[],
+                        /* out */ PhraseIndexRanges ranges) const;
+
+    template<int phrase_length>
+    int search_suggestion_internal(/* in */ const MemoryChunk & chunk,
+                                   int prefix_len,
+                                   /* in */ const ChewingKey prefix_keys[],
+                                   /* out */ PhraseTokens tokens) const;
+
+    int search_suggestion_internal(int phrase_length,
+                                   /* in */ const MemoryChunk & chunk,
+                                   int prefix_len,
+                                   /* in */ const ChewingKey prefix_keys[],
+                                   /* out */ PhraseTokens tokens) const;
+
+    template<int phrase_length>
+    int add_index_internal(/* in */ const ChewingKey index[],
+                           /* in */ const ChewingKey keys[],
+                           /* in */ phrase_token_t token);
+
+    int add_index_internal(int phrase_length,
+                           /* in */ const ChewingKey index[],
+                           /* in */ const ChewingKey keys[],
+                           /* in */ phrase_token_t token);
+
+    template<int phrase_length>
+    int remove_index_internal(/* in */ const ChewingKey index[],
+                              /* in */ const ChewingKey keys[],
+                              /* in */ phrase_token_t token);
+
+    int remove_index_internal(int phrase_length,
+                              /* in */ const ChewingKey index[],
+                              /* in */ const ChewingKey keys[],
+                              /* in */ phrase_token_t token);
+
+public:
+    ChewingLargeTable2();
+
+    ~ChewingLargeTable2() {
+        reset();
+    }
+
+    /* non-copyable: the raw handles must have exactly one owner,
+     * otherwise two destructors would call reset() on the same
+     * pointers. */
+    ChewingLargeTable2(const ChewingLargeTable2 &) = delete;
+    ChewingLargeTable2 & operator=(const ChewingLargeTable2 &) = delete;
+
+    /* attach method */
+    bool attach(const char * dbfile, guint32 flags);
+
+    /* load/store method */
+    /* use in-memory DBM here, for better performance. */
+    bool load_db(const char * filename);
+
+    bool store_db(const char * new_filename);
+
+    bool load_text(FILE * infile, TABLE_PHONETIC_TYPE type);
+
+    /* search method */
+    int search(int phrase_length, /* in */ const ChewingKey keys[],
+               /* out */ PhraseIndexRanges ranges) const;
+
+    /* search_suggestion method */
+    int search_suggestion(int prefix_len,
+                          /* in */ const ChewingKey prefix_keys[],
+                          /* out */ PhraseTokens tokens) const;
+
+    /* add/remove index method */
+    int add_index(int phrase_length, /* in */ const ChewingKey keys[],
+                  /* in */ phrase_token_t token);
+
+    int remove_index(int phrase_length, /* in */ const ChewingKey keys[],
+                     /* in */ phrase_token_t token);
+
+    /* mask out method */
+    bool mask_out(phrase_token_t mask, phrase_token_t value);
+};
+
+};
+
+#endif