2016-03-20 02:32:35 +00:00
|
|
|
/*
|
2017-08-15 04:43:09 +00:00
|
|
|
* Copyright (C) 2016-2017 Alex Yatskov <alex@foosoft.net>
|
2016-03-20 02:32:35 +00:00
|
|
|
* Author: Alex Yatskov <alex@foosoft.net>
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
2016-11-07 16:29:21 +00:00
|
|
|
/**
 * Wrapper around the Dexie-backed 'dict' database that stores imported
 * dictionaries (terms, kanji, frequency data and tag metadata) and answers
 * lookups against them.
 *
 * All failures are reported by rejecting with a plain string message, which
 * is what existing callers receive.
 */
class Database {
    constructor() {
        // Dexie handle; stays null until prepare() has run.
        this.db = null;
        // title -> (tag name -> tagMeta row). Null-prototype objects are used so
        // that names such as "constructor" are never resolved via Object.prototype.
        this.tagCache = Object.create(null);
    }

    /**
     * Creates the Dexie handle, declares schema versions 2 and 3 and opens the
     * database.
     *
     * @returns {Promise<void>}
     * @throws {string} 'database already initialized' when called twice.
     */
    async prepare() {
        if (this.db) {
            throw 'database already initialized';
        }

        this.db = new Dexie('dict');
        this.db.version(2).stores({
            terms: '++id,dictionary,expression,reading',
            kanji: '++,dictionary,character',
            tagMeta: '++,dictionary',
            dictionaries: '++,title,version'
        });
        this.db.version(3).stores({
            termFreq: '++,dictionary,expression',
            kanjiFreq: '++,dictionary,character',
            tagMeta: '++,dictionary,name'
        });

        await this.db.open();
    }

    /**
     * Closes and deletes the database, clears the tag cache and then
     * re-creates an empty database through prepare().
     *
     * @returns {Promise<void>}
     * @throws {string} 'database not initialized' when prepare() has not run.
     */
    async purge() {
        if (!this.db) {
            throw 'database not initialized';
        }

        this.db.close();
        await this.db.delete();
        this.db = null;
        this.tagCache = Object.create(null);

        await this.prepare();
    }

    /**
     * Finds term rows whose expression or reading equals `term`, restricted to
     * the dictionaries listed in `titles`.
     *
     * @param {string} term - Text matched against `expression` and `reading`.
     * @param {string[]} titles - Dictionary titles whose rows are kept.
     * @returns {Promise<Object[]>} Matching entries; `tags` and `rules` are
     *     passed through dictFieldSplit.
     * @throws {string} 'database not initialized' when prepare() has not run.
     */
    async findTerms(term, titles) {
        if (!this.db) {
            throw 'database not initialized';
        }

        const results = [];
        await this.db.terms.where('expression').equals(term).or('reading').equals(term).each(row => {
            if (titles.includes(row.dictionary)) {
                results.push({
                    expression: row.expression,
                    reading: row.reading,
                    tags: dictFieldSplit(row.tags),
                    rules: dictFieldSplit(row.rules),
                    glossary: row.glossary,
                    score: row.score,
                    dictionary: row.dictionary,
                    id: row.id
                });
            }
        });

        return results;
    }

    /**
     * Finds frequency rows for the expression `term`, restricted to the
     * dictionaries listed in `titles`.
     *
     * @param {string} term - Expression to look up.
     * @param {string[]} titles - Dictionary titles whose rows are kept.
     * @returns {Promise<Array<{frequency: *, dictionary: string}>>}
     * @throws {string} 'database not initialized' when prepare() has not run.
     */
    async findTermFreq(term, titles) {
        if (!this.db) {
            throw 'database not initialized';
        }

        const results = [];
        await this.db.termFreq.where('expression').equals(term).each(row => {
            if (titles.includes(row.dictionary)) {
                results.push({frequency: row.frequency, dictionary: row.dictionary});
            }
        });

        return results;
    }

    /**
     * Finds kanji rows for the character `kanji`, restricted to the
     * dictionaries listed in `titles`.
     *
     * @param {string} kanji - Character to look up.
     * @param {string[]} titles - Dictionary titles whose rows are kept.
     * @returns {Promise<Object[]>} Matching entries; the stored `meanings`
     *     field is exposed as `glossary`.
     * @throws {string} 'database not initialized' when prepare() has not run.
     */
    async findKanji(kanji, titles) {
        if (!this.db) {
            // Same rejection reason as before; `throw` matches the sibling methods.
            throw 'database not initialized';
        }

        const results = [];
        await this.db.kanji.where('character').equals(kanji).each(row => {
            if (titles.includes(row.dictionary)) {
                results.push({
                    character: row.character,
                    onyomi: dictFieldSplit(row.onyomi),
                    kunyomi: dictFieldSplit(row.kunyomi),
                    tags: dictFieldSplit(row.tags),
                    glossary: row.meanings,
                    dictionary: row.dictionary
                });
            }
        });

        return results;
    }

    /**
     * Finds frequency rows for the character `kanji`, restricted to the
     * dictionaries listed in `titles`.
     *
     * @param {string} kanji - Character to look up.
     * @param {string[]} titles - Dictionary titles whose rows are kept.
     * @returns {Promise<Array<{frequency: *, dictionary: string}>>}
     * @throws {string} 'database not initialized' when prepare() has not run.
     */
    async findKanjiFreq(kanji, titles) {
        if (!this.db) {
            throw 'database not initialized';
        }

        const results = [];
        await this.db.kanjiFreq.where('character').equals(kanji).each(row => {
            if (titles.includes(row.dictionary)) {
                results.push({frequency: row.frequency, dictionary: row.dictionary});
            }
        });

        return results;
    }

    /**
     * Looks up the tagMeta row named `name` belonging to dictionary `title`.
     * Rows that were found are cached per title; a miss is queried again on
     * the next call.
     *
     * @param {string} name - Tag name.
     * @param {string} title - Dictionary title the tag must belong to.
     * @returns {Promise<Object|undefined>} The stored row, or undefined.
     * @throws {string} 'database not initialized' when prepare() has not run.
     */
    async findTagForTitle(name, title) {
        if (!this.db) {
            throw 'database not initialized';
        }

        // Null-prototype bucket: a tag called e.g. "constructor" or "toString"
        // must be a cache miss, not an inherited Object.prototype member.
        const cache = this.tagCache[title] || (this.tagCache[title] = Object.create(null));

        let result = cache[name];
        if (!result) {
            await this.db.tagMeta.where('name').equals(name).each(row => {
                if (title === row.dictionary) {
                    result = row;
                }
            });

            cache[name] = result;
        }

        return result;
    }

    /**
     * Returns every row of the `dictionaries` table.
     *
     * @returns {Promise<Object[]>}
     * @throws {string} 'database not initialized' when prepare() has not run.
     */
    async getTitles() {
        if (!this.db) {
            throw 'database not initialized';
        }

        return this.db.dictionaries.toArray();
    }

    /**
     * Imports a dictionary archive into the database.
     *
     * @param {*} archive - Archive data handed unchanged to
     *     Database.importDictionaryZip.
     * @param {function(number, number)=} callback - Optional progress hook,
     *     called as callback(total, current) before each bank is stored.
     * @returns {Promise<{title: *, version: *, revision: *}>} Summary of the
     *     imported dictionary.
     * @throws {string} 'database not initialized' when prepare() has not run,
     *     or 'dictionary "<title>" is already imported' for a duplicate title.
     */
    async importDictionary(archive, callback) {
        if (!this.db) {
            // Same rejection reason as before; `throw` matches the sibling methods.
            throw 'database not initialized';
        }

        const indexDataLoaded = async summary => {
            const count = await this.db.dictionaries.where('title').equals(summary.title).count();
            if (count > 0) {
                throw `dictionary "${summary.title}" is already imported`;
            }

            await this.db.dictionaries.add(summary);
        };

        // Builds a bank handler: report progress, convert every entry to a row
        // with buildRow(entry, title), then bulk-insert into this.db[tableName].
        const makeBankHandler = (tableName, buildRow) => async (title, entries, total, current) => {
            if (callback) {
                callback(total, current);
            }

            const rows = Array.from(entries, entry => buildRow(entry, title));
            await this.db[tableName].bulkAdd(rows);
        };

        const termDataLoaded = makeBankHandler(
            'terms',
            ([expression, reading, tags, rules, score, ...glossary], title) => ({
                expression,
                reading,
                tags,
                rules,
                score,
                glossary,
                dictionary: title
            })
        );

        const termFreqDataLoaded = makeBankHandler(
            'termFreq',
            ([expression, frequency], title) => ({expression, frequency, dictionary: title})
        );

        const kanjiDataLoaded = makeBankHandler(
            'kanji',
            ([character, onyomi, kunyomi, tags, ...meanings], title) => ({
                character,
                onyomi,
                kunyomi,
                tags,
                meanings,
                dictionary: title
            })
        );

        const kanjiFreqDataLoaded = makeBankHandler(
            'kanjiFreq',
            ([character, frequency], title) => ({character, frequency, dictionary: title})
        );

        const tagDataLoaded = makeBankHandler(
            'tagMeta',
            ([name, category, order, notes], title) => dictTagSanitize({
                name,
                category,
                order,
                notes,
                dictionary: title
            })
        );

        return await Database.importDictionaryZip(
            archive,
            indexDataLoaded,
            termDataLoaded,
            termFreqDataLoaded,
            kanjiDataLoaded,
            kanjiFreqDataLoaded,
            tagDataLoaded
        );
    }

    /**
     * Reads a dictionary archive with JSZip and feeds its contents to the
     * supplied handlers in this order: index summary, tag metadata embedded in
     * index.json (if any), term banks, term frequency banks, kanji banks,
     * kanji frequency banks, tag banks. Every handler is awaited before the
     * next one runs; any handler may be omitted (falsy) to skip that data.
     *
     * Bank files are named `<kind>_bank_<n>.json` with n starting at 1; the
     * banks of a kind are counted up to the first missing number.
     *
     * @param {*} archive - Passed to JSZip.loadAsync.
     * @param {function(Object)=} indexDataLoaded - Receives the summary.
     * @param {function(string, Array, number, number)=} termDataLoaded
     * @param {function(string, Array, number, number)=} termFreqDataLoaded
     * @param {function(string, Array, number, number)=} kanjiDataLoaded
     * @param {function(string, Array, number, number)=} kanjiFreqDataLoaded
     * @param {function(string, Array, number, number)=} tagDataLoaded
     *     Bank handlers are called as (title, bank, totalBanks, loadedSoFar).
     * @returns {Promise<{title: *, version: *, revision: *}>}
     * @throws {string} 'no dictionary index found in archive' or
     *     'unrecognized dictionary format'; handler rejections propagate.
     */
    static async importDictionaryZip(
        archive,
        indexDataLoaded,
        termDataLoaded,
        termFreqDataLoaded,
        kanjiDataLoaded,
        kanjiFreqDataLoaded,
        tagDataLoaded
    ) {
        const zip = await JSZip.loadAsync(archive);

        const indexFile = zip.files['index.json'];
        if (!indexFile) {
            throw 'no dictionary index found in archive';
        }

        const index = JSON.parse(await indexFile.async('string'));
        if (!index.title || !index.version || !index.revision) {
            throw 'unrecognized dictionary format';
        }

        const summary = {title: index.title, version: index.version, revision: index.revision};
        if (indexDataLoaded) {
            await indexDataLoaded(summary);
        }

        // Bank numbering inside the archive is 1-based.
        const bankNamer = prefix => bankIndex => `${prefix}_bank_${bankIndex + 1}.json`;
        const buildTermBankName = bankNamer('term');
        const buildTermFreqBankName = bankNamer('termfreq');
        const buildKanjiBankName = bankNamer('kanji');
        const buildKanjiFreqBankName = bankNamer('kanjifreq');
        const buildTagBankName = bankNamer('tag');

        const countBanks = namer => {
            let count = 0;
            while (zip.files[namer(count)]) {
                ++count;
            }

            return count;
        };

        const termBankCount = countBanks(buildTermBankName);
        const termFreqBankCount = countBanks(buildTermFreqBankName);
        const kanjiBankCount = countBanks(buildKanjiBankName);
        const kanjiFreqBankCount = countBanks(buildKanjiFreqBankName);
        const tagBankCount = countBanks(buildTagBankName);

        let bankLoadedCount = 0;
        let bankTotalCount =
            termBankCount +
            termFreqBankCount +
            kanjiBankCount +
            kanjiFreqBankCount +
            tagBankCount;

        if (tagDataLoaded && index.tagMeta) {
            const bank = [];
            for (const name of Object.keys(index.tagMeta)) {
                const tag = index.tagMeta[name];
                bank.push([name, tag.category, tag.order, tag.notes]);
            }

            // The embedded tag metadata counts as one extra bank. It is awaited so
            // that a storage failure fails the import and the import cannot
            // resolve before these tags have been handled.
            await tagDataLoaded(index.title, bank, ++bankTotalCount, bankLoadedCount++);
        }

        const loadBank = async (namer, count, bankLoaded) => {
            if (!bankLoaded) {
                return;
            }

            for (let i = 0; i < count; ++i) {
                const bankFile = zip.files[namer(i)];
                const bank = JSON.parse(await bankFile.async('string'));
                await bankLoaded(index.title, bank, bankTotalCount, bankLoadedCount++);
            }
        };

        await loadBank(buildTermBankName, termBankCount, termDataLoaded);
        await loadBank(buildTermFreqBankName, termFreqBankCount, termFreqDataLoaded);
        await loadBank(buildKanjiBankName, kanjiBankCount, kanjiDataLoaded);
        await loadBank(buildKanjiFreqBankName, kanjiFreqBankCount, kanjiFreqDataLoaded);
        await loadBank(buildTagBankName, tagBankCount, tagDataLoaded);

        return summary;
    }
}
|