Some work on deinflector
This commit is contained in:
parent
d8a630fa28
commit
2d526b7ecd
@ -3,6 +3,7 @@
|
||||
<body>
|
||||
<script src="lib/jquery-2.2.2.min.js"></script>
|
||||
<script src="jp/dictionary.js"></script>
|
||||
<script src="jp/deinflector.js"></script>
|
||||
<script src="jp/translator.js"></script>
|
||||
</body>
|
||||
</html>
|
||||
|
133
ext/jp/deinflector.js
Normal file
133
ext/jp/deinflector.js
Normal file
@ -0,0 +1,133 @@
|
||||
/*
|
||||
* Copyright (C) 2016 Alex Yatskov <alex@foosoft.net>
|
||||
* Author: Alex Yatskov <alex@foosoft.net>
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
* the Free Software Foundation, either version 3 of the License, or
|
||||
* (at your option) any later version.
|
||||
*
|
||||
* This program is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
* GNU General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU General Public License
|
||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
*/
|
||||
|
||||
|
||||
/**
 * One node in a deinflection tree.
 *
 * A node holds a candidate term, the tags that term is required to carry,
 * and the name of the rule that produced it from its parent. Children are
 * either a tag-less copy of the term (added when the validator accepts the
 * term) or further candidates obtained by applying a rule variant.
 */
class Deinflection {
    /**
     * @param {string} term - Candidate text for this node.
     * @param {string[]} [tags=[]] - Tags the term must match; empty means unconstrained.
     * @param {string} [rule=''] - Name of the rule that produced this node.
     */
    constructor(term, tags=[], rule='') {
        this.children = [];
        this.term = term;
        this.tags = tags;
        this.rule = rule;
        this.success = false;
    }

    /**
     * Checks this node's term against the validator.
     *
     * @param {function(string): Iterable<string[]>} validator - Called with
     *     the term; each item it yields is a list of tags.
     * @returns {boolean} True when the validator yields at least one tag
     *     list and either this node has no tags or one of its tags matches.
     */
    validate(validator) {
        for (const candidateTags of validator(this.term)) {
            if (this.tags.length === 0) {
                return true;
            }

            // Iterate tag values; `for...in` would yield array indices.
            if (this.tags.some((tag) => this.searchTags(tag, candidateTags))) {
                return true;
            }
        }

        return false;
    }

    /**
     * Builds the subtree below this node by applying every matching rule
     * variant recursively.
     *
     * @param {function(string): Iterable<string[]>} validator - See validate().
     * @param {Object<string, Object[]>|Iterable<[string, Object[]]>} rules -
     *     Rule name mapped to variants; each variant provides `tagsIn`,
     *     `tagsOut`, `kanaIn` and `kanaOut`.
     * @returns {boolean} True when this node ended up with at least one child.
     */
    deinflect(validator, rules) {
        if (this.validate(validator)) {
            this.children.push(new Deinflection(this.term));
        }

        // A plain object is not iterable, so go through Object.entries;
        // anything already iterable (Map, array of pairs) is used directly.
        const entries = typeof rules[Symbol.iterator] === 'function' ? rules : Object.entries(rules);

        for (const [rule, variants] of entries) {
            for (const {tagsIn, tagsOut, kanaIn, kanaOut} of variants) {
                const allowed = this.tags.length === 0 ||
                    this.tags.some((tag) => this.searchTags(tag, tagsIn));

                if (!allowed || !this.term.endsWith(kanaIn)) {
                    continue;
                }

                // Cut by explicit length: slice(0, -0) would return '' and
                // drop the whole term if kanaIn were ever empty.
                const stem = this.term.slice(0, this.term.length - kanaIn.length);
                const child = new Deinflection(stem + kanaOut, tagsOut, rule);
                if (child.deinflect(validator, rules)) {
                    this.children.push(child);
                }
            }
        }

        return this.children.length > 0;
    }

    /**
     * Tests whether `tag`, used as a regular-expression pattern, is found
     * in any entry of `tags`.
     *
     * @param {string} tag - Pattern source.
     * @param {string[]} tags - Strings to search.
     * @returns {boolean} True on the first match, false when none match.
     */
    searchTags(tag, tags) {
        // Non-global pattern, so test() keeps no lastIndex state between calls.
        const pattern = new RegExp(tag);
        return tags.some((candidate) => pattern.test(candidate));
    }

    /**
     * Flattens the subtree into one record per leaf.
     *
     * @returns {Array<{root: string, rules: string[], source: string}>}
     *     `root` is the leaf term, `rules` the rule names collected from the
     *     leaf upwards, and `source` the term of the node gather() was
     *     called on. A node without children yields a single record with no
     *     `source` property.
     */
    gather() {
        if (this.children.length === 0) {
            return [{root: this.term, rules: []}];
        }

        const paths = [];
        for (const child of this.children) {
            for (const path of child.gather()) {
                if (this.rule.length > 0) {
                    path.rules.push(this.rule);
                }

                // Each ancestor overwrites source, so the outermost term wins.
                path.source = this.term;
                paths.push(path);
            }
        }

        return paths;
    }
}
|
||||
|
||||
|
||||
/**
 * Entry point for deinflection: stores a rule set and runs terms against it.
 */
class Deinflector {
    /** Starts out with an empty rule set. */
    constructor() {
        this.rules = {};
    }

    /**
     * Replaces the stored rule set.
     *
     * @param {Object} rules - Rule set handed to every later deinflect() call.
     */
    setRules(rules) {
        this.rules = rules;
    }

    /**
     * Deinflects `term` using the stored rules.
     *
     * @param {string} term - Text to deinflect.
     * @param {Function} validator - Passed through to Deinflection#deinflect.
     * @returns {?Array} The gathered paths of the root node, or null when
     *     the root node's deinflect() reports failure.
     */
    deinflect(term, validator) {
        const root = new Deinflection(term);
        const found = root.deinflect(validator, this.rules);
        return found ? root.gather() : null;
    }
}
|
@ -19,6 +19,7 @@
|
||||
class Translator {
|
||||
constructor() {
|
||||
this.dictionary = new Dictionary();
|
||||
this.deinflector = new Deinflector();
|
||||
this.initialized = false;
|
||||
}
|
||||
|
||||
@ -35,6 +36,8 @@ class Translator {
|
||||
}
|
||||
|
||||
$.when.apply($, loaders).done((rules, edict, enamdict, kanjidic) => {
|
||||
this.deinflector.setRules(rules);
|
||||
|
||||
this.dictionary.addTermDict(edict[0]);
|
||||
this.dictionary.addTermDict(enamdict[0]);
|
||||
this.dictionary.addKanjiDict(kanjidic[0]);
|
||||
@ -56,6 +59,6 @@ trans.initialize({
|
||||
enamdict: 'jp/data/enamdict.json',
|
||||
kanjidic: 'jp/data/kanjidic.json',
|
||||
}, function() {
|
||||
// alert('Loaded');
|
||||
alert('Loaded');
|
||||
// alert(trans.dictionary.findTerm('猫'));
|
||||
});
|
||||
|
Loading…
x
Reference in New Issue
Block a user