# -*- coding: utf-8 -*- # Copyright (C) 2011 Alex Yatskov # # This program is free software: you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program. If not, see . import operator import sqlite3 class Dictionary: def __init__(self, filename, index=True): self.db = sqlite3.connect(filename) self.indices = set() def findTerm(self, word, partial=False): self.requireIndex('Terms', 'expression') self.requireIndex('Terms', 'reading') cursor = self.db.cursor() cursor.execute('SELECT * FROM Terms WHERE expression {0} ? OR reading=?'.format('LIKE' if partial else '='), (word, word)) results = list() for expression, reading, definitions, tags in cursor.fetchall(): results.append((expression, reading, definitions, tags.split())) return results def findCharacter(self, character): cursor = self.db.cursor() cursor.execute('SELECT * FROM Kanji WHERE character=? LIMIT 1', character) return cursor.fetchone() def findCharacterVisually(self, characters): radicals = dict() for character in characters: for radical in self.findRadicalsByCharacter(character): radicals[radical] = radicals.get(radical, 0) + 1 results = dict() for radical, count in radicals.items(): for character in self.findCharactersByRadical(radical): results[character] = results.get(character, 0) + count return sorted(results.items(), key=operator.itemgetter(1), reverse=True) def findRadicalsByCharacter(self, character): cursor = self.db.cursor() cursor.execute('SELECT radicals FROM Radicals WHERE character=? LIMIT 1', character) columns = cursor.fetchone() if columns is None: return None return columns[0].split() def findCharactersByRadical(self, radical): cursor = self.db.cursor() cursor.execute('SELECT character FROM Radicals WHERE radicals LIKE ?', (u'%{0}%'.format(radical),)) columns = cursor.fetchall() if columns is None: return None return map(operator.itemgetter(0), columns) def requireIndex(self, table, column): name = 'index_{0}_{1}'.format(table, column) if not self.hasIndex(name): self.buildIndex(name, table, column) def buildIndex(self, name, table, column): cursor = self.db.cursor() cursor.execute('CREATE INDEX {0} ON {1}({2})'.format(name, table, column)) self.db.commit() def hasIndex(self, name): if name in self.indices: return True cursor = self.db.cursor() cursor.execute('SELECT * FROM sqlite_master WHERE name=?', (name,)) if len(cursor.fetchall()) == 0: return False self.indices.update([name]) return True