yomichan-anki/yomi_base/reader_util.py

# -*- coding: utf-8 -*-

# Copyright (C) 2013  Alex Yatskov
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.


from PyQt4 import QtGui
import re
import codecs
import sqlite3


def decodeContent(content):
    """Decode a byte string with the first candidate encoding that accepts it.

    The encodings are tried in the order listed below.  If none of them
    decodes ``content`` without error, the encoding whose first decoding
    error occurred furthest into the data is used instead, with undecodable
    bytes replaced by U+FFFD.  When several encodings fail at the same
    offset, the one listed first wins.

    Returns a ``(text, encoding)`` tuple.
    """
    encodings = ['utf-8', 'shift_jis', 'euc-jp', 'utf-16']
    errorOffsets = {}

    for encoding in encodings:
        try:
            return content.decode(encoding), encoding
        except UnicodeDecodeError as e:
            # e.start is the offset of the first byte that failed to decode.
            errorOffsets[encoding] = e.start

    # Reaching this point means every encoding failed, so each one has an
    # entry.  max() returns the first maximal item; iterating the ordered
    # list keeps the tie-break deterministic rather than dict-order dependent.
    encoding = max(encodings, key=errorOffsets.get)
    return content.decode(encoding, 'replace'), encoding


def stripReadings(content):
    """Return ``content`` without its bracketed reading annotations.

    Every span that starts with U+300A, ends with U+300B and has at least
    one character in between is removed; an empty bracket pair is kept.
    """
    annotation = re.compile(u'《[^》]+》')
    return annotation.sub(u'', content)


def findSentence(content, position):
    """Return the sentence of ``content`` that surrounds index ``position``.

    The start is found by scanning backwards from ``position`` until a
    sentence terminator, an opening quote or a newline is met; the sentence
    begins just after that character.  The end is found by scanning forwards
    until a terminator (included in the result) or a closing quote (excluded)
    is met.  Quoted passages that open and close entirely inside the scanned
    range are skipped over, including nested ones.

    ``position`` is clamped to the valid index range, so a cursor sitting at
    the very end of the text does not raise.  The result is stripped of
    surrounding whitespace; empty ``content`` is returned unchanged.
    """
    quotesFwd = {u'「': u'」', u'『': u'』', u"'": u"'", u'"': u'"'}
    quotesBwd = {u'」': u'「', u'』': u'『', u"'": u"'", u'"': u'"'}
    terminators = u'。．.？?！!'

    length = len(content)
    if length == 0:
        return content

    position = max(0, min(position, length - 1))

    # Backward scan.  ``pending`` holds the opening quotes still expected for
    # the closing quotes passed so far; it is a LIFO stack, so the innermost
    # quote is always the last element.
    start = 0
    pending = []
    i = position
    while i >= 0:  # index 0 is examined too, so a leading quote is a boundary
        c = content[i]

        if not pending and (c in terminators or c in quotesFwd or c == u'\n'):
            start = i + 1
            break

        if pending and c == pending[-1]:
            pending.pop()
        elif c in quotesBwd:
            pending.append(quotesBwd[c])

        i -= 1

    # Forward scan, mirroring the logic above with the quote roles swapped.
    end = length
    pending = []
    i = position
    while i < length:
        c = content[i]

        if not pending:
            if c in terminators:
                end = i + 1
                break
            if c in quotesBwd:
                end = i
                break

        if pending and c == pending[-1]:
            pending.pop()
        elif c in quotesFwd:
            pending.append(quotesFwd[c])

        i += 1

    return content[start:end].strip()


def formatFields(fields, markup):
    """Fill each field template with values from ``markup``.

    ``fields`` maps field names to ``str.format`` style templates and
    ``markup`` supplies the named replacement values.  Returns a new dict
    with the formatted text for every field whose template could be
    rendered.  A field whose template cannot be rendered is left out of the
    result rather than aborting the whole operation.
    """
    result = {}
    for field, template in fields.items():
        try:
            result[field] = template.format(**markup)
        except (KeyError, IndexError, ValueError):
            # Best effort on incorrect markup: KeyError is an unknown name,
            # IndexError a positional placeholder such as "{0}", ValueError
            # an unbalanced brace.  Skip the field in every case.
            continue

    return result


def splitTags(tags):
    """Split a tag string on semicolons, commas and whitespace.

    Returns a list of the non-blank tags in their original order.
    """
    # Raw string: "\s" is a regex class, not a Python string escape.
    return [tag for tag in re.split(r'[;,\s]', tags) if tag.strip()]


def markupVocabExp(definition):
    """Build the markup dict for a vocabulary entry keyed by its expression.

    The summary is "expression [reading]" when the definition has a reading
    and just the expression otherwise.  A missing reading is reported as an
    empty string, and 'sentence' is None when the definition has none.
    """
    if definition['reading']:
        template = u'{expression} [{reading}]'
    else:
        template = u'{expression}'

    markup = {'summary': template.format(**definition)}
    markup['expression'] = definition['expression']
    markup['reading'] = definition['reading'] or u''
    markup['glossary'] = definition['glossary']
    markup['sentence'] = definition.get('sentence')
    return markup


def markupVocabReading(definition):
    """Build the markup dict for a vocabulary entry keyed by its reading.

    The reading takes the place of the expression and of the summary, and
    the 'reading' slot is left empty.  Returns None when the definition has
    no reading.
    """
    reading = definition['reading']
    if not reading:
        return None

    markup = dict.fromkeys(('expression', 'summary'), reading)
    markup['reading'] = u''
    markup['glossary'] = definition['glossary']
    markup['sentence'] = definition.get('sentence')
    return markup


def copyVocabDef(definition):
    """Copy a vocabulary definition to the clipboard as one tab-separated line.

    The columns are expression, reading (only when the definition has one)
    and the glossary entries joined with "; ".  The line ends with a newline.
    """
    joinedGlossary = '; '.join(definition['glossary'])

    if definition['reading']:
        template = u'{0}\t{1}\t{2}\n'
        columns = (definition['expression'], definition['reading'], joinedGlossary)
    else:
        template = u'{0}\t{1}\n'
        columns = (definition['expression'], joinedGlossary)

    clipboard = QtGui.QApplication.clipboard()
    clipboard.setText(template.format(*columns))


def markupKanji(definition):
    """Build the markup dict for a kanji definition.

    Copies the character, both reading lists and the glossary from the
    definition and uses the character itself as the summary.
    """
    markup = {}
    for key in ('character', 'onyomi', 'kunyomi', 'glossary'):
        markup[key] = definition[key]

    markup['summary'] = markup['character']
    return markup


def copyKanjiDef(definition):
    """Copy a kanji definition to the clipboard as one tab-separated line.

    The columns are the character, the kunyomi, the onyomi and the glossary;
    the entries of each list are joined with ", ".
    """
    columns = (
        definition['character'],
        ', '.join(definition['kunyomi']),
        ', '.join(definition['onyomi']),
        ', '.join(definition['glossary']),
    )
    text = u'{0}\t{1}\t{2}\t{3}'.format(*columns)

    clipboard = QtGui.QApplication.clipboard()
    clipboard.setText(text)


def buildDefHeader():
    """Return the opening HTML and stylesheet for a definitions page.

    The body background and text colours are taken from the application
    palette's Window and WindowText roles.
    """
    appPalette = QtGui.QApplication.palette()
    background = appPalette.color(QtGui.QPalette.Window).name()
    foreground = appPalette.color(QtGui.QPalette.WindowText).name()

    # Doubled braces are literal CSS braces; {0} and {1} are the colours.
    template = u'''
        <html><head><style>
        body {{ background-color: {0}; color: {1}; font-size: 11pt; }}
        span.expression {{ font-size: 15pt; }}
        </style></head><body>'''
    return template.format(background, foreground)


def buildDefFooter():
    """Return the closing tags for the document opened by buildDefHeader()."""
    closingTags = '</body></html>'
    return closingTags


def buildEmpty():
    """Return the HTML hint shown when there are no definitions to display."""
    return u'''
        <p>No definitions to display.</p>
        <p>Mouse over text with the <em>middle mouse button</em> or <em>shift key</em> pressed to search.</p>
        <p>You can also input terms in the search box below.</p>'''


def buildVocabDef(definition, index, query):
    """Render one vocabulary definition as an HTML fragment.

    ``index`` is embedded in the action links so that a click can be mapped
    back to this definition.  A copy link is always present.  When ``query``
    is not None it is called as ``query('vocab', markup)`` for the expression
    markup and then for the reading markup, and the matching "add" link is
    included for each call that returns a true value.
    """
    readingHtml = u''
    if definition['reading']:
        readingHtml = u'<span class="reading">[{0}]<br></span>'.format(definition['reading'])

    rulesHtml = u''
    if definition.get('rules'):
        # The rules are shown as a chain separated by an escaped "<".
        rulesHtml = '<span class="rules">({0})<br></span>'.format(' &lt; '.join(definition['rules']))

    anchors = ['<a href="copyVocabDef:{0}"><img src="://img/img/icon_copy_definition.png" align="right"></a>'.format(index)]
    if query is not None:
        if query('vocab', markupVocabExp(definition)):
            anchors.append('<a href="addVocabExp:{0}"><img src="://img/img/icon_add_expression.png" align="right"></a>'.format(index))
        if query('vocab', markupVocabReading(definition)):
            anchors.append('<a href="addVocabReading:{0}"><img src="://img/img/icon_add_reading.png" align="right"></a>'.format(index))
    linksHtml = ''.join(anchors)

    items = [u'<li>{0}</li>'.format(entry) for entry in definition['glossary']]
    glossaryHtml = u'<ol>' + u''.join(items) + u'</ol>'

    template = u'''
        <span class="links">{0}</span>
        <span class="expression">{1}<br></span>
        {2}
        <span class="glossary">{3}<br></span>
        {4}
        <br clear="all">'''
    return template.format(linksHtml, definition['expression'], readingHtml, glossaryHtml, rulesHtml)


def buildVocabDefs(definitions, query):
    """Render a complete HTML page for a list of vocabulary definitions.

    Each definition is rendered with buildVocabDef() using its list index;
    when the list is empty the placeholder from buildEmpty() is shown
    instead.  ``query`` is passed through to buildVocabDef() unchanged.
    """
    sections = [buildDefHeader()]

    if len(definitions) == 0:
        sections.append(buildEmpty())
    else:
        for position, entry in enumerate(definitions):
            sections.append(buildVocabDef(entry, position, query))

    sections.append(buildDefFooter())
    return u''.join(sections)


def buildKanjiDef(definition, index, query):
    """Render one kanji definition as an HTML fragment.

    ``index`` is embedded in the action links so that a click can be mapped
    back to this definition.  A copy link is always present; an "add" link
    is included when ``query`` is not None and ``query('kanji', markup)``
    returns a true value.  Kunyomi are listed before onyomi.
    """
    anchors = ['<a href="copyKanjiDef:{0}"><img src="://img/img/icon_copy_definition.png" align="right"></a>'.format(index)]
    if query is not None and query('kanji', markupKanji(definition)):
        anchors.append('<a href="addKanji:{0}"><img src="://img/img/icon_add_expression.png" align="right"></a>'.format(index))
    linksHtml = ''.join(anchors)

    allReadings = definition['kunyomi'] + definition['onyomi']
    readingsText = ', '.join(allReadings)
    glossaryText = ', '.join(definition['glossary'])

    template = u'''
        <span class="links">{0}</span>
        <span class="expression">{1}<br></span>
        <span class="reading">[{2}]<br></span>
        <span class="glossary">{3}<br></span>
        <br clear="all">'''
    return template.format(linksHtml, definition['character'], readingsText, glossaryText)


def buildKanjiDefs(definitions, query):
    """Render a complete HTML page for a list of kanji definitions.

    Each definition is rendered with buildKanjiDef() using its list index;
    when the list is empty the placeholder from buildEmpty() is shown
    instead.  ``query`` is passed through to buildKanjiDef() unchanged.
    """
    sections = [buildDefHeader()]

    if len(definitions) == 0:
        sections.append(buildEmpty())
    else:
        for position, entry in enumerate(definitions):
            sections.append(buildKanjiDef(entry, position, query))

    sections.append(buildDefFooter())
    return u''.join(sections)


def extractKindleDeck(filename):
    """Read the words stored in a Kindle vocabulary database.

    Opens ``filename`` as an SQLite database and returns the values of the
    ``word`` column of its ``WORDS`` table as a list.  If the file cannot be
    queried (no such table, not an SQLite database, ...) the words collected
    so far are returned, which is normally an empty list.
    """
    words = []

    try:
        db = sqlite3.connect(unicode(filename))
        try:
            for row in db.execute('select word from WORDS'):
                words.append(row[0])
        finally:
            # Using the connection as a context manager only commits or
            # rolls back; it never closes, so close explicitly to release
            # the file handle.
            db.close()
    except sqlite3.DatabaseError:
        # Covers OperationalError (e.g. missing table) as well as the plain
        # DatabaseError raised for files that are not SQLite databases.
        pass

    return words


def extractWordList(filename):
    """Read a UTF-8 text file and return the words it contains.

    The file content is split on semicolons, commas and whitespace; empty
    pieces are dropped.  Returns a list of words in file order.
    """
    # 'utf-8-sig' reads plain UTF-8 and also discards a leading byte order
    # mark, which would otherwise end up glued to the first word.
    with codecs.open(unicode(filename), 'rb', 'utf-8-sig') as fp:
        text = fp.read()

    # Raw string: "\s" is a regex class, not a Python string escape.
    return [word for word in re.split(r'[;,\s]', text) if word]
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								# -*- coding: utf-8 -*-
-												version bump, cleanup

											
										
										
											2011-10-27 15:22:26 +00:00
-												Switching dictionary to return values in python dictionaries instead of tuples


Former-commit-id: 3f0682e88a24faed24f9e12e7c9cee338e817672
											
										
										
											2013-11-09 23:42:02 +00:00
+								# Copyright (C) 2013  Alex Yatskov
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								#
 								# This program is free software: you can redistribute it and/or modify
 								# it under the terms of the GNU General Public License as published by
 								# the Free Software Foundation, either version 3 of the License, or
 								# (at your option) any later version.
 								#
 								# This program is distributed in the hope that it will be useful,
 								# but WITHOUT ANY WARRANTY; without even the implied warranty of
 								# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 								# GNU General Public License for more details.
 								#
 								# You should have received a copy of the GNU General Public License
 								# along with this program.  If not, see <http://www.gnu.org/licenses/>.
 								from PyQt4 import QtGui
-												Switching dictionary to return values in python dictionaries instead of tuples


Former-commit-id: 3f0682e88a24faed24f9e12e7c9cee338e817672
											
										
										
											2013-11-09 23:42:02 +00:00
+								import re
-												Allow text word lists to be imported


Former-commit-id: ac96ec75dd83094a5dd1455a77f2d0fb68bed0b7
											
										
										
											2014-12-24 08:26:05 +00:00
+								import codecs
-												Stub for importing word list


Former-commit-id: ee45d2c32f6ec50a4ab38cd5e139636b103efa9f
											
										
										
											2014-12-20 11:19:22 +00:00
+								import sqlite3
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
 								def decodeContent(content):
-												Adding additional encodings for autodetect, fixing line wrap bug


Former-commit-id: c8c98e42b5e73f3ae293ce72432ab3530a08c48c
											
										
										
											2013-11-10 03:09:40 +00:00
+								    encodings = ['utf-8', 'shift_jis', 'euc-jp', 'utf-16']
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								    errors = dict()
 								    for encoding in encodings:
 								        try:
 								            return content.decode(encoding), encoding
 								        except UnicodeDecodeError, e:
 								            errors[encoding] = e[2]
 								    encoding = sorted(errors, key=errors.get, reverse=True)[0]
 								    return content.decode(encoding, 'replace'), encoding
-												Cleanup of helper functions for card generation


Former-commit-id: 61748bf8d76245d7a11ed2377bc8375bd6ece256
											
										
										
											2013-11-11 01:39:44 +00:00
+								def stripReadings(content):
-												Cleanup

											
										
										
											2016-05-18 05:12:05 +00:00
+								    return re.sub(u'《[^》]+》', u'', content)
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
 								def findSentence(content, position):
 								    quotesFwd = {u'「': u'」', u'『': u'』', u"'": u"'", u'"': u'"'}
 								    quotesBwd = {u'」': u'「', u'』': u'『', u"'": u"'", u'"': u'"'}
 								    terminators = u'。．.？?！!'
-												Fixups, adding yomichan-common submodule

											
										
										
											2016-05-08 19:05:32 +00:00
+								    quoteStack = []
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
 								    start = 0
 								    for i in xrange(position, start, -1):
 								        c = content[i]
 								        if not quoteStack and (c in terminators or c in quotesFwd or c == '\n'):
 								            start = i + 1
 								            break
 								        if quoteStack and c == quoteStack[0]:
 								            quoteStack.pop()
 								        elif c in quotesBwd:
 								            quoteStack.insert(0, quotesBwd[c])
-												Fixups, adding yomichan-common submodule

											
										
										
											2016-05-08 19:05:32 +00:00
+								    quoteStack = []
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
 								    end = len(content)
 								    for i in xrange(position, end):
 								        c = content[i]
 								        if not quoteStack:
 								            if c in terminators:
 								                end = i + 1
 								                break
-												Reverting changes to getSentece() behavior

New line is now again ignored when looking for the end of the sentence.


Former-commit-id: a47014c3dfeb6cfb0d251dc448814bacdaec98db
											
										
										
											2015-02-12 04:44:29 +00:00
+								            elif c in quotesBwd:
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								                end = i
 								                break
 								        if quoteStack and c == quoteStack[0]:
 								            quoteStack.pop()
 								        elif c in quotesFwd:
 								            quoteStack.insert(0, quotesFwd[c])
-												Deleting dead code, updating README


Former-commit-id: 680131f5b7ea0dc78ac7d2585fbbf4c0a07aa720
											
										
										
											2015-11-13 09:33:13 +00:00
 								    return content[start:end].strip()
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Cleanup of helper functions for card generation


Former-commit-id: 61748bf8d76245d7a11ed2377bc8375bd6ece256
											
										
										
											2013-11-11 01:39:44 +00:00
+								def formatFields(fields, markup):
-												Fixups, adding yomichan-common submodule

											
										
										
											2016-05-08 19:05:32 +00:00
+								    result = {}
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								    for field, value in fields.items():
-												Adding handling for incorrect field markup


Former-commit-id: 1f496162e8fc779cb4950d4f3c179e4d6d52aa61
											
										
										
											2013-11-16 20:51:21 +00:00
+								        try:
 								            result[field] = value.format(**markup)
 								        except KeyError:
 								            pass
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
 								    return result
-												Cleanup of helper functions for card generation


Former-commit-id: 61748bf8d76245d7a11ed2377bc8375bd6ece256
											
										
										
											2013-11-11 01:39:44 +00:00
+								def splitTags(tags):
 								    return filter(lambda tag: tag.strip(), re.split('[;,\s]', tags))
 								def markupVocabExp(definition):
-												Fixing bugs related to adding kana-only cards, bumping version


Former-commit-id: 298b5275a85d3f60b118846c6fc7b9885702c48a
											
										
										
											2013-12-22 21:57:05 +00:00
+								    if definition['reading']:
 								        summary = u'{expression} [{reading}]'.format(**definition)
 								    else:
 								        summary = u'{expression}'.format(**definition)
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								    return {
-												Cleanup of helper functions for card generation


Former-commit-id: 61748bf8d76245d7a11ed2377bc8375bd6ece256
											
										
										
											2013-11-11 01:39:44 +00:00
+								        'expression': definition['expression'],
-												Cleanup

											
										
										
											2016-05-18 05:12:05 +00:00
+								        'reading':    definition['reading'] or u'',
-												Cleanup

											
										
										
											2016-05-02 03:43:09 +00:00
+								        'glossary':   definition['glossary'],
 								        'sentence':   definition.get('sentence'),
 								        'summary':    summary
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								    }
-												Cleanup of helper functions for card generation


Former-commit-id: 61748bf8d76245d7a11ed2377bc8375bd6ece256
											
										
										
											2013-11-11 01:39:44 +00:00
+								def markupVocabReading(definition):
-												Fixing bugs related to adding kana-only cards, bumping version


Former-commit-id: 298b5275a85d3f60b118846c6fc7b9885702c48a
											
										
										
											2013-12-22 21:57:05 +00:00
+								    if definition['reading']:
 								        return {
 								            'expression': definition['reading'],
-												Cleanup

											
										
										
											2016-05-18 05:12:05 +00:00
+								            'reading':    u'',
-												Cleanup

											
										
										
											2016-05-02 03:43:09 +00:00
+								            'glossary':   definition['glossary'],
 								            'sentence':   definition.get('sentence'),
 								            'summary':    definition['reading']
-												Fixing bugs related to adding kana-only cards, bumping version


Former-commit-id: 298b5275a85d3f60b118846c6fc7b9885702c48a
											
										
										
											2013-12-22 21:57:05 +00:00
+								        }
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Cleanup


Former-commit-id: 9810f65c42e33af17c2db976c5859a60654e2ded
											
										
										
											2013-11-12 03:59:47 +00:00
+								def copyVocabDef(definition):
-												Fixing copy-paste

											
										
										
											2016-05-18 16:26:47 +00:00
+								    glossary = '; '.join(definition['glossary'])
-												Cleanup


Former-commit-id: 9810f65c42e33af17c2db976c5859a60654e2ded
											
										
										
											2013-11-12 03:59:47 +00:00
+								    if definition['reading']:
-												Fixing copy-paste

											
										
										
											2016-05-18 16:26:47 +00:00
+								        result = u'{0}\t{1}\t{2}\n'.format(
 								            definition['expression'],
 								            definition['reading'],
 								            glossary
 								        )
-												Cleanup


Former-commit-id: 9810f65c42e33af17c2db976c5859a60654e2ded
											
										
										
											2013-11-12 03:59:47 +00:00
+								    else:
-												Fixing copy-paste

											
										
										
											2016-05-18 16:26:47 +00:00
+								        result = u'{0}\t{1}\n'.format(
 								            definition['expression'],
 								            glossary
 								        )
-												Cleanup


Former-commit-id: 9810f65c42e33af17c2db976c5859a60654e2ded
											
										
										
											2013-11-12 03:59:47 +00:00
 								    QtGui.QApplication.clipboard().setText(result)
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Cleanup


Former-commit-id: 9810f65c42e33af17c2db976c5859a60654e2ded
											
										
										
											2013-11-12 03:59:47 +00:00
+								def markupKanji(definition):
 								    return {
 								        'character': definition['character'],
-												Cleanup

											
										
										
											2016-05-02 03:43:09 +00:00
+								        'onyomi':    definition['onyomi'],
 								        'kunyomi':   definition['kunyomi'],
 								        'glossary':  definition['glossary'],
 								        'summary':   definition['character']
-												Cleanup


Former-commit-id: 9810f65c42e33af17c2db976c5859a60654e2ded
											
										
										
											2013-11-12 03:59:47 +00:00
+								    }
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Correctly copy Kanji defintions to clipboard


Former-commit-id: 505fff8db8eabb0abfe1f8ff8e6b411ee520563d
											
										
										
											2013-11-14 16:36:26 +00:00
+								def copyKanjiDef(definition):
-												Fixing copy-paste

											
										
										
											2016-05-18 16:26:47 +00:00
+								    result = u'{0}\t{1}\t{2}\t{3}'.format(
 								        definition['character'],
 								        ', '.join(definition['kunyomi']),
 								        ', '.join(definition['onyomi']),
 								        ', '.join(definition['glossary'])
 								    )
 								    QtGui.QApplication.clipboard().setText(result)
-												Correctly copy Kanji defintions to clipboard


Former-commit-id: 505fff8db8eabb0abfe1f8ff8e6b411ee520563d
											
										
										
											2013-11-14 16:36:26 +00:00
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								def buildDefHeader():
-												Cleanup

											
										
										
											2016-05-02 03:43:09 +00:00
+								    palette   = QtGui.QApplication.palette()
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								    toolTipBg = palette.color(QtGui.QPalette.Window).name()
 								    toolTipFg = palette.color(QtGui.QPalette.WindowText).name()
-												Handle glossary in list format

											
										
										
											2016-05-18 05:28:56 +00:00
+								    return u'''
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								        <html><head><style>
 								        body {{ background-color: {0}; color: {1}; font-size: 11pt; }}
 								        span.expression {{ font-size: 15pt; }}
-												Handle glossary in list format

											
										
										
											2016-05-18 05:28:56 +00:00
+								        </style></head><body>'''.format(toolTipBg, toolTipFg)
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
 								def buildDefFooter():
 								    return '</body></html>'
-												Updating UI labels


Former-commit-id: 06c061d606fef268af9acdfc57b769d6f2adeb35
											
										
										
											2013-11-16 19:53:02 +00:00
+								def buildEmpty():
-												Handle glossary in list format

											
										
										
											2016-05-18 05:28:56 +00:00
+								    return u'''
-												Updating UI labels


Former-commit-id: 06c061d606fef268af9acdfc57b769d6f2adeb35
											
										
										
											2013-11-16 19:53:02 +00:00
+								        <p>No definitions to display.</p>
 								        <p>Mouse over text with the <em>middle mouse button</em> or <em>shift key</em> pressed to search.</p>
-												Handle glossary in list format

											
										
										
											2016-05-18 05:28:56 +00:00
+								        <p>You can also also input terms in the search box below.'''
-												Updating UI labels


Former-commit-id: 06c061d606fef268af9acdfc57b769d6f2adeb35
											
										
										
											2013-11-16 19:53:02 +00:00
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								def buildVocabDef(definition, index, query):
-												Cleanup

											
										
										
											2016-05-18 05:12:05 +00:00
+								    reading = u''
-												Switching dictionary to return values in python dictionaries instead of tuples


Former-commit-id: 3f0682e88a24faed24f9e12e7c9cee338e817672
											
										
										
											2013-11-09 23:42:02 +00:00
+								    if definition['reading']:
-												Cleanup of HTML generation code


Former-commit-id: b7080d6c0970944494c07ccd5c3c35719b34b660
											
										
										
											2014-12-28 12:46:01 +00:00
+								        reading = u'<span class="reading">[{0}]<br></span>'.format(definition['reading'])
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Cleanup

											
										
										
											2016-05-18 05:12:05 +00:00
+								    rules = u''
-												Can now import Kindle vocab decks


Former-commit-id: 79282c1efd08bc501505850d1613926f479a95b0
											
										
										
											2014-12-20 11:39:24 +00:00
+								    if definition.get('rules'):
-												Improvements to text scanning and deinflection display


Former-commit-id: 94bfd5c174c2f68dfb85b2040a272e4523f9e799
											
										
										
											2013-11-18 04:21:57 +00:00
+								        rules = ' &lt; '.join(definition['rules'])
-												Cleanup of HTML generation code


Former-commit-id: b7080d6c0970944494c07ccd5c3c35719b34b660
											
										
										
											2014-12-28 12:46:01 +00:00
+								        rules = '<span class="rules">({0})<br></span>'.format(rules)
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Cleanup of HTML generation code


Former-commit-id: b7080d6c0970944494c07ccd5c3c35719b34b660
											
										
										
											2014-12-28 12:46:01 +00:00
+								    links = '<a href="copyVocabDef:{0}"><img src="://img/img/icon_copy_definition.png" align="right"></a>'.format(index)
-												Updating Kanji lookup, temporarily disabling fancy search


Former-commit-id: c6e298b51f4d5ae8596244fe97e227bc8fa2dc18
											
										
										
											2013-11-14 17:22:20 +00:00
+								    if query is not None:
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								        if query('vocab', markupVocabExp(definition)):
-												Cleanup of HTML generation code


Former-commit-id: b7080d6c0970944494c07ccd5c3c35719b34b660
											
										
										
											2014-12-28 12:46:01 +00:00
+								            links += '<a href="addVocabExp:{0}"><img src="://img/img/icon_add_expression.png" align="right"></a>'.format(index)
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								        if query('vocab', markupVocabReading(definition)):
-												Cleanup of HTML generation code


Former-commit-id: b7080d6c0970944494c07ccd5c3c35719b34b660
											
										
										
											2014-12-28 12:46:01 +00:00
+								            links += '<a href="addVocabReading:{0}"><img src="://img/img/icon_add_reading.png" align="right"></a>'.format(index)
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Fixing copy-paste

											
										
										
											2016-05-18 16:26:47 +00:00
+								    glossary = u'<ol>'
 								    for g in definition['glossary']:
 								        glossary += u'<li>{0}</li>'.format(g)
 								    glossary += u'</ol>'
-												Handle glossary in list format

											
										
										
											2016-05-18 05:28:56 +00:00
+								    html = u'''
-												Cleanup of HTML generation code


Former-commit-id: b7080d6c0970944494c07ccd5c3c35719b34b660
											
										
										
											2014-12-28 12:46:01 +00:00
+								        <span class="links">{0}</span>
 								        <span class="expression">{1}<br></span>
-												Updating formatting for HTML output


Former-commit-id: 9f3bb3a0f42e0ab0b074e84f40044c07a4e0db91
											
										
										
											2013-11-16 20:30:20 +00:00
+								        {2}
-												Cleanup of HTML generation code


Former-commit-id: b7080d6c0970944494c07ccd5c3c35719b34b660
											
										
										
											2014-12-28 12:46:01 +00:00
+								        <span class="glossary">{3}<br></span>
-												Updating formatting for HTML output


Former-commit-id: 9f3bb3a0f42e0ab0b074e84f40044c07a4e0db91
											
										
										
											2013-11-16 20:30:20 +00:00
+								        {4}
-												Fixing copy-paste

											
										
										
											2016-05-18 16:26:47 +00:00
+								        <br clear="all">'''.format(links, definition['expression'], reading, glossary, rules)
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
 								    return html
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								def buildVocabDefs(definitions, query):
 								    html = buildDefHeader()
-												Switching dictionary to return values in python dictionaries instead of tuples


Former-commit-id: 3f0682e88a24faed24f9e12e7c9cee338e817672
											
										
										
											2013-11-09 23:42:02 +00:00
+								    if len(definitions) > 0:
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								        for i, definition in enumerate(definitions):
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								            html += buildVocabDef(definition, i, query)
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
+								    else:
-												Updating UI labels


Former-commit-id: 06c061d606fef268af9acdfc57b769d6f2adeb35
											
										
										
											2013-11-16 19:53:02 +00:00
+								        html += buildEmpty()
-												initial drop

											
										
										
											2011-08-28 18:01:32 +00:00
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
+								    return html + buildDefFooter()
 								def buildKanjiDef(definition, index, query):
 								    """Return the HTML fragment describing a single kanji definition.

 								    definition -- mapping read through the keys 'character', 'kunyomi',
 								                  'onyomi' and 'glossary'; the last three are joined
 								                  with ', ' for display.
 								    index      -- value embedded in the 'copyKanjiDef:' / 'addKanji:' hrefs.
 								    query      -- None, or a callable invoked as
 								                  query('kanji', markupKanji(definition)); a truthy
 								                  result adds the 'addKanji' link after the copy link.
 								    """

 								    anchors = '<a href="copyKanjiDef:{0}"><img src="://img/img/icon_copy_definition.png" align="right"></a>'.format(index)
 								    if query is not None:
 								        if query('kanji', markupKanji(definition)):
 								            anchors = anchors + '<a href="addKanji:{0}"><img src="://img/img/icon_add_expression.png" align="right"></a>'.format(index)

 								    readingText = ', '.join(definition['kunyomi'] + definition['onyomi'])
 								    glossaryText = ', '.join(definition['glossary'])

 								    # Adjacent literals are merged at compile time into one template
 								    # string; every row starts with a newline and eight spaces.
 								    template = (
 								        u'\n        <span class="links">{0}</span>'
 								        u'\n        <span class="expression">{1}<br></span>'
 								        u'\n        <span class="reading">[{2}]<br></span>'
 								        u'\n        <span class="glossary">{3}<br></span>'
 								        u'\n        <br clear="all">'
 								    )

 								    return template.format(anchors, definition['character'], readingText, glossaryText)
-												Some basic support for displaying information about characters


Former-commit-id: 895554df1f912021309091c88cd5b3c2a8b7211f
											
										
										
											2013-11-11 04:27:25 +00:00
 								def buildKanjiDefs(definitions, query):
 								    """Return the HTML for a sequence of kanji definitions.

 								    The result is buildDefHeader(), followed by one buildKanjiDef()
 								    fragment per entry (each receiving its position in the sequence and
 								    the given query), followed by buildDefFooter(). When definitions has
 								    length zero, the output of buildEmpty() takes the place of the
 								    per-entry fragments.
 								    """

 								    page = buildDefHeader()

 								    if len(definitions) == 0:
 								        page += buildEmpty()
 								    else:
 								        for position, entry in enumerate(definitions):
 								            page += buildKanjiDef(entry, position, query)

 								    return page + buildDefFooter()
-												Stub for importing word list


Former-commit-id: ee45d2c32f6ec50a4ab38cd5e139636b103efa9f
											
										
										
											2014-12-20 11:19:22 +00:00
 								def extractKindleDeck(filename):
 								    """Return the values of the 'word' column of the WORDS table in an SQLite file.

 								    filename -- path of the database; it is passed through unicode()
 								                before being handed to sqlite3.connect().

 								    The import is best-effort: any sqlite3.DatabaseError (missing
 								    table, unreadable file, a file that is not an SQLite database at
 								    all, ...) is swallowed and whatever was collected up to that point
 								    is returned, which is an empty list in the usual failure case.
 								    """

 								    words = []
 								    try:
 								        db = sqlite3.connect(unicode(filename))
 								        try:
 								            for row in db.execute('select word from WORDS'):
 								                words.append(row[0])
 								        finally:
 								            # Using the connection as a context manager only commits or
 								            # rolls back; it never closes, so close explicitly here.
 								            db.close()
 								    except sqlite3.DatabaseError:
 								        # DatabaseError is the parent of OperationalError; it also covers
 								        # the "file is not a database" failure raised for arbitrary files.
 								        pass

 								    return words
-												Allow text word lists to be imported


Former-commit-id: ac96ec75dd83094a5dd1455a77f2d0fb68bed0b7
											
										
										
											2014-12-24 08:26:05 +00:00
def extractWordList(filename):
    """Return the list of words found in a UTF-8 encoded text file.

    filename -- path of the text file; it is passed through unicode()
                before being opened.

    The file content is split on semicolons, commas and whitespace, and
    empty pieces (produced by consecutive separators or by leading and
    trailing separators) are dropped. I/O and decoding errors propagate
    to the caller.
    """

    # 'utf-8-sig' decodes plain UTF-8 and additionally discards a leading
    # byte order mark, which would otherwise stay attached to the first word.
    with codecs.open(unicode(filename), 'rb', 'utf-8-sig') as fp:
        content = fp.read()

    # re.UNICODE makes \s match non-ASCII whitespace as well (for example
    # the ideographic space U+3000), which Python 2 skips by default.
    separators = re.compile(r'[;,\s]', re.UNICODE)

    return [word for word in separators.split(content) if word]