2017-03-25 17:05:03 +00:00
|
|
|
/*
|
2020-01-01 17:00:00 +00:00
|
|
|
* Copyright (C) 2017-2020 Alex Yatskov <alex@foosoft.net>
|
2017-03-25 17:05:03 +00:00
|
|
|
* Author: Alex Yatskov <alex@foosoft.net>
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
2020-01-01 17:00:31 +00:00
|
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>.
|
2017-03-25 17:05:03 +00:00
|
|
|
*/
|
|
|
|
|
2020-03-11 02:30:36 +00:00
|
|
|
/* global
|
|
|
|
* jpIsStringEntirelyKana
|
|
|
|
*/
|
2017-03-25 17:05:03 +00:00
|
|
|
|
2020-03-07 19:36:16 +00:00
|
|
|
/**
 * Builds audio URIs for a dictionary definition from one of several named
 * audio sources ('jpod101', 'jpod101-alternate', 'jisho', 'text-to-speech',
 * 'text-to-speech-reading', 'custom').
 *
 * Relies on the following names being available in the global scope at call
 * time: jpIsStringEntirelyKana, hasOwn, XMLHttpRequest and DOMParser.
 */
class AudioUriBuilder {
    constructor() {
        // Maps a source name to the bound handler that produces its URI.
        this._getUrlHandlers = new Map([
            ['jpod101', this._getUriJpod101.bind(this)],
            ['jpod101-alternate', this._getUriJpod101Alternate.bind(this)],
            ['jisho', this._getUriJisho.bind(this)],
            ['text-to-speech', this._getUriTextToSpeech.bind(this)],
            ['text-to-speech-reading', this._getUriTextToSpeechReading.bind(this)],
            ['custom', this._getUriCustom.bind(this)]
        ]);
    }

    /**
     * Turns a scheme-relative, root-relative or path-relative URL into an
     * absolute one. URLs that already start with a URI scheme, and falsy
     * values, are returned unchanged.
     *
     * @param {?string} url - The URL to normalize.
     * @param {string} baseUrl - Scheme and host without a trailing slash,
     *   e.g. 'https://jisho.org'.
     * @param {string} basePath - Path prefix (with leading and trailing slash)
     *   used for path-relative URLs, e.g. '/search/'.
     * @returns {?string} The normalized URL, or the input itself if it is falsy.
     */
    normalizeUrl(url, baseUrl, basePath) {
        if (!url) {
            return url;
        }

        if (url.startsWith('//')) {
            // Scheme-relative: borrow the scheme (including ':') from baseUrl.
            return baseUrl.substring(0, baseUrl.indexOf(':') + 1) + url;
        }

        if (url.startsWith('/')) {
            // Root-relative: resolve against the host.
            return baseUrl + url;
        }

        if (!/^[a-z][a-z0-9\-+.]*:/i.test(url)) {
            // No URI scheme => relative path
            return baseUrl + basePath + url;
        }

        return url;
    }

    /**
     * Resolves the audio URI for a definition using the named source.
     *
     * @param {object} definition - Object whose `expression` and `reading`
     *   properties are read by the handlers.
     * @param {string} source - One of the handler keys registered in the
     *   constructor.
     * @param {object} options - Options object; the text-to-speech and custom
     *   handlers read `options.audio`.
     * @returns {Promise<?string>} The URI, or null if the source is unknown or
     *   its handler failed.
     */
    async getUri(definition, source, options) {
        const handler = this._getUrlHandlers.get(source);
        if (typeof handler !== 'function') {
            return null;
        }

        try {
            return await handler(definition, options);
        } catch (e) {
            // Deliberately best-effort: any handler failure is reported to the
            // caller as "no URI" (null) rather than as an exception.
            return null;
        }
    }

    /**
     * Builds the languagepod101 audio URL from the definition's expression and
     * reading. When there is no reading and the expression is entirely kana,
     * the expression is sent as the kana parameter instead.
     *
     * @param {object} definition
     * @returns {Promise<string>}
     */
    async _getUriJpod101(definition) {
        let kana = definition.reading;
        let kanji = definition.expression;

        if (!kana && jpIsStringEntirelyKana(kanji)) {
            kana = kanji;
            kanji = null;
        }

        const params = [];
        if (kanji) {
            params.push(`kanji=${encodeURIComponent(kanji)}`);
        }
        if (kana) {
            params.push(`kana=${encodeURIComponent(kana)}`);
        }

        return `https://assets.languagepod101.com/dictionary/japanese/audiomp3.php?${params.join('&')}`;
    }

    /**
     * Scrapes the japanesepod101 dictionary search results for an audio
     * source whose reading matches the definition (or the first result with
     * audio when the definition has no reading).
     *
     * @param {object} definition
     * @returns {Promise<string>}
     * @throws {Error} If the request fails or no matching audio is found.
     */
    async _getUriJpod101Alternate(definition) {
        const response = await this._requestText(
            'POST',
            'https://www.japanesepod101.com/learningcenter/reference/dictionary_post',
            `post=dictionary_reference&match_type=exact&search_query=${encodeURIComponent(definition.expression)}`,
            'application/x-www-form-urlencoded'
        );

        const dom = new DOMParser().parseFromString(response, 'text/html');
        for (const row of dom.getElementsByClassName('dc-result-row')) {
            // Rows lacking either the audio source or the kana node are skipped.
            const sourceNode = row.querySelector('audio>source[src]');
            const readingNode = row.getElementsByClassName('dc-vocab_kana').item(0);
            if (sourceNode === null || readingNode === null) {
                continue;
            }

            const url = sourceNode.getAttribute('src');
            const reading = readingNode.textContent;
            if (url && reading && (!definition.reading || definition.reading === reading)) {
                return this.normalizeUrl(url, 'https://www.japanesepod101.com', '/learningcenter/reference/');
            }
        }

        throw new Error('Failed to find audio URL');
    }

    /**
     * Scrapes the jisho.org search page for the audio element whose id is
     * `audio_<expression>:<reading>`.
     *
     * @param {object} definition
     * @returns {Promise<string>}
     * @throws {Error} If the request fails or no audio is found.
     */
    async _getUriJisho(definition) {
        // The expression is percent-encoded so that characters such as '/',
        // '?', '#' or '%' cannot alter the path or query of the request URL.
        const response = await this._requestText(
            'GET',
            `https://jisho.org/search/${encodeURIComponent(definition.expression)}`
        );

        const dom = new DOMParser().parseFromString(response, 'text/html');
        const audio = dom.getElementById(`audio_${definition.expression}:${definition.reading}`);
        if (audio !== null) {
            const sourceNode = audio.getElementsByTagName('source').item(0);
            const url = (sourceNode !== null ? sourceNode.getAttribute('src') : null);
            if (url) {
                return this.normalizeUrl(url, 'https://jisho.org', '/search/');
            }
        }

        throw new Error('Failed to find audio URL');
    }

    /**
     * Builds a `tts:` URI that speaks the definition's expression.
     *
     * @param {object} definition
     * @param {object} options - Reads `options.audio.textToSpeechVoice`.
     * @returns {Promise<string>}
     * @throws {Error} If no voice is configured.
     */
    async _getUriTextToSpeech(definition, options) {
        return this._buildTtsUri(definition.expression, options);
    }

    /**
     * Builds a `tts:` URI that speaks the definition's reading, falling back
     * to the expression when the reading is falsy.
     *
     * @param {object} definition
     * @param {object} options - Reads `options.audio.textToSpeechVoice`.
     * @returns {Promise<string>}
     * @throws {Error} If no voice is configured.
     */
    async _getUriTextToSpeechReading(definition, options) {
        return this._buildTtsUri(definition.reading || definition.expression, options);
    }

    /**
     * Expands `{name}` placeholders in `options.audio.customSourceUrl` with
     * the definition's own property of that name. Placeholders that do not
     * name an own property of the definition are left as-is.
     *
     * @param {object} definition
     * @param {object} options - Reads `options.audio.customSourceUrl`.
     * @returns {Promise<string>}
     * @throws {Error} If the custom source URL is not a string.
     */
    async _getUriCustom(definition, options) {
        const customSourceUrl = options.audio.customSourceUrl;
        if (typeof customSourceUrl !== 'string') {
            throw new Error('No custom URL defined');
        }
        return customSourceUrl.replace(/\{([^}]*)\}/g, (m0, m1) => (hasOwn(definition, m1) ? `${definition[m1]}` : m0));
    }

    /**
     * Formats the `tts:` URI shared by both text-to-speech handlers.
     *
     * @param {string} text - Text to be spoken.
     * @param {object} options - Reads `options.audio.textToSpeechVoice`.
     * @returns {string}
     * @throws {Error} If no voice is configured.
     */
    _buildTtsUri(text, options) {
        const voiceURI = options.audio.textToSpeechVoice;
        if (!voiceURI) {
            throw new Error('No voice');
        }
        return `tts:?text=${encodeURIComponent(text)}&voice=${encodeURIComponent(voiceURI)}`;
    }

    /**
     * Performs an XMLHttpRequest and resolves with the response text.
     *
     * @param {string} method - HTTP method.
     * @param {string} url - Request URL.
     * @param {?string} [body=null] - Request body, if any.
     * @param {?string} [contentType=null] - Value for the Content-Type header,
     *   if one should be sent.
     * @returns {Promise<string>} Resolves with `responseText` on the 'load'
     *   event; rejects on the 'error' event.
     */
    _requestText(method, url, body = null, contentType = null) {
        return new Promise((resolve, reject) => {
            const xhr = new XMLHttpRequest();
            xhr.open(method, url);
            if (contentType !== null) {
                xhr.setRequestHeader('Content-Type', contentType);
            }
            xhr.addEventListener('error', () => reject(new Error('Failed to scrape audio data')));
            xhr.addEventListener('load', () => resolve(xhr.responseText));
            xhr.send(body);
        });
    }
}
|