/* * Copyright (c) 2016 Alex Yatskov * Author: Alex Yatskov * * Permission is hereby granted, free of charge, to any person obtaining a copy of * this software and associated documentation files (the "Software"), to deal in * the Software without restriction, including without limitation the rights to * use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of * the Software, and to permit persons to whom the Software is furnished to do so, * subject to the following conditions: * * The above copyright notice and this permission notice shall be included in all * copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS * FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR * COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER * IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ package main import ( "encoding/json" "io" "io/ioutil" "regexp" ) type epwingEntry struct { Heading string `json:"heading"` Text string `json:"text"` } type epwingSubbook struct { Title string `json:"title"` Copyright string `json:"copyright"` Entries []epwingEntry `json:"entries"` } type epwingBook struct { CharCode string `json:"charCode"` DiscCode string `json:"discCode"` Subbooks []epwingSubbook `json:"subbooks"` } type epwingExtractor interface { extractTerms(entry epwingEntry) []dbTerm extractKanji(entry epwingEntry) []dbKanji } type daijirinExtractor struct { partsExp *regexp.Regexp phonExp *regexp.Regexp variantExp *regexp.Regexp annotExp *regexp.Regexp } func exportEpwingDb(outputDir, title string, reader io.Reader, flags int) error { data, err := ioutil.ReadAll(reader) if err != nil { return err } var book epwingBook if err := json.Unmarshal(data, &book); err != nil { return err } epwingExtractors := map[string]epwingExtractor{ "三省堂 スーパー大辞林": makeDaijirinExtractor(), } var terms dbTermList var kanji dbKanjiList for _, subbook := range book.Subbooks { if extractor, ok := epwingExtractors[subbook.Title]; ok { for _, entry := range subbook.Entries { terms = append(terms, extractor.extractTerms(entry)...) kanji = append(kanji, extractor.extractKanji(entry)...) } } } return writeDb( outputDir, title, terms.crush(), kanji.crush(), nil, flags&flagPretty == flagPretty, ) }