1
yomichan-import/frequency.go

91 lines
2.6 KiB
Go
Raw Normal View History

2017-09-10 20:25:11 +00:00
/*
* Copyright (c) 2017 Alex Yatskov <alex@foosoft.net>
* Author: Alex Yatskov <alex@foosoft.net>
*
* Permission is hereby granted, free of charge, to any person obtaining a copy of
* this software and associated documentation files (the "Software"), to deal in
* the Software without restriction, including without limitation the rights to
* use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
* the Software, and to permit persons to whom the Software is furnished to do so,
* subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in all
* copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
* FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
* COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
* IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
package main
import (
"bufio"
"os"
"strconv"
"strings"
)
const frequencyRevision = "frequency1"
2017-09-10 20:45:06 +00:00
func frequencyTermsExportDb(inputPath, outputPath, language, title string, stride int, pretty bool) error {
2017-09-23 06:03:05 +00:00
return frequncyExportDb(inputPath, outputPath, language, title, stride, pretty, "term_meta")
2017-09-10 20:45:06 +00:00
}
func frequencyKanjiExportDb(inputPath, outputPath, language, title string, stride int, pretty bool) error {
2017-09-23 06:03:05 +00:00
return frequncyExportDb(inputPath, outputPath, language, title, stride, pretty, "kanji_meta")
2017-09-10 20:45:06 +00:00
}
func frequncyExportDb(inputPath, outputPath, language, title string, stride int, pretty bool, key string) error {
2017-09-10 20:25:11 +00:00
reader, err := os.Open(inputPath)
if err != nil {
return err
}
defer reader.Close()
2017-09-23 06:03:05 +00:00
var frequencies dbMetaList
2017-09-10 20:25:11 +00:00
for scanner := bufio.NewScanner(reader); scanner.Scan(); {
line := scanner.Text()
if strings.HasPrefix(line, "#") {
continue
}
parts := strings.Split(line, "\t")
2017-09-23 19:50:54 +00:00
if len(parts) < 2 {
2017-09-10 20:25:11 +00:00
continue
}
expression := parts[0]
count, err := strconv.Atoi(parts[1])
if err != nil {
2017-09-23 19:50:54 +00:00
expression = parts[1]
count, err = strconv.Atoi(parts[0])
if err != nil {
continue
}
2017-09-10 20:25:11 +00:00
}
2017-09-23 06:03:05 +00:00
frequencies = append(frequencies, dbMeta{expression, "freq", count})
2017-09-10 20:25:11 +00:00
}
2017-09-12 20:51:49 +00:00
if title == "" {
title = "Frequency"
}
2017-09-10 20:25:11 +00:00
recordData := map[string]dbRecordList{
2017-09-10 20:45:06 +00:00
key: frequencies.crush(),
2017-09-10 20:25:11 +00:00
}
return writeDb(
outputPath,
title,
frequencyRevision,
recordData,
stride,
pretty,
)
}