1
zero-epwing/gaiji.c
2016-11-20 20:10:58 -08:00

210 lines
5.2 KiB
C

/*
* Copyright (C) 2016 Alex Yatskov <alex@foosoft.net>
* Author: Alex Yatskov <alex@foosoft.net>
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
#include <string.h>
#include <stdbool.h>
#include <assert.h>
#include "util.h"
#include "gaiji.h"
/*
* Macros
*/
/*
 * Expands to a brace-enclosed initializer for one Gaiji_Context entry.
 *
 * name: value placed first in the initializer (the callers in this file
 *       pass the book title as a string literal).
 * ents: table suffix; token-pasted to form gaiji_table_<ents>_wide and
 *       gaiji_table_<ents>_narrow, each followed by its ARRSIZE() count.
 *
 * The values are positional, so their order must match the field order of
 * Gaiji_Context.
 * NOTE(review): the struct is declared outside this file (presumably in
 * gaiji.h) -- confirm the order is name, wide table, wide count,
 * narrow table, narrow count.
 */
#define GAIJI_CONTEXT(name, ents) {\
name,\
gaiji_table_##ents##_wide,\
ARRSIZE(gaiji_table_##ents##_wide),\
gaiji_table_##ents##_narrow,\
ARRSIZE(gaiji_table_##ents##_narrow)\
}
/*
* Local data
*/
#include "tables/gaiji_table_chujiten.h"
#include "tables/gaiji_table_daijirin.h"
#include "tables/gaiji_table_daijisen.h"
#include "tables/gaiji_table_genius.h"
#include "tables/gaiji_table_kojien.h"
#include "tables/gaiji_table_meikyojj.h"
#include "tables/gaiji_table_meikyou.h"
#include "tables/gaiji_table_snmkg99.h"
#include "tables/gaiji_table_wadai5.h"
/*
 * Known gaiji contexts, one per supported dictionary. Each entry pairs a
 * title string with that dictionary's wide and narrow gaiji tables; the
 * title is what gaiji_context_select() compares against with strcmp().
 *
 * NOTE(review): tables/gaiji_table_meikyou.h is included above but no
 * entry here references a "meikyou" table -- confirm whether that is
 * intentional.
 * NOTE(review): the title for snmkg99 ends with a trailing space; since
 * lookup is an exact strcmp(), presumably this mirrors the title as
 * reported by the book data -- verify before "cleaning it up".
 */
static const Gaiji_Context gaiji_contexts[] = {
GAIJI_CONTEXT("ジーニアス英和辞典", genius),
GAIJI_CONTEXT("スーパー大辞林", daijirin),
GAIJI_CONTEXT("大辞泉", daijisen),
GAIJI_CONTEXT("広辞苑第六版", kojien),
GAIJI_CONTEXT("新和英大辞典", wadai5),
GAIJI_CONTEXT("新明解国語辞典 ", snmkg99),
GAIJI_CONTEXT("新英和・和英中辞典", chujiten),
GAIJI_CONTEXT("明鏡国語辞典", meikyojj),
};
/*
* Local functions
*/
/*
 * Converts one lowercase hexadecimal digit ('0'-'9', 'a'-'f') to its
 * numeric value (0-15). Any other character, including uppercase hex
 * digits, yields 0.
 */
static int ascii_to_nibble(char c) {
    int value = 0;

    if ('0' <= c && c <= '9') {
        value = c - '0';
    }
    else if ('a' <= c && c <= 'f') {
        value = (c - 'a') + 0x0a;
    }

    return value;
}
/*
 * Converts a value in the range 0-15 to its lowercase hexadecimal digit.
 * Returns 0 (NUL) for any value outside that range; negative values are
 * rejected explicitly so they can never index before the lookup table.
 */
static char nibble_to_ascii(int n) {
    /* static: the table is built once instead of on every call. */
    static const char hex[] = "0123456789abcdef";

    if (n < 0 || n > 0x0f) {
        return 0;
    }

    return hex[n];
}
/*
 * Reports whether c is a lowercase hexadecimal digit ('0'-'9' or 'a'-'f').
 * Uppercase 'A'-'F' are not accepted.
 */
static bool is_ascii_nibble(char c) {
    if (c >= '0' && c <= '9') {
        return true;
    }

    return c >= 'a' && c <= 'f';
}
/*
 * Writes a gaiji stub of the form "{#<hex>}" into output, where <hex> is
 * two lowercase hex digits for each byte of utf8 (reading stops at the
 * first NUL byte or after MAX_UTF8_BYTES bytes, whichever comes first).
 *
 * output: destination buffer.
 * size:   capacity of output in bytes, including the terminating NUL.
 * utf8:   bytes to encode.
 *
 * The result is always NUL-terminated and never exceeds size bytes. If the
 * buffer cannot hold the whole sequence, only whole bytes (hex pairs) that
 * fit are emitted and the closing brace is still written, so the stub stays
 * well formed. If even the empty stub "{#}" does not fit (size < 4), output
 * is set to the empty string. Nothing is written when size <= 0.
 */
static void encode_sequence(char output[], int size, const char utf8[]) {
    if (output == NULL || size <= 0) {
        return;
    }

    output[0] = 0;

    /* "{#" + "}" + NUL is the smallest stub that can be represented. */
    if (size < 4) {
        return;
    }

    int offset = 0;
    output[offset++] = '{';
    output[offset++] = '#';

    for (int i = 0; i < MAX_UTF8_BYTES; ++i) {
        const unsigned char byte = utf8[i];
        if (byte == 0) {
            break;
        }

        /* Need room for two hex digits, the closing brace and the NUL. */
        if (size - offset < 4) {
            break;
        }

        output[offset++] = nibble_to_ascii(byte >> 0x04);
        output[offset++] = nibble_to_ascii(byte & 0x0f);
    }

    output[offset++] = '}';
    output[offset] = 0;
}
/*
* Exported functions
*/
/*
 * Looks up the gaiji context whose name is exactly equal to the given
 * string (byte-wise strcmp comparison against each gaiji_contexts entry,
 * in table order).
 *
 * Returns a pointer to the matching entry in the static table, or NULL
 * when no entry has that name.
 */
const Gaiji_Context* gaiji_context_select(const char name[]) {
    const Gaiji_Context* const end = gaiji_contexts + ARRSIZE(gaiji_contexts);

    for (const Gaiji_Context* candidate = gaiji_contexts; candidate < end; ++candidate) {
        if (strcmp(candidate->name, name) == 0) {
            return candidate;
        }
    }

    return NULL;
}
/*
 * Writes the stub for gaiji character `code` into output.
 *
 * output:  destination buffer.
 * size:    capacity of output in bytes, including the terminating NUL.
 * code:    gaiji code to look up.
 * context: table set to search; may be NULL.
 * width:   selects the wide or the narrow table of the context.
 *
 * When the code is found in the selected table, its UTF-8 bytes are written
 * via encode_sequence(). Otherwise (NULL context, or code not present) the
 * placeholder "<?>" is written, truncated to fit and NUL-terminated.
 * Nothing is written when output is NULL or size <= 0.
 */
void gaiji_stub_encode(char output[], int size, int code, const Gaiji_Context* context, Gaiji_Width width) {
    /* Without this guard the placeholder path would write output[size - 1]
     * out of bounds and pass a negative length to strncpy. */
    if (output == NULL || size <= 0) {
        return;
    }

    if (context != NULL) {
        const Gaiji_Entry* entries = NULL;
        int count = 0;

        switch (width) {
            case GAIJI_WIDTH_WIDE:
                entries = context->table_wide;
                count = context->count_wide;
                break;
            case GAIJI_WIDTH_NARROW:
                entries = context->table_narrow;
                count = context->count_narrow;
                break;
            default:
                /* Unknown width: entries stays NULL, caught by the assert
                 * below in debug builds; release builds fall through to
                 * the placeholder because count is 0. */
                break;
        }

        assert(entries != NULL);

        for (int i = 0; i < count; ++i) {
            if (entries[i].code == code) {
                encode_sequence(output, size, entries[i].utf8);
                return;
            }
        }
    }

    strncpy(output, "<?>", size);
    output[size - 1] = 0; /* strncpy does not terminate on truncation */
}
/*
 * Copies input to output, replacing every gaiji stub "{#<hex>}" with the
 * raw bytes its lowercase hex digit pairs encode. Text outside stubs is
 * copied unchanged.
 *
 * output: destination buffer.
 * size:   capacity of output in bytes, including the terminating NUL.
 * input:  NUL-terminated string, possibly containing stubs.
 *
 * At most size - 1 bytes are produced and the result is always
 * NUL-terminated. Decoding stops early if the input ends in the middle of
 * a stub. Nothing is written when output is NULL or size <= 0; a NULL
 * input produces an empty string.
 *
 * Stub contents are expected to be lowercase hex digits; this is checked
 * with assert() only, so release builds decode any other character as a
 * zero nibble.
 */
void gaiji_stub_decode(char output[], int size, const char input[]) {
    /* Without this guard the final terminator would be written to
     * output[0] even though the buffer has no room for it. */
    if (output == NULL || size <= 0) {
        return;
    }

    if (input == NULL) {
        output[0] = 0;
        return;
    }

    const char* ptr_in = input;
    char* ptr_out = output;
    char* const ptr_end = output + size - 1; /* last slot is kept for the NUL */
    bool decode = false;

    while (*ptr_in != 0 && ptr_out < ptr_end) {
        if (strncmp(ptr_in, "{#", 2) == 0) {
            decode = true;
            ptr_in += 2;
        }

        if (!decode) {
            *ptr_out++ = *ptr_in++;
            continue;
        }

        const char high_ascii = ptr_in[0];
        if (high_ascii == 0) {
            break;
        }

        if (high_ascii == '}') {
            /* End of stub: consume only the brace. */
            decode = false;
            ++ptr_in;
            continue;
        }

        const char low_ascii = ptr_in[1];
        if (low_ascii == 0) {
            break;
        }

        assert(is_ascii_nibble(high_ascii));
        assert(is_ascii_nibble(low_ascii));

        *ptr_out++ = ascii_to_nibble(high_ascii) << 0x04 | ascii_to_nibble(low_ascii);
        ptr_in += 2;
    }

    *ptr_out = 0;
}