awtk/tools/ime_gen/to_t9_zh.js
2020-04-21 10:22:05 +08:00

89 lines
1.8 KiB
JavaScript

const fs = require('fs');
const helper = require('./helper');
function toT9(filename, onlySimpleChinese) {
let obj = {}
let result = ''
const content = fs.readFileSync(filename, "utf16le");
const lines = content.split('\n');
lines.forEach((line, index) => {
const words = line.split(' ');
const char = words[0];
const freq = parseFloat(words[1]);
const tw = words[2] === '1';
const pinyin = helper.mergePinyin(words);
const key = helper.mapStr(pinyin);
const notExist = !obj[key];
if (!key) {
return;
}
if (onlySimpleChinese && tw) {
return;
}
console.log(`${pinyin} => ${key}`);
if (notExist) {
obj[key] = {
pinyin: '',
key: key,
items: []
}
}
let value = obj[key];
if (value.pinyin.indexOf(' ' + pinyin) < 0) {
value.pinyin = value.pinyin + ' ' + pinyin;
}
value.items.push({
pinyin: pinyin,
char: char,
freq: freq
});
});
let arr = []
for (let key in obj) {
let value = obj[key];
if (value.items.length == 0) {
continue;
}
value.items.sort((a, b) => {
return b.freq - a.freq;
});
result += `/*${value.pinyin}*/\n`;
result += `static const char* s_${key}[] = {\n`
value.items.forEach(iter => {
result += ` \"${iter.char}\",\n`;
});
result += ' NULL\n';
result += '};\n';
arr.push(value);
}
arr.sort((a, b) => {
return a.key.localeCompare(b.key);
});
result += `static const table_entry_t s_t9_numbers_pinyin[] = {\n`;
arr.forEach(iter => {
let key = iter.key;
let pinyin = iter.items[0].pinyin;
result += ` {"${key}", "${pinyin}", s_${key}},\n`
});
result += '};\n';
helper.saveResult(`t9_zh_cn.inc`, result);
}
toT9('chinese_words.txt', true);