344 lines
9.3 KiB
TypeScript
Raw Normal View History

2024-07-01 21:36:47 +08:00
// ToolGood.Words.Translate.js
// 2020, Lin Zhijun, https://github.com/toolgood/ToolGood.Words
// Licensed under the Apache License 2.0
import {_s2t_s, _s2t_t, _t2hk_t, _t2hk_hk, _t2s_s, _t2tw_t, _t2s_t, _t2tw_tw} from './TranslateWord'
class TrieNode {
Index = 0;
Layer = 0;
End = false;
Char = '';
Results = [];
m_values = {};
Failure = null;
Parent = null;
public Add(c) {
if (this.m_values[c] != null) {
return this.m_values[c];
}
var node = new TrieNode();
node.Parent = this;
node.Char = c;
this.m_values[c] = node;
return node;
}
public SetResults(index) {
if (this.End == false) {
this.End = true;
}
this.Results.push(index)
}
}
class TrieNode2 {
End = false;
Results = [];
m_values = {};
minflag = 1;
maxflag = 0;
public Add(c, node3) {
if (typeof c !== 'number') {
c = parseInt(c);
}
if (this.minflag > c) {
this.minflag = c;
}
if (this.maxflag < c) {
this.maxflag = c;
}
this.m_values[c] = node3;
}
public SetResults(index) {
if (this.End == false) {
this.End = true;
}
if (this.Results.indexOf(index) == -1) {
this.Results.push(index);
}
}
public HasKey(c) {
return this.m_values[c] != undefined;
}
public TryGetValue(c) {
if (this.minflag <= c && this.maxflag >= c) {
return this.m_values[c];
}
return null;
}
}
class WordsSearch {
_first: TrieNode2 = null;
_keywords = [];
_others = [];
public SetKeywords(keywords) {
this._keywords = keywords;
let root = new TrieNode();
let allNodeLayer = {};
for (let i = 0; i < this._keywords.length; i++) {
let p = this._keywords[i];
let nd = root;
for (let j = 0; j < p.length; j++) {
nd = nd.Add(p.charCodeAt(j));
if (nd.Layer == 0) {
nd.Layer = j + 1;
if (allNodeLayer[nd.Layer]) {
allNodeLayer[nd.Layer].push(nd)
} else {
allNodeLayer[nd.Layer] = [];
allNodeLayer[nd.Layer].push(nd)
}
}
}
nd.SetResults(i);
}
let allNode: TrieNode[] = [];
allNode.push(root);
for (let key in allNodeLayer) {
let nds = allNodeLayer[key];
for (let i = 0; i < nds.length; i++) {
allNode.push(nds[i]);
}
}
allNodeLayer = null;
for (let i = 1; i < allNode.length; i++) {
let nd: TrieNode = allNode[i];
nd.Index = i;
let r = nd.Parent.Failure;
let c = nd.Char;
while (r != null && !r.m_values[c])
r = r.Failure;
if (r == null)
nd.Failure = root;
else {
nd.Failure = r.m_values[c];
for (let key2 in nd.Failure.Results) {
if (nd.Failure.Results.hasOwnProperty(key2) == false) {
continue;
}
let result = nd.Failure.Results[key2];
nd.SetResults(result);
}
}
}
root.Failure = root;
let allNode2 = [];
for (let i = 0; i < allNode.length; i++) {
allNode2.push(new TrieNode2());
}
for (let i = 0; i < allNode2.length; i++) {
let oldNode = allNode[i];
let newNode = allNode2[i];
for (let key in oldNode.m_values) {
if (oldNode.m_values.hasOwnProperty(key) == false) {
continue;
}
let index = oldNode.m_values[key].Index;
newNode.Add(key, allNode2[index]);
}
for (let index = 0; index < oldNode.Results.length; index++) {
let item = oldNode.Results[index];
newNode.SetResults(item);
}
oldNode = oldNode.Failure;
while (oldNode != root) {
for (let key in oldNode.m_values) {
if (oldNode.m_values.hasOwnProperty(key) == false) {
continue;
}
if (newNode.HasKey(key) == false) {
let index = oldNode.m_values[key].Index;
newNode.Add(key, allNode2[index]);
}
}
for (let index = 0; index < oldNode.Results.length; index++) {
let item = oldNode.Results[index];
newNode.SetResults(item);
}
oldNode = oldNode.Failure;
}
}
allNode = null;
root = null;
this._first = allNode2[0];
}
public FindAll(text) {
var ptr = null;
var list = [];
for (let i = 0; i < text.length; i++) {
var t = text.charCodeAt(i);
var tn = null;
if (ptr == null) {
tn = this._first.TryGetValue(t);
} else {
tn = ptr.TryGetValue(t);
if (!tn) {
tn = this._first.TryGetValue(t);
}
}
if (tn != null) {
if (tn.End) {
for (let j = 0; j < tn.Results.length; j++) {
var item = tn.Results[j];
var keyword = this._keywords[item];
list.push({
Keyword: keyword,
Success: true,
End: i,
Start: i + 1 - this._keywords[item].length,
Index: item,
});
}
}
}
ptr = tn;
}
return list;
}
}
//---------------------------
//-----------------------
var s2tSearch = null; // WordsSearch
var t2sSearch = null;// WordsSearch
var t2twSearch = null;// WordsSearch
var tw2tSearch = null;// WordsSearch
var t2hkSearch = null;// WordsSearch
var hk2tSearch = null;// WordsSearch
/**
*
* @param {any} text
* @param {any} type 012
*/
2024-09-18 16:58:59 +08:00
export function toTraditionalChinese(text: any, type: any) {
2024-07-01 21:36:47 +08:00
if (type == undefined) {
type = 0;
}
if (type > 2 || type < 0) {
throw "type 不支持该类型";
}
var s2t = GetWordsSearch(true, 0);
text = TransformationReplace(text, s2t);
if (type > 0) {
var t2 = GetWordsSearch(true, type);
text = TransformationReplace(text, t2);
}
return text;
}
/**
*
* @param {any} text
* @param {any} srcType 012
*/
2024-09-18 16:58:59 +08:00
export function toSimplifiedChinese(text: string, srcType: any) {
2024-07-01 21:36:47 +08:00
if (srcType == undefined) {
srcType = 0;
}
if (srcType > 2 || srcType < 0) {
throw "srcType 不支持该类型";
}
if (srcType > 0) {
var t2 = GetWordsSearch(false, srcType);
text = TransformationReplace(text, t2);
}
var s2t = GetWordsSearch(false, 0);
text = TransformationReplace(text, s2t);
return text;
}
function TransformationReplace(text: any, wordsSearch: any) {
var ts = wordsSearch.FindAll(text);
var sb = "";
var index = 0;
while (index < text.length) {
var t = null;
var max = -1;
for (var i = 0; i < ts.length; i++) {
var f = ts[i];
if (f.Start == index && f.End > max) {
max = f.End;
t = f;
}
}
if (t == null) {
sb += text[index];
index++;
} else {
sb += wordsSearch._others[t.Index]
index = t.End + 1;
}
}
return sb;
}
function GetWordsSearch(s2t: boolean, srcType: number) {
if (s2t) {
if (srcType === 0) {
if (s2tSearch == null) {
s2tSearch = BuildWordsSearch(_s2t_s, _s2t_t);
}
return s2tSearch;
} else if (srcType === 1) {
if (t2hkSearch == null) {
t2hkSearch = BuildWordsSearch(_t2hk_t, _t2hk_hk);
}
return t2hkSearch;
} else if (srcType == 2) {
if (t2twSearch == null) {
t2twSearch = BuildWordsSearch(_t2tw_t, _t2tw_tw);
}
return t2twSearch;
}
}
if (srcType == 0) {
if (t2sSearch == null) {
t2sSearch = BuildWordsSearch(_t2s_t, _t2s_s);
}
return t2sSearch;
} else if (srcType == 1) {
if (hk2tSearch == null) {
hk2tSearch = BuildWordsSearch(_t2hk_hk, _t2hk_t);
}
return hk2tSearch;
} else if (srcType == 2) {
if (tw2tSearch == null) {
tw2tSearch = BuildWordsSearch(_t2tw_tw, _t2tw_t);
}
return tw2tSearch;
}
return null;
}
function BuildWordsSearch(keywords: string[], toWords: any[]) {
var wordsSearch = new WordsSearch();
wordsSearch.SetKeywords(keywords);
wordsSearch._others = toWords;
return wordsSearch;
}