89 lines
		
	
	
		
			1.9 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
	
	
			
		
		
	
	
			89 lines
		
	
	
		
			1.9 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
	
	
| import { IndexInterface } from "../../type.js";
 | |
| import { regex, replace, collapse } from "../../lang.js";
 | |
| import { encode as encode_balance } from "./balance.js";
 | |
| 
 | |
| export const rtl = /* normalize: */
 | |
| /* collapse: */ /* normalize: */ /* collapse: */ /* normalize: */ /* collapse: */!1;
 | |
| export const tokenize = "";
 | |
| export default {
 | |
|     encode: encode,
 | |
|     rtl: !1,
 | |
|     tokenize: ""
 | |
| 
 | |
|     // Phonetic Normalization
 | |
| 
 | |
| };const regex_ae = regex("ae"),
 | |
| 
 | |
| //regex_ai = regex("ai"),
 | |
| //regex_ay = regex("ay"),
 | |
| //regex_ey = regex("ey"),
 | |
| regex_oe = regex("oe"),
 | |
|       //regex_ue = regex("ue"),
 | |
| //regex_ie = regex("ie"),
 | |
| //regex_sz = regex("sz"),
 | |
| //regex_zs = regex("zs"),
 | |
| //regex_ck = regex("ck"),
 | |
| //regex_cc = regex("cc"),
 | |
| regex_sh = regex("sh"),
 | |
|       regex_th = regex("th"),
 | |
| 
 | |
| //regex_dt = regex("dt"),
 | |
| regex_ph = regex("ph"),
 | |
|       regex_pf = regex("pf"),
 | |
|       pairs = [regex_ae, "a",
 | |
| // regex_ai, "ei",
 | |
| // regex_ay, "ei",
 | |
| // regex_ey, "ei",
 | |
| regex_oe, "o",
 | |
| // regex_ue, "u",
 | |
| // regex_ie, "i",
 | |
| // regex_sz, "s",
 | |
| // regex_zs, "s",
 | |
| regex_sh, "s",
 | |
| // regex_ck, "k",
 | |
| // regex_cc, "k",
 | |
| regex_th, "t",
 | |
| // regex_dt, "t",
 | |
| regex_ph, "f", regex_pf, "f",
 | |
| // regex_ou, "o",
 | |
| // regex_uo, "u"
 | |
| 
 | |
| // regex("(?![aeiouy])h(?![aeiouy])"), "",
 | |
| // regex("(?!^[aeiouy])h(?!^[aeiouy])"), ""
 | |
| regex("(?![aeo])h(?![aeo])"), "", regex("(?!^[aeo])h(?!^[aeo])"), ""];
 | |
| //regex_ou = regex("ou"),
 | |
| //regex_uo = regex("uo");
 | |
| 
 | |
| /**
 | |
|  * @param {string|number} str
 | |
|  * @param {boolean=} _skip_postprocessing
 | |
|  * @this IndexInterface
 | |
|  */
 | |
| 
 | |
| export function encode(str, _skip_postprocessing) {
 | |
| 
 | |
|     if (str) {
 | |
| 
 | |
|         str = encode_balance.call(this, str).join(" ");
 | |
| 
 | |
|         if (2 < str.length) {
 | |
| 
 | |
|             str = replace(str, pairs);
 | |
|         }
 | |
| 
 | |
|         if (!_skip_postprocessing) {
 | |
| 
 | |
|             if (1 < str.length) {
 | |
| 
 | |
|                 str = collapse(str);
 | |
|             }
 | |
| 
 | |
|             if (str) {
 | |
| 
 | |
|                 str = str.split(" ");
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return str || [];
 | |
| } |