UNPKG

wanakana

Version:

Utility library for converting between Kanji, Hiragana, Katakana, and Romaji

www.wanakana.com

WaniKani/WanaKana

1,527 lines (1,492 loc) • 63 kB

JavaScript

'use strict'; /** * Returns detailed type as string (instead of just 'object' for arrays etc) * @private * @param {any} value js value * @returns {String} type of value * @example * typeOf({}); // 'object' * typeOf([]); // 'array' * typeOf(function() {}); // 'function' * typeOf(/a/); // 'regexp' * typeOf(new Date()); // 'date' * typeOf(null); // 'null' * typeOf(undefined); // 'undefined' * typeOf('a'); // 'string' * typeOf(1); // 'number' * typeOf(true); // 'boolean' * typeOf(new Map()); // 'map' * typeOf(new Set()); // 'map' */ function typeOf(value) { if (value === null) { return 'null'; } if (value !== Object(value)) { return typeof value; } return {}.toString .call(value) .slice(8, -1) .toLowerCase(); } /** * Checks if input string is empty * @param {String} input text input * @return {Boolean} true if no input */ function isEmpty(input) { if (typeOf(input) !== 'string') { return true; } return !input.length; } /** * Takes a character and a unicode range. Returns true if the char is in the range. * @param {String} char unicode character * @param {Number} start unicode start range * @param {Number} end unicode end range * @return {Boolean} */ function isCharInRange(char = '', start, end) { if (isEmpty(char)) return false; const code = char.charCodeAt(0); return start <= code && code <= end; } const VERSION = '5.3.1'; const TO_KANA_METHODS = { HIRAGANA: 'toHiragana', KATAKANA: 'toKatakana', }; const ROMANIZATIONS = { HEPBURN: 'hepburn', }; /** * Default config for WanaKana, user passed options will be merged with these * @type {DefaultOptions} * @name DefaultOptions * @property {Boolean} [useObsoleteKana=false] - Set to true to use obsolete characters, such as ゐ and ゑ. * @example * toHiragana('we', { useObsoleteKana: true }) * // => 'ゑ' * @property {Boolean} [passRomaji=false] - Set to true to pass romaji when using mixed syllabaries with toKatakana() or toHiragana() * @example * toHiragana('only convert the katakana: ヒラガナ', { passRomaji: true }) * // => "only convert the katakana: ひらがな" * @property {Boolean} [convertLongVowelMark=true] - Set to false to prevent conversions of 'ー' to extended vowels with toHiragana() * @example * toHiragana('ラーメン', { convertLongVowelMark: false }); * // => 'らーめん * @property {Boolean} [upcaseKatakana=false] - Set to true to convert katakana to uppercase using toRomaji() * @example * toRomaji('ひらがなカタカナ', { upcaseKatakana: true }) * // => "hiragana KATAKANA" * @property {Boolean | 'toHiragana' | 'toKatakana'} [IMEMode=false] - Set to true, 'toHiragana', or 'toKatakana' to handle conversion while it is being typed. * @property {'hepburn'} [romanization='hepburn'] - choose toRomaji() romanization map (currently only 'hepburn') * @property {Object.<String, String>} [customKanaMapping] - custom map will be merged with default conversion * @example * toKana('wanakana', { customKanaMapping: { na: 'に', ka: 'Bana' }) }; * // => 'わにBanaに' * @property {Object.<String, String>} [customRomajiMapping] - custom map will be merged with default conversion * @example * toRomaji('つじぎり', { customRomajiMapping: { じ: 'zi', つ: 'tu', り: 'li' }) }; * // => 'tuzigili' */ const DEFAULT_OPTIONS = { useObsoleteKana: false, passRomaji: false, convertLongVowelMark: true, upcaseKatakana: false, IMEMode: false, romanization: ROMANIZATIONS.HEPBURN, }; const LATIN_UPPERCASE_START = 0x41; const LATIN_UPPERCASE_END = 0x5a; const LOWERCASE_ZENKAKU_START = 0xff41; const LOWERCASE_ZENKAKU_END = 0xff5a; const UPPERCASE_ZENKAKU_START = 0xff21; const UPPERCASE_ZENKAKU_END = 0xff3a; const HIRAGANA_START = 0x3041; const HIRAGANA_END = 0x3096; const KATAKANA_START = 0x30a1; const KATAKANA_END = 0x30fc; const KANJI_START = 0x4e00; const KANJI_END = 0x9faf; const KANJI_ITERATION_MARK = 0x3005; // 々 const PROLONGED_SOUND_MARK = 0x30fc; // ー const KANA_SLASH_DOT = 0x30fb; // ・ const ZENKAKU_NUMBERS = [0xff10, 0xff19]; const ZENKAKU_UPPERCASE = [UPPERCASE_ZENKAKU_START, UPPERCASE_ZENKAKU_END]; const ZENKAKU_LOWERCASE = [LOWERCASE_ZENKAKU_START, LOWERCASE_ZENKAKU_END]; const ZENKAKU_PUNCTUATION_1 = [0xff01, 0xff0f]; const ZENKAKU_PUNCTUATION_2 = [0xff1a, 0xff1f]; const ZENKAKU_PUNCTUATION_3 = [0xff3b, 0xff3f]; const ZENKAKU_PUNCTUATION_4 = [0xff5b, 0xff60]; const ZENKAKU_SYMBOLS_CURRENCY = [0xffe0, 0xffee]; const HIRAGANA_CHARS = [0x3040, 0x309f]; const KATAKANA_CHARS = [0x30a0, 0x30ff]; const HANKAKU_KATAKANA = [0xff66, 0xff9f]; const KATAKANA_PUNCTUATION = [0x30fb, 0x30fc]; const KANA_PUNCTUATION = [0xff61, 0xff65]; const CJK_SYMBOLS_PUNCTUATION = [0x3000, 0x303f]; const COMMON_CJK = [0x4e00, 0x9fff]; const RARE_CJK = [0x3400, 0x4dbf]; const KANA_RANGES = [ HIRAGANA_CHARS, KATAKANA_CHARS, KANA_PUNCTUATION, HANKAKU_KATAKANA, ]; const JA_PUNCTUATION_RANGES = [ CJK_SYMBOLS_PUNCTUATION, KANA_PUNCTUATION, KATAKANA_PUNCTUATION, ZENKAKU_PUNCTUATION_1, ZENKAKU_PUNCTUATION_2, ZENKAKU_PUNCTUATION_3, ZENKAKU_PUNCTUATION_4, ZENKAKU_SYMBOLS_CURRENCY, ]; // All Japanese unicode start and end ranges // Includes kanji, kana, zenkaku latin chars, punctuation, and number ranges. const JAPANESE_RANGES = [ ...KANA_RANGES, ...JA_PUNCTUATION_RANGES, ZENKAKU_UPPERCASE, ZENKAKU_LOWERCASE, ZENKAKU_NUMBERS, COMMON_CJK, RARE_CJK, ]; const MODERN_ENGLISH = [0x0000, 0x007f]; const HEPBURN_MACRON_RANGES = [ [0x0100, 0x0101], [0x0112, 0x0113], [0x012a, 0x012b], [0x014c, 0x014d], [0x016a, 0x016b], // Ū ū ]; const SMART_QUOTE_RANGES = [ [0x2018, 0x2019], [0x201c, 0x201d], // “ ” ]; const ROMAJI_RANGES = [MODERN_ENGLISH, ...HEPBURN_MACRON_RANGES]; const EN_PUNCTUATION_RANGES = [ [0x20, 0x2f], [0x3a, 0x3f], [0x5b, 0x60], [0x7b, 0x7e], ...SMART_QUOTE_RANGES, ]; /** * Tests a character. Returns true if the character is [Katakana](https://en.wikipedia.org/wiki/Katakana). * @param {String} char character string to test * @return {Boolean} */ function isCharJapanese(char = '') { return JAPANESE_RANGES.some(([start, end]) => isCharInRange(char, start, end)); } /** * Test if `input` only includes [Kanji](https://en.wikipedia.org/wiki/Kanji), [Kana](https://en.wikipedia.org/wiki/Kana), zenkaku numbers, and JA punctuation/symbols.” * @param {String} [input=''] text * @param {RegExp} [allowed] additional test allowed to pass for each char * @return {Boolean} true if passes checks * @example * isJapanese('泣き虫') * // => true * isJapanese('あア') * // => true * isJapanese('２月') // Zenkaku numbers allowed * // => true * isJapanese('泣き虫。！〜＄') // Zenkaku/JA punctuation * // => true * isJapanese('泣き虫.!~$') // Latin punctuation fails * // => false * isJapanese('A泣き虫') * // => false * isJapanese('≪偽括弧≫', /[≪≫]/); * // => true */ function isJapanese(input = '', allowed) { const augmented = typeOf(allowed) === 'regexp'; return isEmpty(input) ? false : [...input].every((char) => { const isJa = isCharJapanese(char); return !augmented ? isJa : isJa || allowed.test(char); }); } var safeIsNaN = Number.isNaN || function ponyfill(value) { return typeof value === 'number' && value !== value; }; function isEqual(first, second) { if (first === second) { return true; } if (safeIsNaN(first) && safeIsNaN(second)) { return true; } return false; } function areInputsEqual(newInputs, lastInputs) { if (newInputs.length !== lastInputs.length) { return false; } for (var i = 0; i < newInputs.length; i++) { if (!isEqual(newInputs[i], lastInputs[i])) { return false; } } return true; } function memoizeOne(resultFn, isEqual) { if (isEqual === void 0) { isEqual = areInputsEqual; } var cache = null; function memoized() { var newArgs = []; for (var _i = 0; _i < arguments.length; _i++) { newArgs[_i] = arguments[_i]; } if (cache && cache.lastThis === this && isEqual(newArgs, cache.lastArgs)) { return cache.lastResult; } var lastResult = resultFn.apply(this, newArgs); cache = { lastResult: lastResult, lastArgs: newArgs, lastThis: this, }; return lastResult; } memoized.clear = function clear() { cache = null; }; return memoized; } var has = Object.prototype.hasOwnProperty; function find(iter, tar, key) { for (key of iter.keys()) { if (dequal(key, tar)) return key; } } function dequal(foo, bar) { var ctor, len, tmp; if (foo === bar) return true; if (foo && bar && (ctor = foo.constructor) === bar.constructor) { if (ctor === Date) return foo.getTime() === bar.getTime(); if (ctor === RegExp) return foo.toString() === bar.toString(); if (ctor === Array) { if ((len = foo.length) === bar.length) { while (len-- && dequal(foo[len], bar[len])) ; } return len === -1; } if (ctor === Set) { if (foo.size !== bar.size) { return false; } for (len of foo) { tmp = len; if (tmp && typeof tmp === 'object') { tmp = find(bar, tmp); if (!tmp) return false; } if (!bar.has(tmp)) return false; } return true; } if (ctor === Map) { if (foo.size !== bar.size) { return false; } for (len of foo) { tmp = len[0]; if (tmp && typeof tmp === 'object') { tmp = find(bar, tmp); if (!tmp) return false; } if (!dequal(len[1], bar.get(tmp))) { return false; } } return true; } if (ctor === ArrayBuffer) { foo = new Uint8Array(foo); bar = new Uint8Array(bar); } else if (ctor === DataView) { if ((len = foo.byteLength) === bar.byteLength) { while (len-- && foo.getInt8(len) === bar.getInt8(len)) ; } return len === -1; } if (ArrayBuffer.isView(foo)) { if ((len = foo.byteLength) === bar.byteLength) { while (len-- && foo[len] === bar[len]) ; } return len === -1; } if (!ctor || typeof foo === 'object') { len = 0; for (ctor in foo) { if (has.call(foo, ctor) && ++len && !has.call(bar, ctor)) return false; if (!(ctor in bar) || !dequal(foo[ctor], bar[ctor])) return false; } return Object.keys(bar).length === len; } } return foo !== foo && bar !== bar; } /** * Easy re-use of merging with default options * @param {Object} opts user options * @returns user options merged over default options */ const mergeWithDefaultOptions = (opts = {}) => Object.assign({}, DEFAULT_OPTIONS, opts); function applyMapping(string, mapping, convertEnding) { const root = mapping; function nextSubtree(tree, nextChar) { const subtree = tree[nextChar]; if (subtree === undefined) { return undefined; } // if the next child node does not have a node value, set its node value to the input return Object.assign({ '': tree[''] + nextChar }, tree[nextChar]); } function newChunk(remaining, currentCursor) { // start parsing a new chunk const firstChar = remaining.charAt(0); return parse(Object.assign({ '': firstChar }, root[firstChar]), remaining.slice(1), currentCursor, currentCursor + 1); } function parse(tree, remaining, lastCursor, currentCursor) { if (!remaining) { if (convertEnding || Object.keys(tree).length === 1) { // nothing more to consume, just commit the last chunk and return it // so as to not have an empty element at the end of the result return tree[''] ? [[lastCursor, currentCursor, tree['']]] : []; } // if we don't want to convert the ending, because there are still possible continuations // return null as the final node value return [[lastCursor, currentCursor, null]]; } if (Object.keys(tree).length === 1) { return [[lastCursor, currentCursor, tree['']]].concat(newChunk(remaining, currentCursor)); } const subtree = nextSubtree(tree, remaining.charAt(0)); if (subtree === undefined) { return [[lastCursor, currentCursor, tree['']]].concat(newChunk(remaining, currentCursor)); } // continue current branch return parse(subtree, remaining.slice(1), lastCursor, currentCursor + 1); } return newChunk(string, 0); } // transform the tree, so that for example hepburnTree['ゔ']['ぁ'][''] === 'va' // or kanaTree['k']['y']['a'][''] === 'きゃ' function transform(tree) { return Object.entries(tree).reduce((map, [char, subtree]) => { const endOfBranch = typeOf(subtree) === 'string'; // eslint-disable-next-line no-param-reassign map[char] = endOfBranch ? { '': subtree } : transform(subtree); return map; }, {}); } function getSubTreeOf(tree, string) { return string.split('').reduce((correctSubTree, char) => { if (correctSubTree[char] === undefined) { // eslint-disable-next-line no-param-reassign correctSubTree[char] = {}; } return correctSubTree[char]; }, tree); } /** * Creates a custom mapping tree, returns a function that accepts a defaultMap which the newly created customMapping will be merged with and returned * (customMap) => (defaultMap) => mergedMap * @param {Object} customMap { 'ka' : 'な' } * @return {Function} (defaultMap) => defaultMergedWithCustomMap * @example * const sillyMap = createCustomMapping({ 'ちゃ': 'time', '茎': 'cookie'　}); * // sillyMap is passed defaultMapping to merge with when called in toRomaji() * toRomaji("It's 茎ちゃよ", { customRomajiMapping: sillyMap }); * // => 'It's cookie time yo'; */ function createCustomMapping(customMap = {}) { const customTree = {}; if (typeOf(customMap) === 'object') { Object.entries(customMap).forEach(([roma, kana]) => { let subTree = customTree; roma.split('').forEach((char) => { if (subTree[char] === undefined) { subTree[char] = {}; } subTree = subTree[char]; }); subTree[''] = kana; }); } return function makeMap(map) { const mapCopy = JSON.parse(JSON.stringify(map)); function transformMap(mapSubtree, customSubtree) { if (mapSubtree === undefined || typeOf(mapSubtree) === 'string') { return customSubtree; } return Object.entries(customSubtree).reduce((newSubtree, [char, subtree]) => { // eslint-disable-next-line no-param-reassign newSubtree[char] = transformMap(mapSubtree[char], subtree); return newSubtree; }, mapSubtree); } return transformMap(mapCopy, customTree); }; } // allow consumer to pass either function or object as customMapping function mergeCustomMapping(map, customMapping) { if (!customMapping) { return map; } return typeOf(customMapping) === 'function' ? customMapping(map) : createCustomMapping(customMapping)(map); } // NOTE: not exactly kunrei shiki, for example ぢゃ -> dya instead of zya, to avoid name clashing /* eslint-disable */ // prettier-ignore const BASIC_KUNREI = { a: 'あ', i: 'い', u: 'う', e: 'え', o: 'お', k: { a: 'か', i: 'き', u: 'く', e: 'け', o: 'こ', }, s: { a: 'さ', i: 'し', u: 'す', e: 'せ', o: 'そ', }, t: { a: 'た', i: 'ち', u: 'つ', e: 'て', o: 'と', }, n: { a: 'な', i: 'に', u: 'ぬ', e: 'ね', o: 'の', }, h: { a: 'は', i: 'ひ', u: 'ふ', e: 'へ', o: 'ほ', }, m: { a: 'ま', i: 'み', u: 'む', e: 'め', o: 'も', }, y: { a: 'や', u: 'ゆ', o: 'よ' }, r: { a: 'ら', i: 'り', u: 'る', e: 'れ', o: 'ろ', }, w: { a: 'わ', i: 'ゐ', e: 'ゑ', o: 'を', }, g: { a: 'が', i: 'ぎ', u: 'ぐ', e: 'げ', o: 'ご', }, z: { a: 'ざ', i: 'じ', u: 'ず', e: 'ぜ', o: 'ぞ', }, d: { a: 'だ', i: 'ぢ', u: 'づ', e: 'で', o: 'ど', }, b: { a: 'ば', i: 'び', u: 'ぶ', e: 'べ', o: 'ぼ', }, p: { a: 'ぱ', i: 'ぴ', u: 'ぷ', e: 'ぺ', o: 'ぽ', }, v: { a: 'ゔぁ', i: 'ゔぃ', u: 'ゔ', e: 'ゔぇ', o: 'ゔぉ', }, }; const SPECIAL_SYMBOLS$1 = { '.': '。', ',': '、', ':': '：', '/': '・', '!': '！', '?': '？', '~': '〜', '-': 'ー', '‘': '「', '’': '」', '“': '『', '”': '』', '[': '［', ']': '］', '(': '（', ')': '）', '{': '｛', '}': '｝', }; const CONSONANTS = { k: 'き', s: 'し', t: 'ち', n: 'に', h: 'ひ', m: 'み', r: 'り', g: 'ぎ', z: 'じ', d: 'ぢ', b: 'び', p: 'ぴ', v: 'ゔ', q: 'く', f: 'ふ', }; const SMALL_Y$1 = { ya: 'ゃ', yi: 'ぃ', yu: 'ゅ', ye: 'ぇ', yo: 'ょ' }; const SMALL_VOWELS = { a: 'ぁ', i: 'ぃ', u: 'ぅ', e: 'ぇ', o: 'ぉ' }; // typing one should be the same as having typed the other instead const ALIASES = { sh: 'sy', ch: 'ty', cy: 'ty', chy: 'ty', shy: 'sy', j: 'zy', jy: 'zy', // exceptions to above rules shi: 'si', chi: 'ti', tsu: 'tu', ji: 'zi', fu: 'hu', }; // xtu -> っ const SMALL_LETTERS = Object.assign({ tu: 'っ', wa: 'ゎ', ka: 'ヵ', ke: 'ヶ', }, SMALL_VOWELS, SMALL_Y$1); // don't follow any notable patterns const SPECIAL_CASES = { yi: 'い', wu: 'う', ye: 'いぇ', wi: 'うぃ', we: 'うぇ', kwa: 'くぁ', whu: 'う', // because it's not thya for てゃ but tha // and tha is not てぁ, but てゃ tha: 'てゃ', thu: 'てゅ', tho: 'てょ', dha: 'でゃ', dhu: 'でゅ', dho: 'でょ', }; const AIUEO_CONSTRUCTIONS = { wh: 'う', kw: 'く', qw: 'く', q: 'く', gw: 'ぐ', sw: 'す', ts: 'つ', th: 'て', tw: 'と', dh: 'で', dw: 'ど', fw: 'ふ', f: 'ふ', }; /* eslint-enable */ function createRomajiToKanaMap$1() { const kanaTree = transform(BASIC_KUNREI); // pseudo partial application const subtreeOf = (string) => getSubTreeOf(kanaTree, string); // add tya, sya, etc. Object.entries(CONSONANTS).forEach(([consonant, yKana]) => { Object.entries(SMALL_Y$1).forEach(([roma, kana]) => { // for example kyo -> き + ょ subtreeOf(consonant + roma)[''] = yKana + kana; }); }); Object.entries(SPECIAL_SYMBOLS$1).forEach(([symbol, jsymbol]) => { subtreeOf(symbol)[''] = jsymbol; }); // things like うぃ, くぃ, etc. Object.entries(AIUEO_CONSTRUCTIONS).forEach(([consonant, aiueoKana]) => { Object.entries(SMALL_VOWELS).forEach(([vowel, kana]) => { const subtree = subtreeOf(consonant + vowel); subtree[''] = aiueoKana + kana; }); }); // different ways to write ん ['n', "n'", 'xn'].forEach((nChar) => { subtreeOf(nChar)[''] = 'ん'; }); // c is equivalent to k, but not for chi, cha, etc. that's why we have to make a copy of k kanaTree.c = JSON.parse(JSON.stringify(kanaTree.k)); Object.entries(ALIASES).forEach(([string, alternative]) => { const allExceptLast = string.slice(0, string.length - 1); const last = string.charAt(string.length - 1); const parentTree = subtreeOf(allExceptLast); // copy to avoid recursive containment parentTree[last] = JSON.parse(JSON.stringify(subtreeOf(alternative))); }); function getAlternatives(string) { return [...Object.entries(ALIASES), ...[['c', 'k']]].reduce((list, [alt, roma]) => (string.startsWith(roma) ? list.concat(string.replace(roma, alt)) : list), []); } Object.entries(SMALL_LETTERS).forEach(([kunreiRoma, kana]) => { const last = (char) => char.charAt(char.length - 1); const allExceptLast = (chars) => chars.slice(0, chars.length - 1); const xRoma = `x${kunreiRoma}`; const xSubtree = subtreeOf(xRoma); xSubtree[''] = kana; // ltu -> xtu -> っ const parentTree = subtreeOf(`l${allExceptLast(kunreiRoma)}`); parentTree[last(kunreiRoma)] = xSubtree; // ltsu -> ltu -> っ getAlternatives(kunreiRoma).forEach((altRoma) => { ['l', 'x'].forEach((prefix) => { const altParentTree = subtreeOf(prefix + allExceptLast(altRoma)); altParentTree[last(altRoma)] = subtreeOf(prefix + kunreiRoma); }); }); }); Object.entries(SPECIAL_CASES).forEach(([string, kana]) => { subtreeOf(string)[''] = kana; }); // add kka, tta, etc. function addTsu(tree) { return Object.entries(tree).reduce((tsuTree, [key, value]) => { if (!key) { // we have reached the bottom of this branch // eslint-disable-next-line no-param-reassign tsuTree[key] = `っ${value}`; } else { // more subtrees // eslint-disable-next-line no-param-reassign tsuTree[key] = addTsu(value); } return tsuTree; }, {}); } // have to explicitly name c here, because we made it a copy of k, not a reference [...Object.keys(CONSONANTS), 'c', 'y', 'w', 'j'].forEach((consonant) => { const subtree = kanaTree[consonant]; subtree[consonant] = addTsu(subtree); }); // nn should not be っん delete kanaTree.n.n; // solidify the results, so that there there is referential transparency within the tree return Object.freeze(JSON.parse(JSON.stringify(kanaTree))); } let romajiToKanaMap = null; function getRomajiToKanaTree() { if (romajiToKanaMap == null) { romajiToKanaMap = createRomajiToKanaMap$1(); } return romajiToKanaMap; } const USE_OBSOLETE_KANA_MAP = createCustomMapping({ wi: 'ゐ', we: 'ゑ', }); function IME_MODE_MAP(map) { // in IME mode, we do not want to convert single ns const mapCopy = JSON.parse(JSON.stringify(map)); mapCopy.n.n = { '': 'ん' }; mapCopy.n[' '] = { '': 'ん' }; return mapCopy; } /** * Tests if char is in English unicode uppercase range * @param {String} char * @return {Boolean} */ function isCharUpperCase(char = '') { if (isEmpty(char)) return false; return isCharInRange(char, LATIN_UPPERCASE_START, LATIN_UPPERCASE_END); } /** * Returns true if char is 'ー' * @param {String} char to test * @return {Boolean} */ function isCharLongDash(char = '') { if (isEmpty(char)) return false; return char.charCodeAt(0) === PROLONGED_SOUND_MARK; } /** * Tests if char is '・' * @param {String} char * @return {Boolean} true if '・' */ function isCharSlashDot(char = '') { if (isEmpty(char)) return false; return char.charCodeAt(0) === KANA_SLASH_DOT; } /** * Tests a character. Returns true if the character is [Hiragana](https://en.wikipedia.org/wiki/Hiragana). * @param {String} char character string to test * @return {Boolean} */ function isCharHiragana(char = '') { if (isEmpty(char)) return false; if (isCharLongDash(char)) return true; return isCharInRange(char, HIRAGANA_START, HIRAGANA_END); } /** * Convert [Hiragana](https://en.wikipedia.org/wiki/Hiragana) to [Katakana](https://en.wikipedia.org/wiki/Katakana) * Passes through any non-hiragana chars * @private * @param {String} [input=''] text input * @return {String} converted text * @example * hiraganaToKatakana('ひらがな') * // => "ヒラガナ" * hiraganaToKatakana('ひらがな is a type of kana') * // => "ヒラガナ is a type of kana" */ function hiraganaToKatakana(input = '') { const kata = []; input.split('').forEach((char) => { // Short circuit to avoid incorrect codeshift for 'ー' and '・' if (isCharLongDash(char) || isCharSlashDot(char)) { kata.push(char); } else if (isCharHiragana(char)) { // Shift charcode. const code = char.charCodeAt(0) + (KATAKANA_START - HIRAGANA_START); const kataChar = String.fromCharCode(code); kata.push(kataChar); } else { // Pass non-hiragana chars through kata.push(char); } }); return kata.join(''); } // memoize and deeply compare args so we only recreate when necessary const createRomajiToKanaMap = memoizeOne((IMEMode, useObsoleteKana, customKanaMapping) => { let map = getRomajiToKanaTree(); map = IMEMode ? IME_MODE_MAP(map) : map; map = useObsoleteKana ? USE_OBSOLETE_KANA_MAP(map) : map; if (customKanaMapping) { map = mergeCustomMapping(map, customKanaMapping); } return map; }, dequal); /** * Convert [Romaji](https://en.wikipedia.org/wiki/Romaji) to [Kana](https://en.wikipedia.org/wiki/Kana), lowercase text will result in [Hiragana](https://en.wikipedia.org/wiki/Hiragana) and uppercase text will result in [Katakana](https://en.wikipedia.org/wiki/Katakana). * @param {String} [input=''] text * @param {DefaultOptions} [options=defaultOptions] * @param {Object.<string, string>} [map] custom mapping * @return {String} converted text * @example * toKana('onaji BUTTSUUJI') * // => 'おなじブッツウジ' * toKana('ONAJI buttsuuji') * // => 'オナジぶっつうじ' * toKana('座禅‘zazen’スタイル') * // => '座禅「ざぜん」スタイル' * toKana('batsuge-mu') * // => 'ばつげーむ' * toKana('!?.:/,~-‘’“”[](){}') // Punctuation conversion * // => '！？。：・、〜ー「」『』［］（）｛｝' * toKana('we', { useObsoleteKana: true }) * // => 'ゑ' * toKana('wanakana', { customKanaMapping: { na: 'に', ka: 'bana' } }); * // => 'わにbanaに' */ function toKana(input = '', options = {}, map) { let config; if (!map) { config = mergeWithDefaultOptions(options); map = createRomajiToKanaMap(config.IMEMode, config.useObsoleteKana, config.customKanaMapping); } else { config = options; } // throw away the substring index information and just concatenate all the kana return splitIntoConvertedKana(input, config, map) .map((kanaToken) => { const [start, end, kana] = kanaToken; if (kana === null) { // haven't converted the end of the string, since we are in IME mode return input.slice(start); } const enforceHiragana = config.IMEMode === TO_KANA_METHODS.HIRAGANA; const enforceKatakana = config.IMEMode === TO_KANA_METHODS.KATAKANA || [...input.slice(start, end)].every(isCharUpperCase); return enforceHiragana || !enforceKatakana ? kana : hiraganaToKatakana(kana); }) .join(''); } /** * * @private * @param {String} [input=''] input text * @param {DefaultOptions} [options=defaultOptions] toKana options * @param {Object} [map] custom mapping * @returns {Array[]} [[start, end, token]] * @example * splitIntoConvertedKana('buttsuuji') * // => [[0, 2, 'ぶ'], [2, 6, 'っつ'], [6, 7, 'う'], [7, 9, 'じ']] */ function splitIntoConvertedKana(input = '', options = {}, map) { const { IMEMode, useObsoleteKana, customKanaMapping } = options; if (!map) { map = createRomajiToKanaMap(IMEMode, useObsoleteKana, customKanaMapping); } return applyMapping(input.toLowerCase(), map, !IMEMode); } let LISTENERS = []; /** * Automagically replaces input values with converted text to kana * @param {defaultOptions} [options] user config overrides, default conversion is toKana() * @return {Function} event handler with bound options * @private */ function makeOnInput(options) { let prevInput; // Enforce IMEMode if not already specified const mergedConfig = Object.assign({}, mergeWithDefaultOptions(options), { IMEMode: options.IMEMode || true, }); const preConfiguredMap = createRomajiToKanaMap(mergedConfig.IMEMode, mergedConfig.useObsoleteKana, mergedConfig.customKanaMapping); const triggers = [ ...Object.keys(preConfiguredMap), ...Object.keys(preConfiguredMap).map((char) => char.toUpperCase()), ]; return function onInput({ target }) { if (target.value !== prevInput && target.dataset.ignoreComposition !== 'true') { convertInput(target, mergedConfig, preConfiguredMap, triggers); } }; } function convertInput(target, options, map, triggers, prevInput) { const [head, textToConvert, tail] = splitInput(target.value, target.selectionEnd, triggers); const convertedText = toKana(textToConvert, options, map); const changed = textToConvert !== convertedText; if (changed) { const newCursor = head.length + convertedText.length; const newValue = head + convertedText + tail; // eslint-disable-next-line no-param-reassign target.value = newValue; if (tail.length) { // push later on event loop (otherwise mid-text insertion can be 1 char too far to the right) setTimeout(() => target.setSelectionRange(newCursor, newCursor), 1); } else { target.setSelectionRange(newCursor, newCursor); } } else { // eslint-disable-next-line no-param-reassign target.value; } } function onComposition({ type, target, data }) { // navigator.platform is not 100% reliable for singling out all OS, // but for determining desktop "Mac OS" it is effective enough. const isMacOS = /Mac/.test(window.navigator && window.navigator.platform); // We don't want to ignore on Android: // https://github.com/WaniKani/WanaKana/issues/82 // But MacOS IME auto-closes if we don't ignore: // https://github.com/WaniKani/WanaKana/issues/71 // Other platform Japanese IMEs pass through happily if (isMacOS) { if (type === 'compositionupdate' && isJapanese(data)) { // eslint-disable-next-line no-param-reassign target.dataset.ignoreComposition = 'true'; } if (type === 'compositionend') { // eslint-disable-next-line no-param-reassign target.dataset.ignoreComposition = 'false'; } } } function trackListeners(id, inputHandler, compositionHandler) { LISTENERS = LISTENERS.concat({ id, inputHandler, compositionHandler, }); } function untrackListeners({ id: targetId }) { LISTENERS = LISTENERS.filter(({ id }) => id !== targetId); } function findListeners(el) { return (el && LISTENERS.find(({ id }) => id === el.getAttribute('data-wanakana-id'))); } // Handle non-terminal inserted input conversion: // | -> わ| -> わび| -> わ|び -> わs|び -> わsh|び -> わshi|び -> わし|び // or multiple ambiguous positioning (to select which "s" to work from) // こsこs|こsこ -> こsこso|こsこ -> こsこそ|こsこ function splitInput(text = '', cursor = 0, triggers = []) { let head; let toConvert; let tail; if (cursor === 0 && triggers.includes(text[0])) { [head, toConvert, tail] = workFromStart(text, triggers); } else if (cursor > 0) { [head, toConvert, tail] = workBackwards(text, cursor); } else { [head, toConvert] = takeWhileAndSlice(text, (char) => !triggers.includes(char)); [toConvert, tail] = takeWhileAndSlice(toConvert, (char) => !isJapanese(char)); } return [head, toConvert, tail]; } function workFromStart(text, catalystChars) { return [ '', ...takeWhileAndSlice(text, (char) => catalystChars.includes(char) || !isJapanese(char, /[0-9]/)), ]; } function workBackwards(text = '', startIndex = 0) { const [toConvert, head] = takeWhileAndSlice([...text.slice(0, startIndex)].reverse(), (char) => !isJapanese(char)); return [ head.reverse().join(''), toConvert .split('') .reverse() .join(''), text.slice(startIndex), ]; } function takeWhileAndSlice(source = {}, predicate = (x) => !!x) { const result = []; const { length } = source; let i = 0; while (i < length && predicate(source[i], i)) { result.push(source[i]); i += 1; } return [result.join(''), source.slice(i)]; } /* eslint-disable no-console */ const onInput = ({ target: { value, selectionStart, selectionEnd } }) => console.log('input:', { value, selectionStart, selectionEnd }); const onCompositionStart = () => console.log('compositionstart'); const onCompositionUpdate = ({ target: { value, selectionStart, selectionEnd }, data, }) => console.log('compositionupdate', { data, value, selectionStart, selectionEnd, }); const onCompositionEnd = () => console.log('compositionend'); const events = { input: onInput, compositionstart: onCompositionStart, compositionupdate: onCompositionUpdate, compositionend: onCompositionEnd, }; const addDebugListeners = (input) => { Object.entries(events).forEach(([event, handler]) => input.addEventListener(event, handler)); }; const removeDebugListeners = (input) => { Object.entries(events).forEach(([event, handler]) => input.removeEventListener(event, handler)); }; const ELEMENTS = ['TEXTAREA', 'INPUT']; let idCounter = 0; const newId = () => { idCounter += 1; return `${Date.now()}${idCounter}`; }; /** * Binds eventListener for 'input' events to an input field to automagically replace values with kana * Can pass `{ IMEMode: 'toHiragana' || 'toKatakana' }` to enforce kana conversion type * @param {HTMLInputElement | HTMLTextAreaElement} element textarea, input[type="text"] etc * @param {DefaultOptions} [options=defaultOptions] defaults to { IMEMode: true } using `toKana` * @example * bind(document.querySelector('#myInput')); */ function bind(element = {}, options = {}, debug = false) { if (!ELEMENTS.includes(element.nodeName)) { throw new Error(`Element provided to Wanakana bind() was not a valid input or textarea element.\n Received: (${JSON.stringify(element)})`); } if (element.hasAttribute('data-wanakana-id')) { return; } const onInput = makeOnInput(options); const id = newId(); const attributes = [ { name: 'data-wanakana-id', value: id }, { name: 'lang', value: 'ja' }, { name: 'autoCapitalize', value: 'none' }, { name: 'autoCorrect', value: 'off' }, { name: 'autoComplete', value: 'off' }, { name: 'spellCheck', value: 'false' }, ]; const previousAttributes = {}; attributes.forEach((attribute) => { previousAttributes[attribute.name] = element.getAttribute(attribute.name); element.setAttribute(attribute.name, attribute.value); }); element.dataset.previousAttributes = JSON.stringify(previousAttributes); element.addEventListener('input', onInput); element.addEventListener('compositionupdate', onComposition); element.addEventListener('compositionend', onComposition); trackListeners(id, onInput, onComposition); if (debug === true) { addDebugListeners(element); } } /** * Unbinds eventListener from input field * @param {HTMLInputElement | HTMLTextAreaElement} element textarea, input */ function unbind(element, debug = false) { const listeners = findListeners(element); if (listeners == null) { throw new Error(`Element provided to Wanakana unbind() had no listener registered.\n Received: ${JSON.stringify(element)}`); } const { inputHandler, compositionHandler } = listeners; const attributes = JSON.parse(element.dataset.previousAttributes); Object.keys(attributes).forEach((key) => { if (attributes[key]) { element.setAttribute(key, attributes[key]); } else { element.removeAttribute(key); } }); element.removeAttribute('data-previous-attributes'); element.removeAttribute('data-ignore-composition'); element.removeEventListener('input', inputHandler); element.removeEventListener('compositionstart', compositionHandler); element.removeEventListener('compositionupdate', compositionHandler); element.removeEventListener('compositionend', compositionHandler); untrackListeners(listeners); if (debug === true) { removeDebugListeners(element); } } /** * Tests a character. Returns true if the character is [Romaji](https://en.wikipedia.org/wiki/Romaji) (allowing [Hepburn romanisation](https://en.wikipedia.org/wiki/Hepburn_romanization)) * @param {String} char character string to test * @return {Boolean} */ function isCharRomaji(char = '') { if (isEmpty(char)) return false; return ROMAJI_RANGES.some(([start, end]) => isCharInRange(char, start, end)); } /** * Test if `input` is [Romaji](https://en.wikipedia.org/wiki/Romaji) (allowing [Hepburn romanisation](https://en.wikipedia.org/wiki/Hepburn_romanization)) * @param {String} [input=''] text * @param {RegExp} [allowed] additional test allowed to pass for each char * @return {Boolean} true if [Romaji](https://en.wikipedia.org/wiki/Romaji) * @example * isRomaji('Tōkyō and Ōsaka') * // => true * isRomaji('12a*b&c-d') * // => true * isRomaji('あアA') * // => false * isRomaji('お願い') * // => false * isRomaji('a！b&cーd') // Zenkaku punctuation fails * // => false * isRomaji('a！b&cーd', /[！ー]/) * // => true */ function isRomaji(input = '', allowed) { const augmented = typeOf(allowed) === 'regexp'; return isEmpty(input) ? false : [...input].every((char) => { const isRoma = isCharRomaji(char); return !augmented ? isRoma : isRoma || allowed.test(char); }); } /** * Tests a character. Returns true if the character is [Katakana](https://en.wikipedia.org/wiki/Katakana). * @param {String} char character string to test * @return {Boolean} */ function isCharKatakana(char = '') { return isCharInRange(char, KATAKANA_START, KATAKANA_END); } /** * Tests a character. Returns true if the character is [Hiragana](https://en.wikipedia.org/wiki/Hiragana) or [Katakana](https://en.wikipedia.org/wiki/Katakana). * @param {String} char character string to test * @return {Boolean} */ function isCharKana(char = '') { if (isEmpty(char)) return false; return isCharHiragana(char) || isCharKatakana(char); } /** * Test if `input` is [Kana](https://en.wikipedia.org/wiki/Kana) ([Katakana](https://en.wikipedia.org/wiki/Katakana) and/or [Hiragana](https://en.wikipedia.org/wiki/Hiragana)) * @param {String} [input=''] text * @return {Boolean} true if all [Kana](https://en.wikipedia.org/wiki/Kana) * @example * isKana('あ') * // => true * isKana('ア') * // => true * isKana('あーア') * // => true * isKana('A') * // => false * isKana('あAア') * // => false */ function isKana(input = '') { if (isEmpty(input)) return false; return [...input].every(isCharKana); } /** * Test if `input` is [Hiragana](https://en.wikipedia.org/wiki/Hiragana) * @param {String} [input=''] text * @return {Boolean} true if all [Hiragana](https://en.wikipedia.org/wiki/Hiragana) * @example * isHiragana('げーむ') * // => true * isHiragana('A') * // => false * isHiragana('あア') * // => false */ function isHiragana(input = '') { if (isEmpty(input)) return false; return [...input].every(isCharHiragana); } /** * Test if `input` is [Katakana](https://en.wikipedia.org/wiki/Katakana) * @param {String} [input=''] text * @return {Boolean} true if all [Katakana](https://en.wikipedia.org/wiki/Katakana) * @example * isKatakana('ゲーム') * // => true * isKatakana('あ') * // => false * isKatakana('A') * // => false * isKatakana('あア') * // => false */ function isKatakana(input = '') { if (isEmpty(input)) return false; return [...input].every(isCharKatakana); } /** * Returns true if char is '々' * @param {String} char to test * @return {Boolean} */ function isCharIterationMark(char = '') { if (isEmpty(char)) return false; return char.charCodeAt(0) === KANJI_ITERATION_MARK; } /** * Tests a character. Returns true if the character is a CJK ideograph (kanji). * @param {String} char character string to test * @return {Boolean} */ function isCharKanji(char = '') { return isCharInRange(char, KANJI_START, KANJI_END) || isCharIterationMark(char); } /** * Tests if `input` is [Kanji](https://en.wikipedia.org/wiki/Kanji) ([Japanese CJK ideographs](https://en.wikipedia.org/wiki/CJK_Unified_Ideographs)) * @param {String} [input=''] text * @return {Boolean} true if all [Kanji](https://en.wikipedia.org/wiki/Kanji) * @example * isKanji('刀') * // => true * isKanji('切腹') * // => true * isKanji('勢い') * // => false * isKanji('あAア') * // => false * isKanji('🐸') * // => false */ function isKanji(input = '') { if (isEmpty(input)) return false; return [...input].every(isCharKanji); } /** * Test if `input` contains a mix of [Romaji](https://en.wikipedia.org/wiki/Romaji) *and* [Kana](https://en.wikipedia.org/wiki/Kana), defaults to pass through [Kanji](https://en.wikipedia.org/wiki/Kanji) * @param {String} input text * @param {{ passKanji: Boolean}} [options={ passKanji: true }] optional config to pass through kanji * @return {Boolean} true if mixed * @example * isMixed('Abあア')) * // => true * isMixed('お腹A')) // ignores kanji by default * // => true * isMixed('お腹A', { passKanji: false })) * // => false * isMixed('ab')) * // => false * isMixed('あア')) * // => false */ function isMixed(input = '', options = { passKanji: true }) { const chars = [...input]; let hasKanji = false; if (!options.passKanji) { hasKanji = chars.some(isKanji); } return (chars.some(isHiragana) || chars.some(isKatakana)) && chars.some(isRomaji) && !hasKanji; } const isCharInitialLongDash = (char, index) => isCharLongDash(char) && index < 1; const isCharInnerLongDash = (char, index) => isCharLongDash(char) && index > 0; const isKanaAsSymbol = (char) => ['ヶ', 'ヵ'].includes(char); const LONG_VOWELS = { a: 'あ', i: 'い', u: 'う', e: 'え', o: 'う', }; // inject toRomaji to avoid circular dependency between toRomaji <-> katakanaToHiragana function katakanaToHiragana(input = '', toRomaji, { isDestinationRomaji, convertLongVowelMark } = {}) { let previousKana = ''; return input .split('') .reduce((hira, char, index) => { // Short circuit to avoid incorrect codeshift for 'ー' and '・' if (isCharSlashDot(char) || isCharInitialLongDash(char, index) || isKanaAsSymbol(char)) { return hira.concat(char); } // Transform long vowels: 'オー' to 'おう' if (convertLongVowelMark && previousKana && isCharInnerLongDash(char, index)) { // Transform previousKana back to romaji, and slice off the vowel const romaji = toRomaji(previousKana).slice(-1); // However, ensure 'オー' => 'おお' => 'oo' if this is a transform on the way to romaji if (isCharKatakana(input[index - 1]) && romaji === 'o' && isDestinationRomaji) { return hira.concat('お'); } return hira.concat(LONG_VOWELS[romaji]); // Transform all other chars } if (!isCharLongDash(char) && isCharKatakana(char)) { const code = char.charCodeAt(0) + (HIRAGANA_START - KATAKANA_START); const hiraChar = String.fromCharCode(code); previousKana = hiraChar; return hira.concat(hiraChar); } // Pass non katakana chars through previousKana = ''; return hira.concat(char); }, []) .join(''); } let kanaToHepburnMap = null; /* eslint-disable */ // prettier-ignore const BASIC_ROMAJI = { あ: 'a', い: 'i', う: 'u', え: 'e', お: 'o', か: 'ka', き: 'ki', く: 'ku', け: 'ke', こ: 'ko', さ: 'sa', し: 'shi', す: 'su', せ: 'se', そ: 'so', た: 'ta', ち: 'chi', つ: 'tsu', て: 'te', と: 'to', な: 'na', に: 'ni', ぬ: 'nu', ね: 'ne', の: 'no', は: 'ha', ひ: 'hi', ふ: 'fu', へ: 'he', ほ: 'ho', ま: 'ma', み: 'mi', む: 'mu', め: 'me', も: 'mo', ら: 'ra', り: 'ri', る: 'ru', れ: 're', ろ: 'ro', や: 'ya', ゆ: 'yu', よ: 'yo', わ: 'wa', ゐ: 'wi', ゑ: 'we', を: 'wo', ん: 'n', が: 'ga', ぎ: 'gi', ぐ: 'gu', げ: 'ge', ご: 'go', ざ: 'za', じ: 'ji', ず: 'zu', ぜ: 'ze', ぞ: 'zo', だ: 'da', ぢ: 'ji', づ: 'zu', で: 'de', ど: 'do', ば: 'ba', び: 'bi', ぶ: 'bu', べ: 'be', ぼ: 'bo', ぱ: 'pa', ぴ: 'pi', ぷ: 'pu', ぺ: 'pe', ぽ: 'po', ゔぁ: 'va', ゔぃ: 'vi', ゔ: 'vu', ゔぇ: 've', ゔぉ: 'vo', }; /* eslint-enable */ const SPECIAL_SYMBOLS = { '。': '.', '、': ',', '：': ':', '・': '/', '！': '!', '？': '?', '〜': '~', 'ー': '-', '「': '‘', '」': '’', '『': '“', '』': '”', '［': '[', '］': ']', '（': '(', '）': ')', '｛': '{', '｝': '}', '　': ' ', }; // んい -> n'i const AMBIGUOUS_VOWELS = ['あ', 'い', 'う', 'え', 'お', 'や', 'ゆ', 'よ']; const SMALL_Y = { ゃ: 'ya', ゅ: 'yu', ょ: 'yo' }; const SMALL_Y_EXTRA = { ぃ: 'yi', ぇ: 'ye' }; const SMALL_AIUEO = { ぁ: 'a', ぃ: 'i', ぅ: 'u', ぇ: 'e', ぉ: 'o', }; const YOON_KANA = [ 'き', 'に', 'ひ', 'み', 'り', 'ぎ', 'び', 'ぴ', 'ゔ', 'く', 'ふ', ]; const YOON_EXCEPTIONS = { し: 'sh', ち: 'ch', じ: 'j', ぢ: 'j', }; const SMALL_KANA = { っ: '', ゃ: 'ya', ゅ: 'yu', ょ: 'yo', ぁ: 'a', ぃ: 'i', ぅ: 'u', ぇ: 'e', ぉ: 'o', }; // going with the intuitive (yet incorrect) solution where っや -> yya and っぃ -> ii // in other words, just assume the sokuon could have been applied to anything const SOKUON_WHITELIST = { b: 'b', c: 't', d: 'd', f: 'f', g: 'g', h: 'h', j: 'j', k: 'k', m: 'm', p: 'p', q: 'q', r: 'r', s: 's', t: 't', v: 'v', w: 'w', x: 'x', z: 'z', }; function getKanaToHepburnTree() { if (kanaToHepburnMap == null) { kanaToHepburnMap = createKanaToHepburnMap(); } return kanaToHepburnMap; } function getKanaToRomajiTree(romanization) { switch (romanization) { case ROMANIZATIONS.HEPBURN: return getKanaToHepburnTree(); default: return {}; } } function createKanaToHepburnMap() { const romajiTree = transform(BASIC_ROMAJI); const subtreeOf = (string) => getSubTreeOf(romajiTree, string); const setTrans = (string, transliteration) => { subtreeOf(string)[''] = transliteration; }; Object.entries(SPECIAL_SYMBOLS).forEach(([jsymbol, symbol]) => { subtreeOf(jsymbol)[''] = symbol; }); [...Object.entries(SMALL_Y), ...Object.entries(SMALL_AIUEO)].forEach(([roma, kana]) => { setTrans(roma, kana); }); // きゃ -> kya YOON_KANA.forEach((kana) => { const firstRomajiChar = subtreeOf(kana)[''][0]; Object.entries(SMALL_Y).forEach(([yKana, yRoma]) => { setTrans(kana + yKana, firstRomajiChar + yRoma); }); // きぃ -> kyi Object.entries(SMALL_Y_EXTRA).forEach(([yKana, yRoma]) => { setTrans(kana + yKana, firstRomajiChar + yRoma); }); }); Object.entries(YOON_EXCEPTIONS).forEach(([kana, roma]) => { // じゃ -> ja Object.entries(SMALL_Y).forEach(([yKana, yRoma]) => { setTrans(kana + yKana, roma + yRoma[1]); }); // じぃ -> jyi, じぇ -> je setTrans(`${kana}ぃ`, `${roma}yi`); setTrans(`${kana}ぇ`, `${roma}e`); }); romajiTree['っ'] = resolveTsu(romajiTree); Object.entries(SMALL_KANA).forEach(([kana, roma]) => { setTrans(kana, roma); }); AMBIGUOUS_VOWELS.forEach((kana) => { setTrans(`ん${kana}`, `n'${subtreeOf(kana)['']}`); }); // NOTE: could be re-enabled with an option? // // んば -> mbo // const LABIAL = [ // 'ば', 'び', 'ぶ', 'べ', 'ぼ', // 'ぱ', 'ぴ', 'ぷ', 'ぺ', 'ぽ', // 'ま', 'み', 'む', 'め', 'も', // ]; // LABIAL.forEach((kana) => { // setTrans(`ん${kana}`, `m${subtreeOf(kana)['']}`); // }); return Object.freeze(JSON.parse(JSON.stringify(romajiTree))); } function resolveTsu(tree) { return Object.entries(tree).reduce((tsuTree, [key, value]) => { if (!key) { // we have reached the bottom of this branch const consonant = value.charAt(0); // eslint-disable-next-line no-param-reassign tsuTree[key] = Object.keys(SOKUON_WHITELIST).includes(consonant) ? SOKUON_WHITELIST[consonant] + value : value; } else { // more subtrees // eslint-disable-next-line no-param-reassign tsuTree[key] = resolveTsu(value); } return tsuTree; }, {}); } // memoize and deeply compare args so we only recreate when necessary const createKanaToRomajiMap = memoizeOne((romanization, customRomajiMapping) => { let map = getKanaToRomajiTree(romanization); if (customRomajiMapping) { map = mergeCustomMapping(map, customRomajiMapping); } return map; }, dequal); /** * Convert kana to romaji * @param {String} kana text input * @param {DefaultOptions} [options=defaultOptions] * @param {Object.<string, string>} [map] custom mapping * @return {String} converted text * @example * toRomaj