From c110f0860e2ae7bc378c36f8eb6048956ebc3a28 Mon Sep 17 00:00:00 2001 From: DW <36347199+chocological00@users.noreply.github.com> Date: Mon, 3 Feb 2020 18:30:49 -0500 Subject: [PATCH] Korean, English Nyaziation and special case exclusion (#5813) --- src/misc/nyaize.ts | 50 ++++++++++++++++++++++++++++++++++++++++++++-- 1 file changed, 48 insertions(+), 2 deletions(-) diff --git a/src/misc/nyaize.ts b/src/misc/nyaize.ts index 38c710176..0b9b83d9a 100644 --- a/src/misc/nyaize.ts +++ b/src/misc/nyaize.ts @@ -1,11 +1,57 @@ +import rndstr from 'rndstr'; + export function nyaize(text: string): string { - return text + const [toNyaize, exclusionMap] = exclude(text); + const nyaized = toNyaize // ja-JP .replace(/な/g, 'にゃ').replace(/ナ/g, 'ニャ').replace(/ナ/g, 'ニャ') // en-US .replace(/morning/gi, 'mornyan').replace(/everyone/gi, 'everynyan') + .replace(/o/g, 'owo').replace(/u/g, 'uwu') // ko-KR .replace(/[나-낳]/g, match => String.fromCharCode( - match.codePointAt(0)! + '냐'.charCodeAt(0) - '나'.charCodeAt(0) + match.charCodeAt(0)! + '냐'.charCodeAt(0) - '나'.charCodeAt(0) + )).replace(/(다$)|(다(?=\.))|(다(?= ))|(다(?=!))|(다(?=\?))/gm, '다냥') + .replace(/(야(?=\?))|(야$)|(야(?= ))/gm, '냥'); + return replaceExceptions(nyaized, exclusionMap); +} + +export function denyaize(text: string): string { + return text + .replace(/にゃ/g, 'な').replace(/ニャ/g, 'ナ').replace(/ニャ/g, 'ナ') + .replace(/owo/g, 'o').replace(/uwu/g, 'u') + .replace(/mornyan/gi, 'morning').replace(/everynyan/gi, 'everyone') // this will result in case related bug + .replace(/(다냥$)|(다냥(?=\.))|(다냥(?= ))|(다냥(?=!))|(다냥(?=\?))/gm, '다') + .replace(/(냥(?=\?))|(냥$)|(냥(?= ))/gm, '야') + .replace(/[냐-냫]/g, match => String.fromCharCode( + match.charCodeAt(0)! + '나'.charCodeAt(0) - '냐'.charCodeAt(0) )); } + +function exclude(text: string): [string, Record] { + const map: Record = {}; + function substitute(match: string): string { + let randomstr: string; + do { + randomstr = rndstr({ length: 16, chars: '🀀-🀫' }); + } while(Object.prototype.hasOwnProperty.call(map, randomstr)); + map[randomstr] = match; + return randomstr; + } + const replaced = text + .replace(/(https?:\/\/.*?)(?= |$)/gm, match => substitute(match)) // URL + .replace(/:([a-z0-9_+-]+):/gim, match => substitute(match)) // emoji + .replace(/#([^\s.,!?'"#:\/\[\]【】]+)/gm, match => substitute(match)) // hashtag + .replace(/@\w([\w-]*\w)?(?:@[\w.\-]+\w)?/gm, match => substitute(match)) // mention + .replace(/<\/?[a-zA-Z]*?>/g, match => substitute(match)) // , , etc. + .replace(/`([^`\n]+?)`/g, match => substitute(match)) // inline code + .replace(/```(.+?)?\n([\s\S]+?)```(\n|$)/gm, match => substitute(match)); // code block + return [replaced, map]; +} + +function replaceExceptions(text: string, map: Record): string { + for(const rule in map) + if(Object.prototype.hasOwnProperty.call(map, rule)) + text = text.replace(rule, map[rule]); + return text; +} \ No newline at end of file