From d2e9841f96ebff61d4a5c26a322484f6268115f1 Mon Sep 17 00:00:00 2001 From: StefanVukovic99 Date: Fri, 22 Mar 2024 15:27:35 +0100 Subject: expand deinflection format (#745) * abstract deinflections * undo redundant changes * remove cast * switch to js * MultiLanguageTransformer * comments * comments * fix test * suffixInflection * fix bench * substring instead of replace * without heuristic * suffixMap * add other language deinflections * wip * catch cycles * fix tests * uninflect to deinflect * use less regex * add suru masu stem deinflection --- ext/js/language/language-transforms.js | 54 ++++++++++++++++++++++++++++++++++ 1 file changed, 54 insertions(+) create mode 100644 ext/js/language/language-transforms.js (limited to 'ext/js/language/language-transforms.js') diff --git a/ext/js/language/language-transforms.js b/ext/js/language/language-transforms.js new file mode 100644 index 00000000..ee8af88b --- /dev/null +++ b/ext/js/language/language-transforms.js @@ -0,0 +1,54 @@ +/* + * Copyright (C) 2024 Yomitan Authors + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation, either version 3 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see . + */ + + +/** + * @param {string} inflectedSuffix + * @param {string} deinflectedSuffix + * @param {string[]} conditionsIn + * @param {string[]} conditionsOut + * @returns {import('language-transformer').SuffixRule} + */ +export function suffixInflection(inflectedSuffix, deinflectedSuffix, conditionsIn, conditionsOut) { + const suffixRegExp = new RegExp(inflectedSuffix + '$'); + return { + type: 'suffix', + isInflected: suffixRegExp, + deinflected: deinflectedSuffix, + deinflect: (text) => text.slice(0, -inflectedSuffix.length) + deinflectedSuffix, + conditionsIn, + conditionsOut + }; +} + +/** + * @param {string} inflectedPrefix + * @param {string} deinflectedPrefix + * @param {string[]} conditionsIn + * @param {string[]} conditionsOut + * @returns {import('language-transformer').Rule} + */ +export function prefixInflection(inflectedPrefix, deinflectedPrefix, conditionsIn, conditionsOut) { + const prefixRegExp = new RegExp('^' + inflectedPrefix); + return { + type: 'prefix', + isInflected: prefixRegExp, + deinflect: (text) => deinflectedPrefix + text.slice(inflectedPrefix.length), + conditionsIn, + conditionsOut + }; +} -- cgit v1.2.3