diff options
author | StefanVukovic99 <stefanvukovic44@gmail.com> | 2024-03-22 15:27:35 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-03-22 14:27:35 +0000 |
commit | d2e9841f96ebff61d4a5c26a322484f6268115f1 (patch) | |
tree | 3c1351fa3b25994eab8456ea8457ee153bb98aa9 /ext/js/language/language-transforms.js | |
parent | 7681131782d958997663b1fb443a3e32e8eef550 (diff) |
expand deinflection format (#745)
* abstract deinflections
* undo redundant changes
* remove cast
* switch to js
* MultiLanguageTransformer
* comments
* comments
* fix test
* suffixInflection
* fix bench
* substring instead of replace
* without heuristic
* suffixMap
* add other language deinflections
* wip
* catch cycles
* fix tests
* uninflect to deinflect
* use less regex
* add suru masu stem deinflection
Diffstat (limited to 'ext/js/language/language-transforms.js')
-rw-r--r-- | ext/js/language/language-transforms.js | 54 |
1 files changed, 54 insertions, 0 deletions
diff --git a/ext/js/language/language-transforms.js b/ext/js/language/language-transforms.js new file mode 100644 index 00000000..ee8af88b --- /dev/null +++ b/ext/js/language/language-transforms.js @@ -0,0 +1,54 @@ +/* + * Copyright (C) 2024 Yomitan Authors + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation, either version 3 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see <https://www.gnu.org/licenses/>. + */ + + +/** + * @param {string} inflectedSuffix + * @param {string} deinflectedSuffix + * @param {string[]} conditionsIn + * @param {string[]} conditionsOut + * @returns {import('language-transformer').SuffixRule} + */ +export function suffixInflection(inflectedSuffix, deinflectedSuffix, conditionsIn, conditionsOut) { + const suffixRegExp = new RegExp(inflectedSuffix + '$'); + return { + type: 'suffix', + isInflected: suffixRegExp, + deinflected: deinflectedSuffix, + deinflect: (text) => text.slice(0, -inflectedSuffix.length) + deinflectedSuffix, + conditionsIn, + conditionsOut + }; +} + +/** + * @param {string} inflectedPrefix + * @param {string} deinflectedPrefix + * @param {string[]} conditionsIn + * @param {string[]} conditionsOut + * @returns {import('language-transformer').Rule} + */ +export function prefixInflection(inflectedPrefix, deinflectedPrefix, conditionsIn, conditionsOut) { + const prefixRegExp = new RegExp('^' + inflectedPrefix); + return { + type: 'prefix', + isInflected: prefixRegExp, + deinflect: (text) => deinflectedPrefix + text.slice(inflectedPrefix.length), + conditionsIn, + conditionsOut + }; +} |