From 3a2a740b6517d18de726a44b75b34155fe8f1259 Mon Sep 17 00:00:00 2001 From: StefanVukovic99 Date: Mon, 3 Jun 2024 23:11:34 +0200 Subject: [sh] preprocess accent marks (#1024) --- .../sh/serbo-croatian-text-preprocessors.js | 31 ++++++++++++++++++++++ 1 file changed, 31 insertions(+) create mode 100644 ext/js/language/sh/serbo-croatian-text-preprocessors.js (limited to 'ext/js/language/sh/serbo-croatian-text-preprocessors.js') diff --git a/ext/js/language/sh/serbo-croatian-text-preprocessors.js b/ext/js/language/sh/serbo-croatian-text-preprocessors.js new file mode 100644 index 00000000..7b1b69a1 --- /dev/null +++ b/ext/js/language/sh/serbo-croatian-text-preprocessors.js @@ -0,0 +1,31 @@ +/* + * Copyright (C) 2024 Yomitan Authors + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation, either version 3 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see . + */ + +import {basicTextProcessorOptions} from '../text-processors.js'; + +/** @type {import('language').TextProcessor} */ +export const removeSerboCroatianAccentMarks = { + name: 'Remove diacritics', + description: 'A\u0301 → A, a\u0301 → a', + options: basicTextProcessorOptions, + process: (str, setting) => ( + setting ? + str.normalize('NFD').replace(/[aeiourAEIOUR][\u0300-\u036f]/g, (match) => match[0]) : + str + ), + +}; -- cgit v1.2.3