/* * Copyright (C) 2024 Yomitan Authors * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . */ import {basicTextPreprocessorOptions} from '../text-preprocessors.js'; const optionalDiacritics = [ '\u0618', // Small Fatha '\u0619', // Small Damma '\u061A', // Small Kasra '\u064B', // Fathatan '\u064C', // Dammatan '\u064D', // Kasratan '\u064E', // Fatha '\u064F', // Damma '\u0650', // Kasra '\u0651', // Shadda '\u0652' // Sukun ]; const diacriticsRegex = new RegExp(`[${optionalDiacritics.join('')}]`, 'g'); /** @type {import('language').TextPreprocessor} */ export const removeArabicScriptDiacritics = { name: 'Remove diacritics', description: 'وَلَدَ ⬅️ ولد', options: basicTextPreprocessorOptions, process: (text, setting) => { return setting ? text.replace(diacriticsRegex, '') : text; } };