From 3a2a740b6517d18de726a44b75b34155fe8f1259 Mon Sep 17 00:00:00 2001 From: StefanVukovic99 Date: Mon, 3 Jun 2024 23:11:34 +0200 Subject: [sh] preprocess accent marks (#1024) --- ext/js/language/language-descriptors.js | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) (limited to 'ext/js/language/language-descriptors.js') diff --git a/ext/js/language/language-descriptors.js b/ext/js/language/language-descriptors.js index defd73a8..98d3f6c8 100644 --- a/ext/js/language/language-descriptors.js +++ b/ext/js/language/language-descriptors.js @@ -34,6 +34,7 @@ import {koreanTransforms} from './ko/korean-transforms.js'; import {latinTransforms} from './la/latin-transforms.js'; import {removeRussianDiacritics, yoToE} from './ru/russian-text-preprocessors.js'; import {oldIrishTransforms} from './sga/old-irish-transforms.js'; +import {removeSerboCroatianAccentMarks} from './sh/serbo-croatian-text-preprocessors.js'; import {albanianTransforms} from './sq/albanian-transforms.js'; import {capitalizeFirstLetter, decapitalize, removeAlphabeticDiacritics} from './text-processors.js'; import {isStringPartiallyChinese} from './zh/chinese.js'; @@ -224,7 +225,10 @@ const languageDescriptors = [ iso: 'sh', name: 'Serbo-Croatian', exampleText: 'čitaše', - textPreprocessors: capitalizationPreprocessors, + textPreprocessors: { + ...capitalizationPreprocessors, + removeSerboCroatianAccentMarks, + }, }, { iso: 'sq', -- cgit v1.2.3