diff options
| author | toasted-nutbread <toasted-nutbread@users.noreply.github.com> | 2024-02-25 11:20:44 -0500 | 
|---|---|---|
| committer | GitHub <noreply@github.com> | 2024-02-25 16:20:44 +0000 | 
| commit | 2e9ea19207a7410f929bb908759d48cb2340f29c (patch) | |
| tree | a6bde1297d693bb8d50e4c93a963aa3179e5a2ce /ext | |
| parent | 73169f06dff767020718a5715eba97d3575ba7e1 (diff) | |
"isJapanese" check move (#730)
* Move isStringPartiallyJapanese out of ClipboardMonitor
* Create isStringPartiallyJapanese function
* Add textMayBeTranslatable
* Rename API function
* Rename internal function
* Add helper
* Update translatable check
* Pass language to TextScanner
* Pass language explicitly
* Use textMayBeTranslatable
* No redundant translatable check
* Update eslint
* Remove double newline
* Collapse
* Rename
Diffstat (limited to 'ext')

| mode | file | lines changed |
|---|---|---|
| -rw-r--r-- | ext/js/app/frontend.js | 1 |
| -rw-r--r-- | ext/js/background/backend.js | 18 |
| -rw-r--r-- | ext/js/comm/api.js | 9 |
| -rw-r--r-- | ext/js/comm/clipboard-monitor.js | 3 |
| -rw-r--r-- | ext/js/display/display-generator.js | 32 |
| -rw-r--r-- | ext/js/display/display.js | 2 |
| -rw-r--r-- | ext/js/display/query-parser.js | 3 |
| -rw-r--r-- | ext/js/display/sandbox/structured-content-generator.js | 9 |
| -rw-r--r-- | ext/js/display/search-display-controller.js | 21 |
| -rw-r--r-- | ext/js/language/language-descriptors.js | 2 |
| -rwxr-xr-x | ext/js/language/languages.js | 11 |
| -rw-r--r-- | ext/js/language/text-scanner.js | 12 |
| -rw-r--r-- | ext/js/language/text-utilities.js | 29 |

13 files changed, 118 insertions, 34 deletions
| diff --git a/ext/js/app/frontend.js b/ext/js/app/frontend.js index 0b7393a0..4c0faef1 100644 --- a/ext/js/app/frontend.js +++ b/ext/js/app/frontend.js @@ -474,6 +474,7 @@ export class Frontend {          await this._updatePopup();          const preventMiddleMouse = this._getPreventMiddleMouseValueForPageType(scanningOptions.preventMiddleMouse); +        this._textScanner.language = options.general.language;          this._textScanner.setOptions({              inputs: scanningOptions.inputs,              deepContentScan: scanningOptions.deepDomScan, diff --git a/ext/js/background/backend.js b/ext/js/background/backend.js index 79023ac9..6340d021 100644 --- a/ext/js/background/backend.js +++ b/ext/js/background/backend.js @@ -34,8 +34,8 @@ import {arrayBufferToBase64} from '../data/sandbox/array-buffer-util.js';  import {DictionaryDatabase} from '../dictionary/dictionary-database.js';  import {Environment} from '../extension/environment.js';  import {ObjectPropertyAccessor} from '../general/object-property-accessor.js'; -import {distributeFuriganaInflected, isCodePointJapanese, isStringPartiallyJapanese, convertKatakanaToHiragana as jpConvertKatakanaToHiragana} from '../language/ja/japanese.js'; -import {getLanguageSummaries} from '../language/languages.js'; +import {distributeFuriganaInflected, isCodePointJapanese, convertKatakanaToHiragana as jpConvertKatakanaToHiragana} from '../language/ja/japanese.js'; +import {getLanguageSummaries, isTextLookupWorthy} from '../language/languages.js';  import {Translator} from '../language/translator.js';  import {AudioDownloader} from '../media/audio-downloader.js';  import {getFileExtensionFromAudioMediaType, getFileExtensionFromImageMediaType} from '../media/media-util.js'; @@ -175,7 +175,7 @@ export class Backend {              ['isTabSearchPopup',             this._onApiIsTabSearchPopup.bind(this)],              ['triggerDatabaseUpdated',       this._onApiTriggerDatabaseUpdated.bind(this)],              ['testMecab',     
               this._onApiTestMecab.bind(this)], -            ['textHasJapaneseCharacters',    this._onApiTextHasJapaneseCharacters.bind(this)], +            ['isTextLookupWorthy',           this._onApiIsTextLookupWorthy.bind(this)],              ['getTermFrequencies',           this._onApiGetTermFrequencies.bind(this)],              ['findAnkiNotes',                this._onApiFindAnkiNotes.bind(this)],              ['openCrossFramePort',           this._onApiOpenCrossFramePort.bind(this)], @@ -310,7 +310,11 @@ export class Backend {       * @param {import('clipboard-monitor').EventArgument<'change'>} details       */      async _onClipboardTextChange({text}) { -        const {clipboard: {maximumSearchLength}} = this._getProfileOptions({current: true}, false); +        const { +            general: {language}, +            clipboard: {maximumSearchLength} +        } = this._getProfileOptions({current: true}, false); +        if (!isTextLookupWorthy(text, language)) { return; }          if (text.length > maximumSearchLength) {              text = text.substring(0, maximumSearchLength);          } @@ -839,9 +843,9 @@ export class Backend {          return true;      } -    /** @type {import('api').ApiHandler<'textHasJapaneseCharacters'>} */ -    _onApiTextHasJapaneseCharacters({text}) { -        return isStringPartiallyJapanese(text); +    /** @type {import('api').ApiHandler<'isTextLookupWorthy'>} */ +    _onApiIsTextLookupWorthy({text, language}) { +        return isTextLookupWorthy(text, language);      }      /** @type {import('api').ApiHandler<'getTermFrequencies'>} */ diff --git a/ext/js/comm/api.js b/ext/js/comm/api.js index 30fcfc29..e8db7846 100644 --- a/ext/js/comm/api.js +++ b/ext/js/comm/api.js @@ -321,11 +321,12 @@ export class API {      }      /** -     * @param {import('api').ApiParam<'textHasJapaneseCharacters', 'text'>} text -     * @returns {Promise<import('api').ApiReturn<'textHasJapaneseCharacters'>>} +     * @param 
{import('api').ApiParam<'isTextLookupWorthy', 'text'>} text +     * @param {import('api').ApiParam<'isTextLookupWorthy', 'language'>} language +     * @returns {Promise<import('api').ApiReturn<'isTextLookupWorthy'>>}       */ -    textHasJapaneseCharacters(text) { -        return this._invoke('textHasJapaneseCharacters', {text}); +    isTextLookupWorthy(text, language) { +        return this._invoke('isTextLookupWorthy', {text, language});      }      /** diff --git a/ext/js/comm/clipboard-monitor.js b/ext/js/comm/clipboard-monitor.js index d101b467..067ecb67 100644 --- a/ext/js/comm/clipboard-monitor.js +++ b/ext/js/comm/clipboard-monitor.js @@ -17,7 +17,6 @@   */  import {EventDispatcher} from '../core/event-dispatcher.js'; -import {isStringPartiallyJapanese} from '../language/ja/japanese.js';  /**   * @augments EventDispatcher<import('clipboard-monitor').Events> @@ -71,7 +70,7 @@ export class ClipboardMonitor extends EventDispatcher {                  text !== this._previousText              ) {                  this._previousText = text; -                if (canChange && isStringPartiallyJapanese(text)) { +                if (canChange) {                      this.trigger('change', {text});                  }              } diff --git a/ext/js/display/display-generator.js b/ext/js/display/display-generator.js index 22912e9f..0b3236e9 100644 --- a/ext/js/display/display-generator.js +++ b/ext/js/display/display-generator.js @@ -20,7 +20,8 @@ import {ExtensionError} from '../core/extension-error.js';  import {isObject} from '../core/utilities.js';  import {getDisambiguations, getGroupedPronunciations, getTermFrequency, groupKanjiFrequencies, groupTermFrequencies, groupTermTags, isNonNounVerbOrAdjective} from '../dictionary/dictionary-data-util.js';  import {HtmlTemplateCollection} from '../dom/html-template-collection.js'; -import {distributeFurigana, getKanaMorae, getPitchCategory, isCodePointKanji, isStringPartiallyJapanese} from '../language/ja/japanese.js'; 
+import {distributeFurigana, getKanaMorae, getPitchCategory, isCodePointKanji} from '../language/ja/japanese.js'; +import {getLanguageFromText} from '../language/text-utilities.js';  import {createPronunciationDownstepPosition, createPronunciationGraph, createPronunciationText} from './sandbox/pronunciation-generator.js';  import {StructuredContentGenerator} from './sandbox/structured-content-generator.js'; @@ -991,12 +992,7 @@ export class DisplayGenerator {       * @param {string} [language]       */      _setTextContent(node, value, language) { -        if (typeof language === 'string') { -            node.lang = language; -        } else if (isStringPartiallyJapanese(value)) { -            node.lang = 'ja'; -        } - +        this._setElementLanguage(node, language, value);          node.textContent = value;      } @@ -1008,11 +1004,7 @@ export class DisplayGenerator {      _setMultilineTextContent(node, value, language) {          // This can't just call _setTextContent because the lack of <br> elements will          // cause the text to not copy correctly. 
-        if (typeof language === 'string') { -            node.lang = language; -        } else if (isStringPartiallyJapanese(value)) { -            node.lang = 'ja'; -        } +        this._setElementLanguage(node, language, value);          let start = 0;          while (true) { @@ -1029,6 +1021,22 @@ export class DisplayGenerator {      }      /** +     * @param {HTMLElement} element +     * @param {string|undefined} language +     * @param {string} content +     */ +    _setElementLanguage(element, language, content) { +        if (typeof language === 'string') { +            element.lang = language; +        } else { +            const language2 = getLanguageFromText(content); +            if (language2 !== null) { +                element.lang = language2; +            } +        } +    } + +    /**       * @param {string} reading       * @param {import('dictionary').TermPronunciation[]} termPronunciations       * @param {string[]} wordClasses diff --git a/ext/js/display/display.js b/ext/js/display/display.js index f6efb5ac..80f5e9ae 100644 --- a/ext/js/display/display.js +++ b/ext/js/display/display.js @@ -425,6 +425,7 @@ export class Display extends EventDispatcher {              readingMode: options.parsing.readingMode,              useInternalParser: options.parsing.enableScanningParser,              useMecabParser: options.parsing.enableMecabParser, +            language: options.general.language,              scanning: {                  inputs: scanningOptions.inputs,                  deepContentScan: scanningOptions.deepDomScan, @@ -1834,6 +1835,7 @@ export class Display extends EventDispatcher {          }          const {scanning: scanningOptions, sentenceParsing: sentenceParsingOptions} = options; +        this._contentTextScanner.language = options.general.language;          this._contentTextScanner.setOptions({              inputs: [{                  include: 'mouse0', diff --git a/ext/js/display/query-parser.js 
b/ext/js/display/query-parser.js index d27b9394..f6c26ce7 100644 --- a/ext/js/display/query-parser.js +++ b/ext/js/display/query-parser.js @@ -92,7 +92,7 @@ export class QueryParser extends EventDispatcher {      /**       * @param {import('display').QueryParserOptions} display       */ -    setOptions({selectedParser, termSpacing, readingMode, useInternalParser, useMecabParser, scanning}) { +    setOptions({selectedParser, termSpacing, readingMode, useInternalParser, useMecabParser, language, scanning}) {          let selectedParserChanged = false;          if (selectedParser === null || typeof selectedParser === 'string') {              selectedParserChanged = (this._selectedParser !== selectedParser); @@ -115,6 +115,7 @@ export class QueryParser extends EventDispatcher {              if (typeof scanLength === 'number') {                  this._scanLength = scanLength;              } +            this._textScanner.language = language;              this._textScanner.setOptions(scanning);          }          this._textScanner.setEnabled(true); diff --git a/ext/js/display/sandbox/structured-content-generator.js b/ext/js/display/sandbox/structured-content-generator.js index 1dfde39b..90a47158 100644 --- a/ext/js/display/sandbox/structured-content-generator.js +++ b/ext/js/display/sandbox/structured-content-generator.js @@ -16,7 +16,7 @@   * along with this program.  If not, see <https://www.gnu.org/licenses/>.   
*/ -import {isStringPartiallyJapanese} from '../../language/ja/japanese.js'; +import {getLanguageFromText} from '../../language/text-utilities.js';  export class StructuredContentGenerator {      /** @@ -163,8 +163,11 @@ export class StructuredContentGenerator {          if (typeof content === 'string') {              if (content.length > 0) {                  container.appendChild(this._createTextNode(content)); -                if (language === null && isStringPartiallyJapanese(content)) { -                    container.lang = 'ja'; +                if (language === null) { +                    const language2 = getLanguageFromText(content); +                    if (language2 !== null) { +                        container.lang = language2; +                    }                  }              }              return; diff --git a/ext/js/display/search-display-controller.js b/ext/js/display/search-display-controller.js index e23d5d50..00f5efc6 100644 --- a/ext/js/display/search-display-controller.js +++ b/ext/js/display/search-display-controller.js @@ -103,7 +103,7 @@ export class SearchDisplayController {          this._searchBackButton.addEventListener('click', this._onSearchBackButtonClick.bind(this), false);          this._wanakanaEnableCheckbox.addEventListener('change', this._onWanakanaEnableChange.bind(this));          window.addEventListener('copy', this._onCopy.bind(this)); -        this._clipboardMonitor.on('change', this._onExternalSearchUpdate.bind(this)); +        this._clipboardMonitor.on('change', this._onClipboardMonitorChange.bind(this));          this._clipboardMonitorEnableCheckbox.addEventListener('change', this._onClipboardMonitorEnableChange.bind(this));          this._display.hotkeyHandler.on('keydownNonHotkey', this._onKeyDown.bind(this)); @@ -271,9 +271,26 @@ export class SearchDisplayController {      }      /** @type {import('application').ApiHandler<'searchDisplayControllerUpdateSearchQuery'>} */ -    _onExternalSearchUpdate({text, 
animate = true}) { +    _onExternalSearchUpdate({text, animate}) { +        void this._updateSearchFromClipboard(text, animate, false); +    } + +    /** +     * @param {import('clipboard-monitor').Events['change']} event +     */ +    _onClipboardMonitorChange({text}) { +        void this._updateSearchFromClipboard(text, true, true); +    } + +    /** +     * @param {string} text +     * @param {boolean} animate +     * @param {boolean} checkText +     */ +    async _updateSearchFromClipboard(text, animate, checkText) {          const options = this._display.getOptions();          if (options === null) { return; } +        if (checkText && !await this._display.application.api.isTextLookupWorthy(text, options.general.language)) { return; }          const {clipboard: {autoSearchContent, maximumSearchLength}} = options;          if (text.length > maximumSearchLength) {              text = text.substring(0, maximumSearchLength); diff --git a/ext/js/language/language-descriptors.js b/ext/js/language/language-descriptors.js index beb1417e..d78a96e5 100644 --- a/ext/js/language/language-descriptors.js +++ b/ext/js/language/language-descriptors.js @@ -18,6 +18,7 @@  import {removeArabicScriptDiacritics} from './ar/arabic-text-preprocessors.js';  import {eszettPreprocessor} from './de/german-text-preprocessors.js';  import {collapseEmphaticSequences, convertAlphabeticCharacters, convertHalfWidthCharacters, convertHiraganaToKatakana, convertNumericCharacters} from './ja/japanese-text-preprocessors.js'; +import {isStringPartiallyJapanese} from './ja/japanese.js';  import {removeLatinDiacritics} from './la/latin-text-preprocessors.js';  import {removeRussianDiacritics, yoToE} from './ru/russian-text-preprocessors.js';  import {capitalizeFirstLetter, decapitalize} from './text-preprocessors.js'; @@ -114,6 +115,7 @@ const languageDescriptors = [          iso: 'ja',          name: 'Japanese',          exampleText: '読め', +        isTextLookupWorthy: isStringPartiallyJapanese,     
     textPreprocessors: {              convertHalfWidthCharacters,              convertNumericCharacters, diff --git a/ext/js/language/languages.js b/ext/js/language/languages.js index f964dfec..fd58477d 100755 --- a/ext/js/language/languages.js +++ b/ext/js/language/languages.js @@ -47,3 +47,14 @@ export function getAllLanguageTextPreprocessors() {      }      return results;  } + +/** + * @param {string} text + * @param {string} language + * @returns {boolean} + */ +export function isTextLookupWorthy(text, language) { +    const descriptor = languageDescriptorMap.get(language); +    if (typeof descriptor === 'undefined') { return false; } +    return typeof descriptor.isTextLookupWorthy === 'undefined' || descriptor.isTextLookupWorthy(text); +} diff --git a/ext/js/language/text-scanner.js b/ext/js/language/text-scanner.js index 64333093..ad5ba12b 100644 --- a/ext/js/language/text-scanner.js +++ b/ext/js/language/text-scanner.js @@ -70,6 +70,8 @@ export class TextScanner extends EventDispatcher {          this._includeSelector = null;          /** @type {?string} */          this._excludeSelector = null; +        /** @type {?string} */ +        this._language = null;          /** @type {?import('text-scanner').InputInfo} */          this._inputInfoCurrent = null; @@ -188,6 +190,10 @@ export class TextScanner extends EventDispatcher {          this._excludeSelector = value;      } +    /** @type {?string} */ +    get language() { return this._language; } +    set language(value) { this._language = value; } +      /** */      prepare() {          this._isPrepared = true; @@ -449,7 +455,7 @@ export class TextScanner extends EventDispatcher {              const result = await this._findDictionaryEntries(textSource, searchTerms, searchKanji, optionsContext);              if (result !== null) {                  ({dictionaryEntries, sentence, type} = result); -            } else if (textSource !== null && textSource instanceof TextSourceElement && await 
this._hasJapanese(textSource.fullContent)) { +            } else if (textSource !== null && textSource instanceof TextSourceElement && await this._isTextLookupWorthy(textSource.fullContent)) {                  dictionaryEntries = [];                  sentence = {text: '', offset: 0};              } @@ -1549,9 +1555,9 @@ export class TextScanner extends EventDispatcher {       * @param {string} text       * @returns {Promise<boolean>}       */ -    async _hasJapanese(text) { +    async _isTextLookupWorthy(text) {          try { -            return await this._api.textHasJapaneseCharacters(text); +            return this._language !== null && await this._api.isTextLookupWorthy(text, this._language);          } catch (e) {              return false;          } diff --git a/ext/js/language/text-utilities.js b/ext/js/language/text-utilities.js new file mode 100644 index 00000000..ca8958aa --- /dev/null +++ b/ext/js/language/text-utilities.js @@ -0,0 +1,29 @@ +/* + * Copyright (C) 2024  Yomitan Authors + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation, either version 3 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program.  If not, see <https://www.gnu.org/licenses/>. + */ + +import {isStringPartiallyJapanese} from './ja/japanese.js'; + +/** + * Returns the language that the string might be by using some heuristic checks. + * Values returned are ISO codes. `null` is returned if no language can be determined. 
+ * @param {string} text + * @returns {?string} + */ +export function getLanguageFromText(text) { +    if (isStringPartiallyJapanese(text)) { return 'ja'; } +    return null; +} |