diff options
Diffstat (limited to 'test')
-rw-r--r-- | test/test-document-util.js | 23 | ||||
-rw-r--r-- | test/test-options-util.js | 17 |
2 files changed, 38 insertions, 2 deletions
diff --git a/test/test-document-util.js b/test/test-document-util.js index 09f0c5e7..2311e25f 100644 --- a/test/test-document-util.js +++ b/test/test-document-util.js @@ -181,8 +181,29 @@ async function testDocumentTextScanningFunctions(dom, {DocumentUtil, TextSourceR } if (source === null) { continue; } + // Sentence info + const terminatorString = '…。..??!!'; + const terminatorMap = new Map(); + for (const char of terminatorString) { + terminatorMap.set(char, [false, true]); + } + const quoteArray = [['「', '」'], ['『', '』'], ['\'', '\''], ['"', '"']]; + const forwardQuoteMap = new Map(); + const backwardQuoteMap = new Map(); + for (const [char1, char2] of quoteArray) { + forwardQuoteMap.set(char1, [char2, false]); + backwardQuoteMap.set(char2, [char1, false]); + } + // Test docSentenceExtract - const sentenceActual = documentUtil.extractSentence(source, false, sentenceScanExtent).text; + const sentenceActual = documentUtil.extractSentence( + source, + false, + sentenceScanExtent, + terminatorMap, + forwardQuoteMap, + backwardQuoteMap + ).text; assert.strictEqual(sentenceActual, sentence); // Clean diff --git a/test/test-options-util.js b/test/test-options-util.js index 8b7254c6..5ce9313e 100644 --- a/test/test-options-util.js +++ b/test/test-options-util.js @@ -420,7 +420,22 @@ function createProfileOptionsUpdatedTestData1() { fieldTemplates: null }, sentenceParsing: { - scanExtent: 200 + scanExtent: 200, + enableTerminationCharacters: true, + terminationCharacters: [ + {enabled: true, character1: '「', character2: '」', includeCharacterAtStart: false, includeCharacterAtEnd: false}, + {enabled: true, character1: '『', character2: '』', includeCharacterAtStart: false, includeCharacterAtEnd: false}, + {enabled: true, character1: '"', character2: '"', includeCharacterAtStart: false, includeCharacterAtEnd: false}, + {enabled: true, character1: '\'', character2: '\'', includeCharacterAtStart: false, includeCharacterAtEnd: false}, + {enabled: true, character1: '.', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true}, + {enabled: true, character1: '!', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true}, + {enabled: true, character1: '?', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true}, + {enabled: true, character1: '.', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true}, + {enabled: true, character1: '。', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true}, + {enabled: true, character1: '!', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true}, + {enabled: true, character1: '?', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true}, + {enabled: true, character1: '…', character2: null, includeCharacterAtStart: false, includeCharacterAtEnd: true} + ] } }; } |