diff options
author | toasted-nutbread <toasted-nutbread@users.noreply.github.com> | 2021-02-26 23:23:16 -0500 |
---|---|---|
committer | GitHub <noreply@github.com> | 2021-02-26 23:23:16 -0500 |
commit | 0bf0620c3579a5fe94c529673db105a83d6c3755 (patch) | |
tree | 8a49078a858c4e8b41959f93bb0a8aea162e97cc /test/test-japanese.js | |
parent | b994414b14b224c02359b5e31f6994653a3d4458 (diff) |
Improve kana segmentation (#1446)
* Improve edge case furigana distribution for mixed hiragana/katakana
* Update/add tests
Diffstat (limited to 'test/test-japanese.js')
-rw-r--r-- | test/test-japanese.js | 21 |
1 file changed, 17 insertions, 4 deletions
```diff
diff --git a/test/test-japanese.js b/test/test-japanese.js
index 590d3157..1a4fc494 100644
--- a/test/test-japanese.js
+++ b/test/test-japanese.js
@@ -402,7 +402,8 @@ function testDistributeFurigana() {
         [
             ['スズメの涙', 'すずめのなみだ'],
             [
-                {text: 'スズメの', furigana: 'すずめの'},
+                {text: 'スズメ', furigana: 'すずめ'},
+                {text: 'の', furigana: ''},
                 {text: '涙', furigana: 'なみだ'}
             ]
         ],
@@ -464,14 +465,16 @@ function testDistributeFurigana() {
         [
             ['くノ一', 'くのいち'],
             [
-                {text: 'くノ', furigana: 'くの'},
+                {text: 'く', furigana: ''},
+                {text: 'ノ', furigana: 'の'},
                 {text: '一', furigana: 'いち'}
             ]
         ],
         [
             ['くノ一', 'くのいち'],
             [
-                {text: 'くノ', furigana: 'くの'},
+                {text: 'く', furigana: ''},
+                {text: 'ノ', furigana: 'の'},
                 {text: '一', furigana: 'いち'}
             ]
         ],
@@ -691,9 +694,19 @@ function testDistributeFurigana() {
         [
             ['ページ違反', 'ぺーじいはん'],
             [
-                {text: 'ページ', furigana: 'ぺーじ'},
+                {text: 'ペ', furigana: 'ぺ'},
+                {text: 'ー', furigana: ''},
+                {text: 'ジ', furigana: 'じ'},
                 {text: '違反', furigana: 'いはん'}
             ]
+        ],
+        // Mismatched kana
+        [
+            ['サボる', 'サボル'],
+            [
+                {text: 'サボ', furigana: ''},
+                {text: 'る', furigana: 'ル'}
+            ]
         ]
     ];
 
```