1*6777b538SAndroid Build Coastguard Workerdiff --git a/source/data/brkitr/ja.txt b/source/data/brkitr/ja.txt 2*6777b538SAndroid Build Coastguard Workerindex 363a74f6..7ae4b8f6 100644 3*6777b538SAndroid Build Coastguard Worker--- a/source/data/brkitr/ja.txt 4*6777b538SAndroid Build Coastguard Worker+++ b/source/data/brkitr/ja.txt 5*6777b538SAndroid Build Coastguard Worker@@ -11,6 +11,7 @@ ja{ 6*6777b538SAndroid Build Coastguard Worker line_phrase:process(dependency){"line_phrase_cj.brk"} 7*6777b538SAndroid Build Coastguard Worker line_strict:process(dependency){"line.brk"} 8*6777b538SAndroid Build Coastguard Worker line_strict_phrase:process(dependency){"line_phrase_cj.brk"} 9*6777b538SAndroid Build Coastguard Worker+ word:process(dependency){"word_ja.brk"} 10*6777b538SAndroid Build Coastguard Worker } 11*6777b538SAndroid Build Coastguard Worker extensions{ 12*6777b538SAndroid Build Coastguard Worker } 13*6777b538SAndroid Build Coastguard Workerdiff --git a/source/data/brkitr/rules/word.txt b/source/data/brkitr/rules/word.txt 14*6777b538SAndroid Build Coastguard Workerindex b4603823..58c18cbc 100644 15*6777b538SAndroid Build Coastguard Worker--- a/source/data/brkitr/rules/word.txt 16*6777b538SAndroid Build Coastguard Worker+++ b/source/data/brkitr/rules/word.txt 17*6777b538SAndroid Build Coastguard Worker@@ -84,13 +84,11 @@ $Control = [\p{Grapheme_Cluster_Break = Control}]; 18*6777b538SAndroid Build Coastguard Worker $HangulSyllable = [\uac00-\ud7a3]; 19*6777b538SAndroid Build Coastguard Worker $ComplexContext = [:LineBreak = Complex_Context:]; 20*6777b538SAndroid Build Coastguard Worker $KanaKanji = [$Han $Hiragana $Katakana]; 21*6777b538SAndroid Build Coastguard Worker-$dictionaryCJK = [$KanaKanji $HangulSyllable]; 22*6777b538SAndroid Build Coastguard Worker-$dictionary = [$ComplexContext $dictionaryCJK]; 23*6777b538SAndroid Build Coastguard Worker+$dictionary = [$ComplexContext]; 24*6777b538SAndroid Build Coastguard Worker 25*6777b538SAndroid Build Coastguard Worker # TODO: check if handling of katakana in dictionary makes rules incorrect/void 26*6777b538SAndroid Build Coastguard Worker 27*6777b538SAndroid Build Coastguard Worker-# leave CJK scripts out of ALetterPlus 28*6777b538SAndroid Build Coastguard Worker-$ALetterPlus = [$ALetter-$dictionaryCJK [$ComplexContext-$Extend-$Control]]; 29*6777b538SAndroid Build Coastguard Worker+$ALetterPlus = [$ALetter [$ComplexContext-$Extend-$Control]]; 30*6777b538SAndroid Build Coastguard Worker 31*6777b538SAndroid Build Coastguard Worker 32*6777b538SAndroid Build Coastguard Worker ## ------------------------------------------------- 33*6777b538SAndroid Build Coastguard Worker@@ -185,10 +183,6 @@ $ExtendNumLet $ExFm* $Katakana {400}; # (13b) 34*6777b538SAndroid Build Coastguard Worker # 35*6777b538SAndroid Build Coastguard Worker ^$Regional_Indicator $ExFm* $Regional_Indicator; 36*6777b538SAndroid Build Coastguard Worker 37*6777b538SAndroid Build Coastguard Worker-# special handling for CJK characters: chain for later dictionary segmentation 38*6777b538SAndroid Build Coastguard Worker-$HangulSyllable $HangulSyllable {200}; 39*6777b538SAndroid Build Coastguard Worker-$KanaKanji $KanaKanji {400}; # different rule status if both kana and kanji found 40*6777b538SAndroid Build Coastguard Worker- 41*6777b538SAndroid Build Coastguard Worker # Rule 999 42*6777b538SAndroid Build Coastguard Worker # Match a single code point if no other rule applies. 43*6777b538SAndroid Build Coastguard Worker .; 44