xref: /aosp_15_r20/external/cronet/third_party/icu/cast/brkitr.patch (revision 6777b5387eb2ff775bb5750e3f5d96f37fb7352b)
1*6777b538SAndroid Build Coastguard Workerdiff --git a/source/data/brkitr/ja.txt b/source/data/brkitr/ja.txt
2*6777b538SAndroid Build Coastguard Workerindex 363a74f6..7ae4b8f6 100644
3*6777b538SAndroid Build Coastguard Worker--- a/source/data/brkitr/ja.txt
4*6777b538SAndroid Build Coastguard Worker+++ b/source/data/brkitr/ja.txt
5*6777b538SAndroid Build Coastguard Worker@@ -11,6 +11,7 @@ ja{
6*6777b538SAndroid Build Coastguard Worker         line_phrase:process(dependency){"line_phrase_cj.brk"}
7*6777b538SAndroid Build Coastguard Worker         line_strict:process(dependency){"line.brk"}
8*6777b538SAndroid Build Coastguard Worker         line_strict_phrase:process(dependency){"line_phrase_cj.brk"}
9*6777b538SAndroid Build Coastguard Worker+        word:process(dependency){"word_ja.brk"}
10*6777b538SAndroid Build Coastguard Worker     }
11*6777b538SAndroid Build Coastguard Worker     extensions{
12*6777b538SAndroid Build Coastguard Worker     }
13*6777b538SAndroid Build Coastguard Workerdiff --git a/source/data/brkitr/rules/word.txt b/source/data/brkitr/rules/word.txt
14*6777b538SAndroid Build Coastguard Workerindex b4603823..58c18cbc 100644
15*6777b538SAndroid Build Coastguard Worker--- a/source/data/brkitr/rules/word.txt
16*6777b538SAndroid Build Coastguard Worker+++ b/source/data/brkitr/rules/word.txt
17*6777b538SAndroid Build Coastguard Worker@@ -84,13 +84,11 @@ $Control        = [\p{Grapheme_Cluster_Break = Control}];
18*6777b538SAndroid Build Coastguard Worker $HangulSyllable = [\uac00-\ud7a3];
19*6777b538SAndroid Build Coastguard Worker $ComplexContext = [:LineBreak = Complex_Context:];
20*6777b538SAndroid Build Coastguard Worker $KanaKanji      = [$Han $Hiragana $Katakana];
21*6777b538SAndroid Build Coastguard Worker-$dictionaryCJK  = [$KanaKanji $HangulSyllable];
22*6777b538SAndroid Build Coastguard Worker-$dictionary     = [$ComplexContext $dictionaryCJK];
23*6777b538SAndroid Build Coastguard Worker+$dictionary     = [$ComplexContext];
24*6777b538SAndroid Build Coastguard Worker
25*6777b538SAndroid Build Coastguard Worker # TODO: check if handling of katakana in dictionary makes rules incorrect/void
26*6777b538SAndroid Build Coastguard Worker
27*6777b538SAndroid Build Coastguard Worker-# leave CJK scripts out of ALetterPlus
28*6777b538SAndroid Build Coastguard Worker-$ALetterPlus  = [$ALetter-$dictionaryCJK [$ComplexContext-$Extend-$Control]];
29*6777b538SAndroid Build Coastguard Worker+$ALetterPlus  = [$ALetter [$ComplexContext-$Extend-$Control]];
30*6777b538SAndroid Build Coastguard Worker
31*6777b538SAndroid Build Coastguard Worker
32*6777b538SAndroid Build Coastguard Worker ## -------------------------------------------------
33*6777b538SAndroid Build Coastguard Worker@@ -185,10 +183,6 @@ $ExtendNumLet  $ExFm* $Katakana     {400};    #  (13b)
34*6777b538SAndroid Build Coastguard Worker #
35*6777b538SAndroid Build Coastguard Worker ^$Regional_Indicator $ExFm* $Regional_Indicator;
36*6777b538SAndroid Build Coastguard Worker
37*6777b538SAndroid Build Coastguard Worker-# special handling for CJK characters: chain for later dictionary segmentation
38*6777b538SAndroid Build Coastguard Worker-$HangulSyllable $HangulSyllable {200};
39*6777b538SAndroid Build Coastguard Worker-$KanaKanji $KanaKanji {400}; # different rule status if both kana and kanji found
40*6777b538SAndroid Build Coastguard Worker-
41*6777b538SAndroid Build Coastguard Worker # Rule 999
42*6777b538SAndroid Build Coastguard Worker #     Match a single code point if no other rule applies.
43*6777b538SAndroid Build Coastguard Worker .;
44