2 # Copyright (C) 2002-2010, International Business Machines Corporation and others.
7 # ICU Character Break Rules, also known as Grapheme Cluster Boundaries
8 # See Unicode Standard Annex #29.
9 # These rules are based on TR29 Revision 16, for Unicode Version 6.0
13 # Character Class Definitions.
# Each class below is the set of code points that carry the named value of the
# Unicode Grapheme_Cluster_Break property.
15 $CR = [\p{Grapheme_Cluster_Break = CR}];
16 $LF = [\p{Grapheme_Cluster_Break = LF}];
17 $Control = [\p{Grapheme_Cluster_Break = Control}];
# $Extend is tailored: in addition to the property value it also contains
# U+0E33 (THAI CHARACTER SARA AM) and U+0EB3 (LAO VOWEL SIGN AM), so every rule
# that refers to $Extend applies to those two characters as well.
# The union is written by juxtaposing the two sets. UnicodeSet patterns have no
# '+' operator; an unescaped '+' inside the brackets is taken as the literal
# character U+002B and would silently become a member of $Extend.
18 $Extend = [\p{Grapheme_Cluster_Break = Extend} [\u0E33 \u0EB3]];
21 # Korean Syllable Definitions
# Hangul syllable pieces, each selected by its Grapheme_Cluster_Break property
# value. In UAX #29 these values denote:
#   L   - leading consonant jamo
#   V   - vowel jamo
#   T   - trailing consonant jamo
#   LV  - precomposed syllable made of a leading consonant and a vowel
#   LVT - precomposed syllable made of a leading consonant, a vowel and a
#         trailing consonant
23 $L = [\p{Grapheme_Cluster_Break = L}];
24 $V = [\p{Grapheme_Cluster_Break = V}];
25 $T = [\p{Grapheme_Cluster_Break = T}];
27 $LV = [\p{Grapheme_Cluster_Break = LV}];
28 $LVT = [\p{Grapheme_Cluster_Break = LVT}];
31 ## -------------------------------------------------
# NOTE(review): presumably these belong to the forward rule set; the section
# directive is not visible in this excerpt - confirm against the full file.
#
# Matches a $L character followed by a $L, $V, $LV or $LVT character as one
# sequence.
38 $L ($L | $V | $LV | $LVT);
# Matches any character that is not in $Control, $CR or $LF, followed by a
# $Extend character, as one sequence.
42 [^$Control $CR $LF] $Extend;
44 ## -------------------------------------------------
# NOTE(review): presumably these belong to the reverse rule set (the operands
# appear in the opposite order to the rules earlier in the file); the section
# directive is not visible in this excerpt - confirm against the full file.
#
# Matches a $L, $V, $LV or $LVT character followed by a $L character.
48 ($L | $V | $LV | $LVT) $L;
# Matches a $Extend character followed by any character that is not in
# $Control, $CR or $LF.
52 $Extend [^$Control $CR $LF];
55 ## -------------------------------------------------
60 ## -------------------------------------------------