]> git.saurik.com Git - apple/icu.git/blobdiff - icuSources/data/unidata/base_unidata/LineBreak.txt
ICU-461.12.tar.gz
[apple/icu.git] / icuSources / data / unidata / base_unidata / LineBreak.txt
index e28f360cdedab2c85e07d4965884291cb3ea94b8..ad45076d5b80b9d4b6e3b8bc1dcef38fb37a4dff 100644 (file)
@@ -1,5 +1,5 @@
-# LineBreak-5.1.0.txt
-# Date: 2007-12-10, 16:24:00 PST [KW]
+# LineBreak-6.0.0.txt
+# Date: 2010-08-18, 17:25:00 PDT [KW]
 #
 # Line Break Properties
 #
@@ -7,7 +7,7 @@
 # Unicode Character Database.
 # It contains both normative and informative data.
 #
-# Copyright (c) 1991-2007 Unicode, Inc.
+# Copyright (c) 1991-2010 Unicode, Inc.
 # For terms of use, see http://www.unicode.org/terms_of_use.html
 #
 # The format is two fields separated by a semicolon.
 #         "BK", "CR", "LF", "CM", "SG", "GL", "CB", "SP", "ZW",
 #         "NL", "WJ", "JL", "JV", "JT", "H2", "H3"
 #   Informative:
-#         "XX", "OP", "CL", "QU", "NS", "EX", "SY",
+#         "XX", "OP", "CL", "CP", "QU", "NS", "EX", "SY",
 #         "IS", "PR", "PO", "NU", "AL", "ID", "IN", "HY",
 #         "BB", "BA", "SA", "AI", "B2"
-#  - All code points, assigned and unassigned, that are not listed 
+#  - All code points, assigned and unassigned, that are not listed
 #         explicitly are given the value "XX".
+# The unassigned code points that default to "ID" include ranges in the
+# following blocks:
+#     CJK Unified Ideographs Extension A:       U+3400..U+4DBF
+#     CJK Unified Ideographs:                   U+4E00..U+9FFF
+#     CJK Compatibility Ideographs:             U+F900..U+FAFF
+#     CJK Unified Ideographs Extension B:      U+20000..U+2A6DF
+#     CJK Unified Ideographs Extension C:      U+2A700..U+2B73F
+#     CJK Unified Ideographs Extension D:      U+2B740..U+2B81F
+#     CJK Compatibility Ideographs Supplement: U+2F800..U+2FA1F
+#     and any other reserved code points on
+#         Planes 2 and 3:                      U+20000..U+2FFFD
+#                                              U+30000..U+3FFFD
 #  - Characters ranges are specified as for other property files in
 #         the Unicode Character Database.
 #
 # The Unicode name of each character is provided in a comment for help
 # in identifying the characters.
 #
-# See UAX #14: Line Breaking Properties, for more information
+# See UAX #14: Unicode Line Breaking Algorithm, for more information
 #
 # @missing: 0000..10FFFF; XX
 0000..0008;CM
@@ -46,7 +58,7 @@
 0026;AL
 0027;QU
 0028;OP
-0029;CL
+0029;CP
 002A;AL
 002B;PR
 002C;IS
@@ -60,7 +72,7 @@
 0040..005A;AL
 005B;OP
 005C;PR
-005D;CL
+005D;CP
 005E..007A;AL
 007B;OP
 007C;BA
 038E..03A1;AL
 03A3..0482;AL
 0483..0489;CM
-048A..0523;AL
+048A..0527;AL
 0531..0556;AL
 0559..055F;AL
 0561..0587;AL
 0610..061A;CM
 061B;EX
 061E..061F;EX
-0621..064A;AL
-064B..065E;CM
+0620..064A;AL
+064B..065F;CM
 0660..0669;NU
 066A;PO
 066B..066C;NU
 06D4;EX
 06D5;AL
 06D6..06DC;CM
-06DD;AL
-06DE..06E4;CM
+06DD..06DE;AL
+06DF..06E4;CM
 06E5..06E6;AL
 06E7..06E8;CM
 06E9;AL
 07F8;IS
 07F9;EX
 07FA;AL
-0901..0903;CM
+0800..0815;AL
+0816..0819;CM
+081A;AL
+081B..0823;CM
+0824;AL
+0825..0827;CM
+0828;AL
+0829..082D;CM
+0830..083E;AL
+0840..0858;AL
+0859..085B;CM
+085E;AL
+0900..0903;CM
 0904..0939;AL
-093C;CM
+093A..093C;CM
 093D;AL
-093E..094D;CM
+093E..094F;CM
 0950;AL
-0951..0954;CM
+0951..0957;CM
 0958..0961;AL
 0962..0963;CM
 0964..0965;BA
 0966..096F;NU
-0970..0972;AL
-097B..097F;AL
+0970..0977;AL
+0979..097F;AL
 0981..0983;CM
 0985..098C;AL
 098F..0990;AL
 09E2..09E3;CM
 09E6..09EF;NU
 09F0..09F1;AL
-09F2..09F3;PR
-09F4..09FA;AL
+09F2..09F3;PO
+09F4..09F8;AL
+09F9;PO
+09FA;AL
+09FB;PR
 0A01..0A03;CM
 0A05..0A0A;AL
 0A0F..0A10;AL
 0B5F..0B61;AL
 0B62..0B63;CM
 0B66..0B6F;NU
-0B70..0B71;AL
+0B70..0B77;AL
 0B82;CM
 0B83;AL
 0B85..0B8A;AL
 0D02..0D03;CM
 0D05..0D0C;AL
 0D0E..0D10;AL
-0D12..0D28;AL
-0D2A..0D39;AL
+0D12..0D3A;AL
 0D3D;AL
 0D3E..0D44;CM
 0D46..0D48;CM
 0D4A..0D4D;CM
+0D4E;AL
 0D57;CM
 0D60..0D61;AL
 0D62..0D63;CM
 0F80..0F84;CM
 0F85;BA
 0F86..0F87;CM
-0F88..0F8B;AL
-0F90..0F97;CM
+0F88..0F8C;AL
+0F8D..0F97;CM
 0F99..0FBC;CM
 0FBE..0FBF;BA
 0FC0..0FC5;AL
 0FD0..0FD1;BB
 0FD2;BA
 0FD3;BB
-0FD4;AL
+0FD4..0FD8;AL
+0FD9..0FDA;GL
 1000..103F;SA
 1040..1049;NU
 104A..104B;BA
 104C..104F;AL
 1050..108F;SA
 1090..1099;NU
-109E..109F;SA
+109A..109F;SA
 10A0..10C5;AL
 10D0..10FC;AL
-1100..1159;JL
-115F;JL
-1160..11A2;JV
-11A8..11F9;JT
+1100..115F;JL
+1160..11A7;JV
+11A8..11FF;JT
 1200..1248;AL
 124A..124D;AL
 1250..1256;AL
 12D8..1310;AL
 1312..1315;AL
 1318..135A;AL
-135F;CM
+135D..135F;CM
 1360;AL
 1361;BA
 1362..137C;AL
 1380..1399;AL
 13A0..13F4;AL
-1401..1676;AL
+1400;BA
+1401..167F;AL
 1680;BA
 1681..169A;AL
 169B;OP
 1880..18A8;AL
 18A9;CM
 18AA;AL
+18B0..18F5;AL
 1900..191C;AL
 1920..192B;CM
 1930..193B;CM
 1946..194F;NU
 1950..196D;SA
 1970..1974;SA
-1980..19A9;SA
+1980..19AB;SA
 19B0..19C9;SA
 19D0..19D9;NU
+19DA;SA
 19DE..19DF;SA
 19E0..1A16;AL
 1A17..1A1B;CM
 1A1E..1A1F;AL
+1A20..1A5E;SA
+1A60..1A7C;SA
+1A7F;CM
+1A80..1A89;NU
+1A90..1A99;NU
+1AA0..1AAD;SA
 1B00..1B04;CM
 1B05..1B33;AL
 1B34..1B44;CM
 1B45..1B4B;AL
 1B50..1B59;NU
-1B5A..1B60;BA
+1B5A..1B5B;BA
+1B5C;AL
+1B5D..1B60;BA
 1B61..1B6A;AL
 1B6B..1B73;CM
 1B74..1B7C;AL
 1BA1..1BAA;CM
 1BAE..1BAF;AL
 1BB0..1BB9;NU
-1C00..1C23;AL
+1BC0..1BE5;AL
+1BE6..1BF3;CM
+1BFC..1C23;AL
 1C24..1C37;CM
 1C3B..1C3F;BA
 1C40..1C49;NU
 1C50..1C59;NU
 1C5A..1C7D;AL
 1C7E..1C7F;BA
+1CD0..1CD2;CM
+1CD3;AL
+1CD4..1CE8;CM
+1CE9..1CEC;AL
+1CED;CM
+1CEE..1CF1;AL
+1CF2;CM
 1D00..1DBF;AL
 1DC0..1DE6;CM
-1DFE..1DFF;CM
+1DFC..1DFF;CM
 1E00..1F15;AL
 1F18..1F1D;AL
 1F20..1F45;AL
 2085..208C;AL
 208D;OP
 208E;CL
-2090..2094;AL
+2090..209C;AL
 20A0..20A6;PR
 20A7;PO
 20A8..20B5;PR
+20B6;PO
+20B7..20B9;PR
 20D0..20F0;CM
 2100..2102;AL
 2103;PO
 2121..2122;AI
 2123..212A;AL
 212B;AI
-212C..214F;AL
-2153;AL
+212C..2153;AL
 2154..2155;AI
 2156..215A;AL
 215B;AI
 216C..216F;AL
 2170..2179;AI
 217A..2188;AL
+2189;AI
 2190..2199;AI
 219A..21D1;AL
 21D2;AI
 2313..2328;AL
 2329;OP
 232A;CL
-232B..23E7;AL
+232B..23F3;AL
 2400..2426;AL
 2440..244A;AL
 2460..24FE;AI
 266E;AL
 266F;AI
 2670..269D;AL
-26A0..26BC;AL
+269E..269F;AI
+26A0..26BD;AL
+26BE..26BF;AI
 26C0..26C3;AL
-2701..2704;AL
-2706..2709;AL
-270C..2727;AL
-2729..274B;AL
-274D;AL
-274F..2752;AL
-2756;AL
+26C4..26CD;AI
+26CE;AL
+26CF..26E1;AI
+26E2;AL
+26E3;AI
+26E4..26E7;AL
+26E8..26FF;AI
+2701..2756;AL
+2757;AI
 2758..275A;AL
 275B..275E;QU
-2761;AL
+275F..2761;AL
 2762..2763;EX
 2764..2767;AL
 2768;OP
 2774;OP
 2775;CL
 2776..2793;AI
-2794;AL
-2798..27AF;AL
-27B1..27BE;AL
-27C0..27C4;AL
+2794..27C4;AL
 27C5;OP
 27C6;CL
 27C7..27CA;AL
 27CC;AL
-27D0..27E5;AL
+27CE..27E5;AL
 27E6;OP
 27E7;CL
 27E8;OP
 29FD;CL
 29FE..2B4C;AL
 2B50..2B54;AL
+2B55..2B59;AI
 2C00..2C2E;AL
 2C30..2C5E;AL
-2C60..2C6F;AL
-2C71..2C7D;AL
-2C80..2CEA;AL
+2C60..2CEE;AL
+2CEF..2CF1;CM
 2CF9;EX
 2CFA..2CFC;BA
 2CFD;AL
 2D00..2D25;AL
 2D30..2D65;AL
 2D6F;AL
+2D70;BA
+2D7F;CM
 2D80..2D96;AL
 2DA0..2DA6;AL
 2DA8..2DAE;AL
 2E2A..2E2D;BA
 2E2E;EX
 2E2F;AL
-2E30;BA
+2E30..2E31;BA
 2E80..2E99;ID
 2E9B..2EF3;ID
 2F00..2FD5;ID
 30FF;ID
 3105..312D;ID
 3131..318E;ID
-3190..31B7;ID
+3190..31BA;ID
 31C0..31E3;ID
 31F0..31FF;NS
 3200..321E;ID
-3220..3243;ID
+3220..3247;ID
+3248..324F;AI
 3250..32FE;ID
 3300..33FF;ID
 3400..4DB5;ID
+4DB6..4DBF;ID
 4DC0..4DFF;AL
-4E00..9FC3;ID
+4E00..9FCB;ID
+9FCC..9FFF;ID
 A000..A014;ID
 A015;NS
 A016..A48C;ID
 A490..A4C6;ID
+A4D0..A4FD;AL
+A4FE..A4FF;BA
 A500..A60C;AL
 A60D;BA
 A60E;EX
@@ -1003,14 +1060,19 @@ A60F;BA
 A610..A61F;AL
 A620..A629;NU
 A62A..A62B;AL
-A640..A65F;AL
-A662..A66E;AL
+A640..A66E;AL
 A66F..A672;CM
 A673;AL
 A67C..A67D;CM
 A67E..A697;AL
-A700..A78C;AL
-A7FB..A801;AL
+A6A0..A6EF;AL
+A6F0..A6F1;CM
+A6F2;AL
+A6F3..A6F7;BA
+A700..A78E;AL
+A790..A791;AL
+A7A0..A7A9;AL
+A7FA..A801;AL
 A802;CM
 A803..A805;AL
 A806;CM
@@ -1019,6 +1081,9 @@ A80B;CM
 A80C..A822;AL
 A823..A827;CM
 A828..A82B;AL
+A830..A837;AL
+A838;PO
+A839;AL
 A840..A873;AL
 A874..A875;BB
 A876..A877;EX
@@ -1027,6 +1092,8 @@ A882..A8B3;AL
 A8B4..A8C4;CM
 A8CE..A8CF;BA
 A8D0..A8D9;NU
+A8E0..A8F1;CM
+A8F2..A8FB;AL
 A900..A909;NU
 A90A..A925;AL
 A926..A92D;CM
@@ -1034,6 +1101,16 @@ A92E..A92F;BA
 A930..A946;AL
 A947..A953;CM
 A95F;AL
+A960..A97C;JL
+A980..A983;CM
+A984..A9B2;AL
+A9B3..A9C0;CM
+A9C1..A9C6;AL
+A9C7..A9C9;BA
+A9CA..A9CD;AL
+A9CF;AL
+A9D0..A9D9;NU
+A9DE..A9DF;AL
 AA00..AA28;AL
 AA29..AA36;CM
 AA40..AA42;AL
@@ -1043,6 +1120,19 @@ AA4C..AA4D;CM
 AA50..AA59;NU
 AA5C;AL
 AA5D..AA5F;BA
+AA60..AA7B;SA
+AA80..AAC2;SA
+AADB..AADF;SA
+AB01..AB06;AL
+AB09..AB0E;AL
+AB11..AB16;AL
+AB20..AB26;AL
+AB28..AB2E;AL
+ABC0..ABE2;AL
+ABE3..ABEA;CM
+ABEB;BA
+ABEC..ABED;CM
+ABF0..ABF9;NU
 AC00;H2
 AC01..AC1B;H3
 AC1C;H2
@@ -1841,13 +1931,18 @@ D76C;H2
 D76D..D787;H3
 D788;H2
 D789..D7A3;H3
+D7B0..D7C6;JV
+D7CB..D7FB;JT
 D800..DB7F;SG
 DB80..DBFF;SG
 DC00..DFFF;SG
 E000..F8FF;XX
 F900..FA2D;ID
-FA30..FA6A;ID
+FA2E..FA2F;ID
+FA30..FA6D;ID
+FA6E..FA6F;ID
 FA70..FAD9;ID
+FADA..FAFF;ID
 FB00..FB06;AL
 FB13..FB17;AL
 FB1D;AL
@@ -1857,7 +1952,7 @@ FB38..FB3C;AL
 FB3E;AL
 FB40..FB41;AL
 FB43..FB44;AL
-FB46..FBB1;AL
+FB46..FBC1;AL
 FBD3..FD3D;AL
 FD3E;OP
 FD3F;CL
@@ -1993,8 +2088,10 @@ FFFD;AI
 1080A..10835;AL
 10837..10838;AL
 1083C;AL
-1083F;AL
-10900..10919;AL
+1083F..10855;AL
+10857;BA
+10858..1085F;AL
+10900..1091B;AL
 1091F;BA
 10920..10939;AL
 1093F;AL
@@ -2010,9 +2107,45 @@ FFFD;AI
 10A40..10A47;AL
 10A50..10A57;BA
 10A58;AL
+10A60..10A7F;AL
+10B00..10B35;AL
+10B39..10B3F;BA
+10B40..10B55;AL
+10B58..10B72;AL
+10B78..10B7F;AL
+10C00..10C48;AL
+10E60..10E7E;AL
+11000..11002;CM
+11003..11037;AL
+11038..11046;CM
+11047..11048;BA
+11049..1104D;AL
+11052..11065;AL
+11066..1106F;NU
+11080..11082;CM
+11083..110AF;AL
+110B0..110BA;CM
+110BB..110BD;AL
+110BE..110C1;BA
 12000..1236E;AL
 12400..12462;AL
 12470..12473;BA
+13000..13257;AL
+13258..1325A;OP
+1325B..1325D;CL
+1325E..13281;AL
+13282;CL
+13283..13285;AL
+13286;OP
+13287;CL
+13288;OP
+13289;CL
+1328A..13378;AL
+13379;OP
+1337A..1337B;CL
+1337C..1342E;AL
+16800..16A38;AL
+1B000..1B001;ID
 1D000..1D0F5;AL
 1D100..1D126;AL
 1D129..1D164;AL
@@ -2052,8 +2185,57 @@ FFFD;AI
 1D7CE..1D7FF;NU
 1F000..1F02B;AL
 1F030..1F093;AL
+1F0A0..1F0AE;AL
+1F0B1..1F0BE;AL
+1F0C1..1F0CF;AL
+1F0D1..1F0DF;AL
+1F100..1F10A;AI
+1F110..1F12D;AI
+1F12E;AL
+1F130..1F169;AI
+1F170..1F19A;AI
+1F1E6..1F1FF;AL
+1F200..1F202;ID
+1F210..1F23A;ID
+1F240..1F248;ID
+1F250..1F251;ID
+1F300..1F320;AL
+1F330..1F335;AL
+1F337..1F37C;AL
+1F380..1F393;AL
+1F3A0..1F3C4;AL
+1F3C6..1F3CA;AL
+1F3E0..1F3F0;AL
+1F400..1F43E;AL
+1F440;AL
+1F442..1F4F7;AL
+1F4F9..1F4FC;AL
+1F500..1F53D;AL
+1F550..1F567;AL
+1F5FB..1F5FF;AL
+1F601..1F610;AL
+1F612..1F614;AL
+1F616;AL
+1F618;AL
+1F61A;AL
+1F61C..1F61E;AL
+1F620..1F625;AL
+1F628..1F62B;AL
+1F62D;AL
+1F630..1F633;AL
+1F635..1F640;AL
+1F645..1F64F;AL
+1F680..1F6C5;AL
+1F700..1F773;AL
 20000..2A6D6;ID
+2A6D7..2A6FF;ID
+2A700..2B734;ID
+2B735..2B73F;ID
+2B740..2B81D;ID
+2B81E..2F7FF;ID
 2F800..2FA1D;ID
+2FA1E..2FFFD;ID
+30000..3FFFD;ID
 E0001;CM
 E0020..E007F;CM
 E0100..E01EF;CM