Updated Branches: refs/heads/master 1dced2235 -> 0df8da88c
http://git-wip-us.apache.org/repos/asf/lucy/blob/0df8da88/modules/unicode/ucd/WordBreakTest.json ---------------------------------------------------------------------- diff --git a/modules/unicode/ucd/WordBreakTest.json b/modules/unicode/ucd/WordBreakTest.json index 9d3d2b9..2340c5a 100644 --- a/modules/unicode/ucd/WordBreakTest.json +++ b/modules/unicode/ucd/WordBreakTest.json @@ -104,6 +104,14 @@ ] }, { + "text" : "\u0001ð¦", + "words" : [] + }, + { + "text" : "\u0001Ìð¦", + "words" : [] + }, + { "text" : "\u0001Â", "words" : [] }, @@ -332,6 +340,14 @@ ] }, { + "text" : "\rð¦", + "words" : [] + }, + { + "text" : "\rÌð¦", + "words" : [] + }, + { "text" : "\rÂ", "words" : [] }, @@ -560,6 +576,14 @@ ] }, { + "text" : "\nð¦", + "words" : [] + }, + { + "text" : "\nÌð¦", + "words" : [] + }, + { "text" : "\nÂ", "words" : [] }, @@ -788,6 +812,14 @@ ] }, { + "text" : "\u000bð¦", + "words" : [] + }, + { + "text" : "\u000bÌð¦", + "words" : [] + }, + { "text" : "\u000bÂ", "words" : [] }, @@ -1048,6 +1080,18 @@ ] }, { + "text" : "ã±ð¦", + "words" : [ + "ã±" + ] + }, + { + "text" : "ã±Ìð¦", + "words" : [ + "ã±Ì" + ] + }, + { "text" : "ã±Â", "words" : [ "ã±Â" @@ -1332,6 +1376,18 @@ ] }, { + "text" : "Að¦", + "words" : [ + "A" + ] + }, + { + "text" : "AÌð¦", + "words" : [ + "AÌ" + ] + }, + { "text" : "AÂ", "words" : [ "AÂ" @@ -1568,6 +1624,14 @@ ] }, { + "text" : ":ð¦", + "words" : [] + }, + { + "text" : ":Ìð¦", + "words" : [] + }, + { "text" : ":Â", "words" : [] }, @@ -1796,6 +1860,14 @@ ] }, { + "text" : ",ð¦", + "words" : [] + }, + { + "text" : ",Ìð¦", + "words" : [] + }, + { "text" : ",Â", "words" : [] }, @@ -2024,6 +2096,14 @@ ] }, { + "text" : "'ð¦", + "words" : [] + }, + { + "text" : "'Ìð¦", + "words" : [] + }, + { "text" : "'Â", "words" : [] }, @@ -2282,6 +2362,18 @@ ] }, { + "text" : "0ð¦", + "words" : [ + "0" + ] + }, + { + "text" : "0Ìð¦", + "words" : [ + "0Ì" + ] + }, + { "text" : "0Â", "words" : [ "0Â" @@ -2546,6 +2638,18 @@ ] }, { + "text" : "_ð¦", + "words" : [ + "_" + ] + }, + { + "text" : "_Ìð¦", + "words" : [ + "_Ì" + ] + }, + { "text" : "_Â", "words" : [ "_Â" @@ -2678,6 +2782,242 @@ ] }, { + "text" : "ð¦\u0001", + "words" : [] + }, + { + "text" : "ð¦Ì\u0001", + "words" : [] + }, + { + "text" : "ð¦\r", + "words" : [] + }, + { + "text" : "ð¦Ì\r", + "words" : [] + }, + { + "text" : "ð¦\n", + "words" : [] + }, + { + "text" : "ð¦Ì\n", + "words" : [] + }, + { + "text" : "ð¦\u000b", + "words" : [] + }, + { + "text" : "ð¦Ì\u000b", + "words" : [] + }, + { + "text" : "ð¦ã±", + "words" : [ + "ã±" + ] + }, + { + "text" : "ð¦Ìã±", + "words" : [ + "ã±" + ] + }, + { + "text" : "ð¦A", + "words" : [ + "A" + ] + }, + { + "text" : "ð¦ÌA", + "words" : [ + "A" + ] + }, + { + "text" : "ð¦:", + "words" : [] + }, + { + "text" : "ð¦Ì:", + "words" : [] + }, + { + "text" : "ð¦,", + "words" : [] + }, + { + "text" : "ð¦Ì,", + "words" : [] + }, + { + "text" : "ð¦'", + "words" : [] + }, + { + "text" : "ð¦Ì'", + "words" : [] + }, + { + "text" : "ð¦0", + "words" : [ + "0" + ] + }, + { + "text" : "ð¦Ì0", + "words" : [ + "0" + ] + }, + { + "text" : "ð¦_", + "words" : [ + "_" + ] + }, + { + "text" : "ð¦Ì_", + "words" : [ + "_" + ] + }, + { + "text" : "ð¦ð¦", + "words" : [] + }, + { + "text" : "ð¦Ìð¦", + "words" : [] + }, + { + "text" : "ð¦Â", + "words" : [] + }, + { + "text" : "ð¦ÌÂ", + "words" : [] + }, + { + "text" : "ð¦Ì", + "words" : [] + }, + { + "text" : "ð¦ÌÌ", + "words" : [] + }, + { + "text" : "ð¦aâ ", + "words" : [ + "aâ " + ] + }, + { + "text" : "ð¦Ìaâ ", + "words" : [ + "aâ " + ] + }, + { + "text" : "ð¦a:", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦Ìa:", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦a'", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦Ìa'", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦a'â ", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦Ìa'â ", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦a,", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦Ìa,", + "words" : [ + "a" + ] + }, + { + "text" : "ð¦1:", + "words" : [ + "1" + ] + }, + { + "text" : "ð¦Ì1:", + "words" : [ + "1" + ] + }, + { + "text" : "ð¦1'", + "words" : [ + "1" + ] + }, + { + "text" : "ð¦Ì1'", + "words" : [ + "1" + ] + }, + { + "text" : "ð¦1,", + "words" : [ + "1" + ] + }, + { + "text" : "ð¦Ì1,", + "words" : [ + "1" + ] + }, + { + "text" : "ð¦1.â ", + "words" : [ + "1" + ] + }, + { + "text" : "ð¦Ì1.â ", + "words" : [ + "1" + ] + }, + { "text" : "Â\u0001", "words" : [] }, @@ -2782,6 +3122,14 @@ ] }, { + "text" : "Âð¦", + "words" : [] + }, + { + "text" : "ÂÌð¦", + "words" : [] + }, + { "text" : "ÂÂ", "words" : [] }, @@ -3010,6 +3358,14 @@ ] }, { + "text" : "Ìð¦", + "words" : [] + }, + { + "text" : "ÌÌð¦", + "words" : [] + }, + { "text" : "ÌÂ", "words" : [] }, @@ -3268,6 +3624,18 @@ ] }, { + "text" : "aâ ð¦", + "words" : [ + "aâ " + ] + }, + { + "text" : "aâ Ìð¦", + "words" : [ + "aâ Ì" + ] + }, + { "text" : "aâ Â", "words" : [ "aâ Â" @@ -3538,6 +3906,18 @@ ] }, { + "text" : "a:ð¦", + "words" : [ + "a" + ] + }, + { + "text" : "a:Ìð¦", + "words" : [ + "a" + ] + }, + { "text" : "a:Â", "words" : [ "a" @@ -3816,6 +4196,18 @@ ] }, { + "text" : "a'ð¦", + "words" : [ + "a" + ] + }, + { + "text" : "a'Ìð¦", + "words" : [ + "a" + ] + }, + { "text" : "a'Â", "words" : [ "a" @@ -4094,6 +4486,18 @@ ] }, { + "text" : "a'â ð¦", + "words" : [ + "a" + ] + }, + { + "text" : "a'â Ìð¦", + "words" : [ + "a" + ] + }, + { "text" : "a'â Â", "words" : [ "a" @@ -4374,6 +4778,18 @@ ] }, { + "text" : "a,ð¦", + "words" : [ + "a" + ] + }, + { + "text" : "a,Ìð¦", + "words" : [ + "a" + ] + }, + { "text" : "a,Â", "words" : [ "a" @@ -4664,6 +5080,18 @@ ] }, { + "text" : "1:ð¦", + "words" : [ + "1" + ] + }, + { + "text" : "1:Ìð¦", + "words" : [ + "1" + ] + }, + { "text" : "1:Â", "words" : [ "1" @@ -4952,6 +5380,18 @@ ] }, { + "text" : "1'ð¦", + "words" : [ + "1" + ] + }, + { + "text" : "1'Ìð¦", + "words" : [ + "1" + ] + }, + { "text" : "1'Â", "words" : [ "1" @@ -5232,6 +5672,18 @@ ] }, { + "text" : "1,ð¦", + "words" : [ + "1" + ] + }, + { + "text" : "1,Ìð¦", + "words" : [ + "1" + ] + }, + { "text" : "1,Â", "words" : [ "1" @@ -5512,6 +5964,18 @@ ] }, { + "text" : "1.â ð¦", + "words" : [ + "1" + ] + }, + { + "text" : "1.â Ìð¦", + "words" : [ + "1" + ] + }, + { "text" : "1.â Â", "words" : [ "1" @@ -5716,5 +6180,52 @@ "words" : [ "3â aâ â " ] + }, + { + "text" : "að¦b", + "words" : [ + "a", + "b" + ] + }, + { + "text" : "ð·ðº", + "words" : [] + }, + { + "text" : "ð·ðºð¸", + "words" : [] + }, + { + "text" : "ð·ðºð¸ðª", + "words" : [] + }, + { + "text" : "ð·ðºâð¸ðª", + "words" : [] + }, + { + "text" : "ð¦ð§ð¨", + "words" : [] + }, + { + "text" : "ð¦âð§ð¨", + "words" : [] + }, + { + "text" : "ð¦ð§âð¨", + "words" : [] + }, + { + "text" : " âÙ", + "words" : [ + "Ù" + ] + }, + { + "text" : "Ùâ ", + "words" : [ + "Ùâ" + ] } ]
