Updated Branches:
  refs/heads/master 1dced2235 -> 0df8da88c

http://git-wip-us.apache.org/repos/asf/lucy/blob/0df8da88/modules/unicode/ucd/WordBreakTest.json
----------------------------------------------------------------------
diff --git a/modules/unicode/ucd/WordBreakTest.json 
b/modules/unicode/ucd/WordBreakTest.json
index 9d3d2b9..2340c5a 100644
--- a/modules/unicode/ucd/WordBreakTest.json
+++ b/modules/unicode/ucd/WordBreakTest.json
@@ -104,6 +104,14 @@
       ]
    },
    {
+      "text" : "\u0001🇦",
+      "words" : []
+   },
+   {
+      "text" : "\u0001̈🇦",
+      "words" : []
+   },
+   {
       "text" : "\u0001­",
       "words" : []
    },
@@ -332,6 +340,14 @@
       ]
    },
    {
+      "text" : "\r🇦",
+      "words" : []
+   },
+   {
+      "text" : "\r̈🇦",
+      "words" : []
+   },
+   {
       "text" : "\r­",
       "words" : []
    },
@@ -560,6 +576,14 @@
       ]
    },
    {
+      "text" : "\n🇦",
+      "words" : []
+   },
+   {
+      "text" : "\n̈🇦",
+      "words" : []
+   },
+   {
       "text" : "\n­",
       "words" : []
    },
@@ -788,6 +812,14 @@
       ]
    },
    {
+      "text" : "\u000b🇦",
+      "words" : []
+   },
+   {
+      "text" : "\u000b̈🇦",
+      "words" : []
+   },
+   {
       "text" : "\u000b­",
       "words" : []
    },
@@ -1048,6 +1080,18 @@
       ]
    },
    {
+      "text" : "〱🇦",
+      "words" : [
+         "〱"
+      ]
+   },
+   {
+      "text" : "〱̈🇦",
+      "words" : [
+         "〱̈"
+      ]
+   },
+   {
       "text" : "〱­",
       "words" : [
          "〱­"
@@ -1332,6 +1376,18 @@
       ]
    },
    {
+      "text" : "A🇦",
+      "words" : [
+         "A"
+      ]
+   },
+   {
+      "text" : "Ä🇦",
+      "words" : [
+         "Ä"
+      ]
+   },
+   {
       "text" : "A­",
       "words" : [
          "A­"
@@ -1568,6 +1624,14 @@
       ]
    },
    {
+      "text" : ":🇦",
+      "words" : []
+   },
+   {
+      "text" : ":̈🇦",
+      "words" : []
+   },
+   {
       "text" : ":­",
       "words" : []
    },
@@ -1796,6 +1860,14 @@
       ]
    },
    {
+      "text" : ",🇦",
+      "words" : []
+   },
+   {
+      "text" : ",̈🇦",
+      "words" : []
+   },
+   {
       "text" : ",­",
       "words" : []
    },
@@ -2024,6 +2096,14 @@
       ]
    },
    {
+      "text" : "'🇦",
+      "words" : []
+   },
+   {
+      "text" : "'̈🇦",
+      "words" : []
+   },
+   {
       "text" : "'­",
       "words" : []
    },
@@ -2282,6 +2362,18 @@
       ]
    },
    {
+      "text" : "0🇦",
+      "words" : [
+         "0"
+      ]
+   },
+   {
+      "text" : "0̈🇦",
+      "words" : [
+         "0̈"
+      ]
+   },
+   {
       "text" : "0­",
       "words" : [
          "0­"
@@ -2546,6 +2638,18 @@
       ]
    },
    {
+      "text" : "_🇦",
+      "words" : [
+         "_"
+      ]
+   },
+   {
+      "text" : "_̈🇦",
+      "words" : [
+         "_̈"
+      ]
+   },
+   {
       "text" : "_­",
       "words" : [
          "_­"
@@ -2678,6 +2782,242 @@
       ]
    },
    {
+      "text" : "🇦\u0001",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈\u0001",
+      "words" : []
+   },
+   {
+      "text" : "🇦\r",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈\r",
+      "words" : []
+   },
+   {
+      "text" : "🇦\n",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈\n",
+      "words" : []
+   },
+   {
+      "text" : "🇦\u000b",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈\u000b",
+      "words" : []
+   },
+   {
+      "text" : "🇦〱",
+      "words" : [
+         "〱"
+      ]
+   },
+   {
+      "text" : "🇦̈〱",
+      "words" : [
+         "〱"
+      ]
+   },
+   {
+      "text" : "🇦A",
+      "words" : [
+         "A"
+      ]
+   },
+   {
+      "text" : "🇦̈A",
+      "words" : [
+         "A"
+      ]
+   },
+   {
+      "text" : "🇦:",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈:",
+      "words" : []
+   },
+   {
+      "text" : "🇦,",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈,",
+      "words" : []
+   },
+   {
+      "text" : "🇦'",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈'",
+      "words" : []
+   },
+   {
+      "text" : "🇦0",
+      "words" : [
+         "0"
+      ]
+   },
+   {
+      "text" : "🇦̈0",
+      "words" : [
+         "0"
+      ]
+   },
+   {
+      "text" : "🇦_",
+      "words" : [
+         "_"
+      ]
+   },
+   {
+      "text" : "🇦̈_",
+      "words" : [
+         "_"
+      ]
+   },
+   {
+      "text" : "🇦🇦",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈🇦",
+      "words" : []
+   },
+   {
+      "text" : "🇦­",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈­",
+      "words" : []
+   },
+   {
+      "text" : "🇦̀",
+      "words" : []
+   },
+   {
+      "text" : "🇦̈̀",
+      "words" : []
+   },
+   {
+      "text" : "🇦a⁠",
+      "words" : [
+         "a⁠"
+      ]
+   },
+   {
+      "text" : "🇦̈a⁠",
+      "words" : [
+         "a⁠"
+      ]
+   },
+   {
+      "text" : "🇦a:",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦̈a:",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦a'",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦̈a'",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦a'⁠",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦̈a'⁠",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦a,",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦̈a,",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "🇦1:",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "🇦̈1:",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "🇦1'",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "🇦̈1'",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "🇦1,",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "🇦̈1,",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "🇦1.⁠",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "🇦̈1.⁠",
+      "words" : [
+         "1"
+      ]
+   },
+   {
       "text" : "­\u0001",
       "words" : []
    },
@@ -2782,6 +3122,14 @@
       ]
    },
    {
+      "text" : "­🇦",
+      "words" : []
+   },
+   {
+      "text" : "­̈🇦",
+      "words" : []
+   },
+   {
       "text" : "­­",
       "words" : []
    },
@@ -3010,6 +3358,14 @@
       ]
    },
    {
+      "text" : "̀🇦",
+      "words" : []
+   },
+   {
+      "text" : "̀̈🇦",
+      "words" : []
+   },
+   {
       "text" : "̀­",
       "words" : []
    },
@@ -3268,6 +3624,18 @@
       ]
    },
    {
+      "text" : "a⁠🇦",
+      "words" : [
+         "a⁠"
+      ]
+   },
+   {
+      "text" : "a⁠̈🇦",
+      "words" : [
+         "a⁠̈"
+      ]
+   },
+   {
       "text" : "a⁠­",
       "words" : [
          "a⁠­"
@@ -3538,6 +3906,18 @@
       ]
    },
    {
+      "text" : "a:🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "a:̈🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
       "text" : "a:­",
       "words" : [
          "a"
@@ -3816,6 +4196,18 @@
       ]
    },
    {
+      "text" : "a'🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "a'̈🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
       "text" : "a'­",
       "words" : [
          "a"
@@ -4094,6 +4486,18 @@
       ]
    },
    {
+      "text" : "a'⁠🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "a'⁠̈🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
       "text" : "a'⁠­",
       "words" : [
          "a"
@@ -4374,6 +4778,18 @@
       ]
    },
    {
+      "text" : "a,🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
+      "text" : "a,̈🇦",
+      "words" : [
+         "a"
+      ]
+   },
+   {
       "text" : "a,­",
       "words" : [
          "a"
@@ -4664,6 +5080,18 @@
       ]
    },
    {
+      "text" : "1:🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "1:̈🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
       "text" : "1:­",
       "words" : [
          "1"
@@ -4952,6 +5380,18 @@
       ]
    },
    {
+      "text" : "1'🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "1'̈🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
       "text" : "1'­",
       "words" : [
          "1"
@@ -5232,6 +5672,18 @@
       ]
    },
    {
+      "text" : "1,🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "1,̈🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
       "text" : "1,­",
       "words" : [
          "1"
@@ -5512,6 +5964,18 @@
       ]
    },
    {
+      "text" : "1.⁠🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
+      "text" : "1.⁠̈🇦",
+      "words" : [
+         "1"
+      ]
+   },
+   {
       "text" : "1.⁠­",
       "words" : [
          "1"
@@ -5716,5 +6180,52 @@
       "words" : [
          "3⁠a⁠⁠"
       ]
+   },
+   {
+      "text" : "a🇦b",
+      "words" : [
+         "a",
+         "b"
+      ]
+   },
+   {
+      "text" : "🇷🇺",
+      "words" : []
+   },
+   {
+      "text" : "🇷🇺🇸",
+      "words" : []
+   },
+   {
+      "text" : "🇷🇺🇸🇪",
+      "words" : []
+   },
+   {
+      "text" : "🇷🇺​🇸🇪",
+      "words" : []
+   },
+   {
+      "text" : "🇦🇧🇨",
+      "words" : []
+   },
+   {
+      "text" : "🇦‍🇧🇨",
+      "words" : []
+   },
+   {
+      "text" : "🇦🇧‍🇨",
+      "words" : []
+   },
+   {
+      "text" : " ‍ن",
+      "words" : [
+         "ن"
+      ]
+   },
+   {
+      "text" : "ن‍ ",
+      "words" : [
+         "ن‍"
+      ]
    }
 ]

Reply via email to