version https://git-lfs.github.com/spec/v1
-oid sha256:1abc0174ae76c79801fe369dac52cd4c42a09d6c2b92919b1f7736d46ea10e1d
-size 10855096
+oid sha256:2f219f5ba7169a47b6b3edcda6d1daabf68831a7c0b1e8e7731c92a57f427994
+size 10728537
# TODO: figure out how to have a single copy of the file for use by both C and Java.
-# Temp debugging tests
+# Temp debugging tests
<word>
-# test normalization/dictionary handling of halfwidth katakana: same dictionary phrase in fullwidth and halfwidth
-<data>•芽キャベツ<400>芽キャベツ<400></data>
-
+<data>•Isn't<200></data>
+<char>
+<data>•\U00010020•\U00010000\N{COMBINING MACRON}•</data>
########################################################################################
#
<data>•123 •Start •with •a •number.•</data>
<data>•'•start •with •a •case-•ignorable •cha'r'a'cter•</data>
-
+<data>•' '' •start •with •case-•ignorable & •case-•insensitive •cha'r'a'cter•</data>
+<data>• ''•aaa' •bbb '•ccc' '•ddd''' '''•eee '''•fff''' •ggg ''•</data>
+# Note: apostrophe is case-ignorable. space is not cased.
##########################################################################################
#
#
# Trac ticket 5595 Test Case
-<word>
<data>•บท<200>ที่๑พายุ<200>ไซโคลน<200>โด<200>โรธี<200>อาศัย<200>อยู่<200>ท่ามกลาง<200>\
ทุ่งใหญ่<200>ใน<200>แคนซัส<200>กับ<200>ลุง<200>เฮ<200>นรี<200>ชาวไร่<200>และ<200>ป้า<200>เอ็ม<200>\
ภรรยา<200>ชาวไร่<200>บ้าน<200>ของ<200>พวก<200>เขา<200>หลัง<200>เล็ก<200>เพราะ<200>ไม้<200>\