cldr
Version:
Library for extracting data from CLDR (the Unicode Common Locale Data Repository)
34 lines (33 loc) • 1.17 kB
text/xml
<!-- Copyright © 1991-2024 Unicode, Inc.
For terms of use, see http://www.unicode.org/copyright.html
SPDX-License-Identifier: Unicode-3.0
CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
-->
<ldml>
  <!-- Locale identity: the data below applies to language "ja". -->
  <identity>
    <version number="$Revision$"/>
    <language type="ja"/>
  </identity>

  <segmentations>
    <!-- Line breaking: this file declares variables only; it adds no LineBreak rules. -->
    <segmentation type="LineBreak">
      <variables>
        <!-- $ID is the union of Line_Break=Ideographic and $CJ.
             NOTE(review): $CJ is not defined in this file; presumably it is
             inherited from the root segmentation data. Confirm. -->
        <variable id="$ID">[[\p{Line_Break=Ideographic}] [$CJ]]</variable>
        <!-- $NS is exactly Line_Break=Nonstarter; $CJ is not part of it here. -->
        <variable id="$NS">\p{Line_Break=Nonstarter}</variable>
      </variables>
    </segmentation>

    <!-- Word breaking: two variables plus two rules that use them. -->
    <segmentation type="WordBreak">
      <variables>
        <!-- Each id is declared twice. The second declaration references its
             own id, so it presumably wraps the preceding definition and appends
             an optional run of $FE (assumes variables resolve in document
             order; confirm against the LDML specification).
             NOTE(review): $FE is not defined in this file; presumably inherited. -->
        <variable id="$Hiragana">\p{Hiragana}</variable>
        <variable id="$Hiragana">($Hiragana $FE*)</variable>
        <!-- Ideographic property plus U+3005 (ideographic iteration mark),
             U+3007 (ideographic number zero) and U+303B (vertical ideographic
             iteration mark). -->
        <variable id="$Ideographic">[[\p{Ideographic}] [\u3005 \u3007 \u303B]]</variable>
        <variable id="$Ideographic">($Ideographic $FE*)</variable>
      </variables>
      <segmentRules>
        <!-- In LDML rule syntax the multiplication sign marks a position where
             no break is allowed: none between two $Hiragana items (13.3) and
             none between two $Ideographic items (13.4). -->
        <rule id="13.3"> $Hiragana × $Hiragana </rule>
        <rule id="13.4"> $Ideographic × $Ideographic </rule>
      </segmentRules>
    </segmentation>
  </segmentations>
</ldml>