Skip to content

Commit

Permalink
chore(resources): update to latest LDML
Browse files Browse the repository at this point in the history
- maybe last 'techpreview' update

Unblocks: chore(developer): support xmlns on keyboard3 files 🙀  #10803
Unblocks: chore(developer): rename unicodeSet to uset 🙀  #10657

For: #10803
  • Loading branch information
srl295 committed Feb 27, 2024
1 parent a92d475 commit db32e40
Show file tree
Hide file tree
Showing 18 changed files with 204 additions and 675 deletions.
146 changes: 72 additions & 74 deletions resources/standards-data/ldml-keyboards/techpreview/3.0/bn.xml
Original file line number Diff line number Diff line change
@@ -1,6 +1,5 @@
<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE keyboard3 SYSTEM "../dtd/ldmlKeyboard3.dtd">
<keyboard3 locale="bn" conformsTo="techpreview">
<keyboard3 xmlns="https://schemas.unicode.org/cldr/45/keyboard3" locale="bn" conformsTo="techpreview">
<!--
History:
Based on
Expand All @@ -13,15 +12,16 @@
<version number="1.3.0" />
<info name="SIL Bengali-Assamese Phonetic" indicator="bn" layout="QWERTY" />

<displays>
<display keyId="au-lengthener" display="" />
<display keyId="vis-hasant" display="" /> <!-- TODO: distinguish from regular hasant? -->
<display keyId="more" display="" />
</displays>

<keys>
<import base="cldr" path="techpreview/keys-Zyyy-punctuation.xml" />
<import base="cldr" path="techpreview/keys-Zyyy-currency.xml" />

<!-- key names based on https://www.loc.gov/catdir/cpso/romanization/bengali.pdf + Assamese for /wa/ -->

<!-- UNSHIFTED KEYS -->
<!-- E: (top) row -->
<key id="candrabindu" output="\u{0981}" /> <!---->
<key id="1" output="" />
<key id="2" output="" />
<key id="3" output="" />
Expand All @@ -32,86 +32,67 @@
<key id="8" output="" />
<key id="9" output="" />
<key id="0" output="" />
<!-- hyphen -->
<!-- equal -->

<!-- D: -->
<!-- special keys and marks -->
<key id="au-lenghtener" output="\m{A}" />
<key id="candrabindu" output="\u{0981}" /> <!---->
<key id="hasant" output="\u{09CD}" />
<key id="more" output="\m{q}" /> <!-- 'additional characters' -->
<key id="wa" output="" /> <!-- Assamese-->
<key id="e" output="\u{09C7}" />
<key id="ra" output="" />
<key id="ta" output="" />
<key id="sha" output="" />
<key id="u" output="\u{09C1}" />
<key id="i" output="\u{09BF}" />
<key id="o" output="\u{09CB}" />
<key id="pa" output="" />
<key id="nukta" output="\u{09BC}" />
<key id="vis-hasant" output="\m{X}" />

<!-- C: -->
<!-- key names based on https://www.loc.gov/catdir/cpso/romanization/bengali.pdf + Assamese for /wa/ -->
<key id="ā" output="\u{09BE}" />
<key id="sa" output="" />
<key id="ai" output="\u{09C8}" />
<key id="au" output="\u{09CC}" />
<key id="ba" output="" />
<key id="bha" output="" />
<key id="ca" output="" />
<key id="cha" output="" />
<key id="ḍa" output="" />
<key id="da" output="" />
<key id="ṭa" output="" />
<key id="dahri" output="" />
<key id="ḍha" output="" />
<key id="dha" output="" />
<key id="e" output="\u{09C7}" />
<key id="ga" output="" />
<key id="gha" output="" />
<key id="ha" output="" />
<key id="i" output="\u{09BF}" />
<key id="ī" output="\u{09C0}" />
<key id="ja" output="" />
<key id="jha" output="" />
<key id="ka" output="" />
<key id="kha" output="" />
<key id="la" output="" />

<!-- B: -->
<key id="śa" output="" />
<key id="hasant" output="\u{09CD}" />
<key id="ca" output="" />
<key id="ḍa" output="" />
<key id="ba" output="" />
<key id="na" output="" />
<key id="ma" output="" />
<!-- comma -->
<key id="dahri" output="" />


<!-- SHIFTED KEYS -->
<key id="ṃ" output="\u{0982}" />
<!-- exclam, etc -->

<!-- gap -->
<key id="ma" output="" />
<key id="ṅa" output="" />
<key id="ña" output="" />
<key id="ai" output="\u{09C8}" />
<key id="ṛ" output="\u{09C3}" />
<key id="tha" output="" />
<key id="ẏa" output="য়" /> <!-- Missing in Keyman version of file-->
<key id="ū" output="\u{09C2}" />
<key id="ī" output="\u{09C0}" />
<key id="au" output="\u{09CC}" />
<key id="ṇa" output="" />
<key id="na" output="" />
<key id="o" output="\u{09CB}" />
<key id="pa" output="" />
<key id="pha" output="" />

<key id="lengthener" output="\m{A}" />
<key id="ṛ" output="\u{09C3}" />
<key id="ra" output="" />
<key id="śa" output="" />
<key id="sa" output="" />
<key id="sha" output="" />
<key id="dha" output="" />
<key id="ṭa" output="" />
<key id="ta" output="" />
<key id="ṭha" output="" />
<key id="gha" output="" />
<!-- gap -->
<key id="jha" output="" />
<key id="kha" output="" />
<!-- gap -->

<!-- gap -->
<key id="vis-hasant" output="\m{X}" />
<key id="cha" output="" />
<key id="ḍha" output="" />
<key id="bha" output="" />
<key id="ṇa" output="" />
<key id="ṅa" output="" />
<!-- less-than -->
<key id="nukta" output="\u{09BC}" />
<!-- question -->


<key id="tha" output="" />
<key id="u" output="\u{09C1}" />
<key id="ū" output="\u{09C2}" />
<key id="wa" output="" /> <!-- Assamese transliteration -->
<key id="ya" output="" />
<key id="ẏa" output="য়" /> <!-- Missing in Keyman version of file-->
</keys>
<layers formId="us">
<layer modifiers="none">
<row keys="candrabindu 1 2 3 4 5 6 7 8 9 0 hyphen equal" />
<row keys="more wa e ra ta sha u i o pa open-square close-square backslash" />
<row keys="more wa e ra ta ya u i o pa open-square close-square backslash" />
<row keys="ā sa da ṭa ga ha ja ka la semi-colon apos" />
<row keys="śa hasant ca ḍa ba na ma comma dahri slash" />
<row keys="space" />
Expand All @@ -120,16 +101,16 @@
<row
keys="ṃ bang at hash dollar percent caret amp asterisk open-paren close-paren underscore plus" />
<row keys="gap ña ai ṛ tha ẏa ū ī au pha open-curly close-curly pipe" />
<row keys="lengthener sha dha ṭha gha gap jha kha gap colon double-quote" />
<row keys="au-lenghtener sha dha ṭha gha gap jha kha gap colon double-quote" />
<row keys="gap vis-hasant cha ḍha bha ṇa ṅa open-angle nukta question" />
<row keys="space" />
</layer>
</layers>

<transforms type="simple">
<transformGroup>
<transform from="\u{09C7}\m{A}" to="\u{09CC}" /> <!-- E + lengthener = AU -->
<!-- <transform from="\u{09C7}\u{09BE}" to="\u{09CB}" /> --> <!-- E + O = O This is handled by normalization. -->
<transform from="\u{09C7}\m{A}" to="\u{09CC}" /> <!-- E + au-lenghtener = AU -->
<!-- <transform from="\u{09C7}\u{09BE}" to="\u{09CB}" /> --> <!-- E + A = O. This is handled by normalization. -->

<!-- these support the 'q' key -->
<transform from="\m{q}:" to="\u{0983}" />
Expand All @@ -154,17 +135,34 @@
<transform from="\m{q}\m{A}" to="" />
<transform from="\m{q}\m{X}" to="\u{09CD}\u{200C}" /> <!-- virama + zwnj-->
</transformGroup>
<!-- TODO: document these -->
<transformGroup>
<transformGroup>
<!-- Nukta is tertiary, that is, it follows a tertiaryBase sequence -->
<reorder from="\u{09BC}" tertiary="3"/>
<!--
virama (hasant) followed by any other spacing chars has order 10, because this sequence goes after the consonant to which the virama pertains.
For example:
U+099A U+09CD U+099B
CA virama CHA
0 10 10
-->
<reorder from="\u{09CD}[\u{0980}\u{0985}-\u{098C}\u{098F}\u{0990}\u{0993}-\u{09A8}\u{09AA}-\u{09B0}\u{09B2}\u{09B6}-\u{09B9}\u{09BD}\u{09DC}\u{09DD}\u{09DF}-\u{09E1}\u{09E6}-\u{09F1}\u{09FC}]" order="10" tertiaryBase="true"/>
<!-- 10: virama + zwj/zwnj + spacing mark is also 10-->
<reorder from="\u{09CD}[\u{200C}\u{200D}][\u{0980}\u{0985}-\u{098C}\u{098F}\u{0990}\u{0993}-\u{09A8}\u{09AA}-\u{09B0}\u{09B2}\u{09B6}-\u{09B9}\u{09BD}\u{09DC}\u{09DD}\u{09DF}-\u{09E1}\u{09E6}-\u{09F1}\u{09FC}]" order="10" tertiaryBase="true"/>
<!-- 120: A virama not followed by a spacing mark goes further to the right (past the sandhi mark, below) -->
<reorder from="\u{09CD}" order="120" tertiaryBase="true"/>
<!-- The next three rules make sure the dependent vowels (DVs) are in the correct order -->
<!-- 60: left side dependent vowels -->
<reorder from="[\u{09BF}\u{09C7}\u{09C8}]" order="60"/>
<!-- 70: lower dependent vowels -->
<reorder from="[\u{09C1}-\u{09C4}\u{09E2}\u{09E3}]" order="70"/>
<reorder from="[\u{09BE}\u{09C0}\u{09CB}\u{09CC}]" order="75"/>
<!-- 75: right side dependent vowels. Note U+09D7 AU LENGTH MARK is included due to NFD -->
<reorder from="[\u{09BE}\u{09C0}\u{09CB}\u{09CC}\u{09D7}]" order="75"/>
<!-- 85: candrabindu -->
<reorder from="\u{0981}" order="85"/>
<!-- 95: anusvara and visarga -->
<reorder from="[\u{0982}\u{0983}]" order="95"/>
<!-- 117: sandhi mark -->
<reorder from="\u{09FE}" order="117"/>
</transformGroup>
</transforms>
Expand Down
Original file line number Diff line number Diff line change
@@ -1,5 +1,4 @@
<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE keyboard3 SYSTEM "../dtd/ldmlKeyboard3.dtd">
<!--
This file is part of the CLDR Keyboard Technical Preview.
This is a sample data file.
Expand All @@ -8,7 +7,7 @@
Also NOTE: this is really a test keyboard. CLDR-12026 will be for the real new azerty keyboard
-->
<keyboard3 locale="fr-t-k0-azerty" conformsTo="techpreview">
<keyboard3 xmlns="https://schemas.unicode.org/cldr/45/keyboard3" locale="fr-t-k0-azerty" conformsTo="techpreview">
<locales>
<locale id="br" /> <!-- example of including Breton -->
</locales>
Expand Down Expand Up @@ -52,7 +51,7 @@
<key id="extra" gap="true" />
<!--
TODO: need discussion
<key id="enter" output="\u{000A}" />
<key id="enter" to="\u{000A}" />
-->
<key id="enter" gap="true" />

Expand Down

This file was deleted.

Loading

0 comments on commit db32e40

Please sign in to comment.