diff options
Diffstat (limited to 'extra/locale/collation/iso14651_t1')
-rw-r--r-- | extra/locale/collation/iso14651_t1 | 1495 |
1 files changed, 1495 insertions, 0 deletions
diff --git a/extra/locale/collation/iso14651_t1 b/extra/locale/collation/iso14651_t1 new file mode 100644 index 000000000..b44d34a54 --- /dev/null +++ b/extra/locale/collation/iso14651_t1 @@ -0,0 +1,1495 @@ + +# Déclaration des systèmes d'écriture / Declaration of scripts +script <SPECIAL> +script <LATIN> +script <ARABINT> +script <ARABFOR> +script <HEBREU> +script <GREC> +script <CYRIL> +script <HAN> + +# Déclaration des symboles internes / Declaration of internal symbols +# +# SYMB N° Expl. +# +collating-symbol <RES-1> +# +# <ARABINT>/<ARABFOR> +# +# +collating-symbol <ANO> # 2 normal --> voir/see <MIN> +collating-symbol <AIS> # 3 isol. +collating-symbol <AFI> # 4 final +collating-symbol <AII> # 5 initial +collating-symbol <AME> # 6 medial/m<e'>dian +# +collating-symbol <MIN> # 7 minuscule/minuscule (bas de casse/lower case) +collating-symbol <IMI> # 8 inférieur min./subscript min. (indice/index) +collating-symbol <EMI> # 9 supér. min./superscript min. (exposant/exponent) +collating-symbol <CAP> # 10 capitale/capital (haut de casse/upper case) +collating-symbol <AMI> # 8 minuscule grecque/Greek lower case +collating-symbol <ICA> # 11 inférieur en capitale/subscript capital +collating-symbol <ECA> # 12 supérieur en capitale/superscript capital +# +# <ARABINT>/<ARABFOR> +# +collating-symbol <AMA> # 13 accent madda +collating-symbol <AHA> # 14 accent hamza +collating-symbol <AHW> # 14-1 accent hamza/waw +collating-symbol <AHS> # 14-2 accent hamza under / hamza souscrit +collating-symbol <AYE> # 14-3 accent under yeh / accent souscrit du ya' +collating-symbol <YBA> # 14-4 accent hamza/yeh barree +# +collating-symbol <BAS> # 15 de base/basic (non accentué/non-accented) +# +collating-symbol <PCL> # 16 particulier/peculiar +collating-symbol <LIG> # 17 ligature/ligature +collating-symbol <ACA> # 18 accent aigu/acute accent +collating-symbol <GRA> # 20 accent grave/grave accent +collating-symbol <BRE> # 21 brève/breve +collating-symbol <CIR> # 22 accent 
circonflexe/circumflex accent +collating-symbol <CAR> # 23 caron/caron +collating-symbol <RNE> # 24 rond supérieur/ring above +collating-symbol <REU> # 25 tréma/diaeresis (ou/or umlaut) +collating-symbol <DAC> # 26 double ac. aigu/double acute ac. +collating-symbol <TIL> # 27 tilde/tilde +collating-symbol <PCT> # 28 point/dot +collating-symbol <OBL> # 29 barre oblique/oblique +collating-symbol <CDI> # 30 cédille/cedilla +collating-symbol <OGO> # 31 ogonek/ogonek +collating-symbol <MAC> # 32 macron/macron +# +# GREC +# +collating-symbol <TNS> # accent aigu/tonos/acute accent +collating-symbol <DLT> # tr<e'>ma/dialytica/diaeresis +collating-symbol <DTT> # dialytika tonos +# +collating-symbol <0> +collating-symbol <1> +collating-symbol <2> +collating-symbol <3> +collating-symbol <4> +collating-symbol <5> +collating-symbol <6> +collating-symbol <7> +collating-symbol <8> +collating-symbol <9> +# +collating-symbol <a> +collating-symbol <b> +collating-symbol <c> +collating-symbol <d> +collating-symbol <e> +collating-symbol <f> +collating-symbol <g> +collating-symbol <h> +collating-symbol <i> +collating-symbol <j> +collating-symbol <k> +collating-symbol <l> +collating-symbol <m> +collating-symbol <n> +collating-symbol <o> +collating-symbol <p> +collating-symbol <q> +collating-symbol <r> +collating-symbol <s> +collating-symbol <t> +collating-symbol <u> +collating-symbol <v> +collating-symbol <w> +collating-symbol <x> +collating-symbol <y> +collating-symbol <z> +collating-symbol <th> +# +# <ARABINT>/<ARABFOR> +# +collating-symbol <hamza> +collating-symbol <alef> +collating-symbol <beh> +collating-symbol <peh> +collating-symbol <teh_marbuta> +collating-symbol <teh> +collating-symbol <tteh> +collating-symbol <theh> +collating-symbol <jeem> +collating-symbol <tcheh> +collating-symbol <hah> +collating-symbol <khah> +collating-symbol <dal> +collating-symbol <ddal> +collating-symbol <thal> +collating-symbol <reh> +collating-symbol <rreh> +collating-symbol <zain> +collating-symbol 
<jeh> +collating-symbol <seen> +collating-symbol <sheen> +collating-symbol <sad> +collating-symbol <dad> +collating-symbol <tah> +collating-symbol <zah> +collating-symbol <ain> +collating-symbol <ghain> +collating-symbol <feh> +collating-symbol <qaf> +collating-symbol <kaf> +collating-symbol <keheh> +collating-symbol <gaf> +collating-symbol <lam> +collating-symbol <meem> +collating-symbol <noon> +collating-symbol <noon_ghunna> +collating-symbol <heh> +collating-symbol <heh_yeh> +collating-symbol <waw> +collating-symbol <alef_maksura> +collating-symbol <yeh_barree> +# +# <HEBREU> +# +collating-symbol <alef_heb> +collating-symbol <bet> +collating-symbol <gimel> +collating-symbol <dalet> +collating-symbol <he> +collating-symbol <vav> +collating-symbol <zayin> +collating-symbol <het> +collating-symbol <tet> +collating-symbol <yod> +collating-symbol <kaf_fin> +collating-symbol <kaf_heb> +collating-symbol <lamed> +collating-symbol <mem_fin> +collating-symbol <mem> +collating-symbol <nun_fin> +collating-symbol <nun> +collating-symbol <samekh> +collating-symbol <ayin> +collating-symbol <pe_fin> +collating-symbol <pe> +collating-symbol <tsadi_fin> +collating-symbol <tsadi> +collating-symbol <qof> +collating-symbol <resh> +collating-symbol <shin> +collating-symbol <tav> +# +# GREC +# +collating-symbol <ALPHA> +collating-symbol <BETA> +collating-symbol <GAMMA> +collating-symbol <DELTA> +collating-symbol <EPSILON> +collating-symbol <ZETA> +collating-symbol <ETA> +collating-symbol <THETA> +collating-symbol <IOTA> +collating-symbol <KAPPA> +collating-symbol <LAMBDA> +collating-symbol <MU> +collating-symbol <NU> +collating-symbol <XI> +collating-symbol <OMICRON> +collating-symbol <PI> +collating-symbol <RHO> +collating-symbol <SIGMA> +collating-symbol <TAU> +collating-symbol <UPSILON> +collating-symbol <PHI> +collating-symbol <CHI> +collating-symbol <PSI> +collating-symbol <OMEGA> +# +# CYRIL +# +collating-symbol <CYR-A> +collating-symbol <CYR-BE> +collating-symbol <CYR-VE> 
+collating-symbol <CYR-GHE> +collating-symbol <CYR-DE> +collating-symbol <CYR-GZHE> +collating-symbol <CYR-DJE> +collating-symbol <CYR-IE> +collating-symbol <UKR-IE> +collating-symbol <CYR-IO> +collating-symbol <CYR-ZHE> +collating-symbol <CYR-ZE> +collating-symbol <CYR-DZE> +collating-symbol <CYR-I> +collating-symbol <UKR-I> +collating-symbol <UKR-YI> +collating-symbol <CYR-IBRE> +collating-symbol <CYR-JE> +collating-symbol <CYR-KA> +collating-symbol <CYR-EL> +collating-symbol <CYR-LJE> +collating-symbol <CYR-EM> +collating-symbol <CYR-EN> +collating-symbol <CYR-NJE> +collating-symbol <CYR-O> +collating-symbol <CYR-PE> +collating-symbol <CYR-ER> +collating-symbol <CYR-ES> +collating-symbol <CYR-TE> +collating-symbol <CYR-KJE> +collating-symbol <CYR-TSHE> +collating-symbol <CYR-OU> +collating-symbol <CYR-OUBRE> +collating-symbol <CYR-EF> +collating-symbol <CYR-HA> +collating-symbol <CYR-TSE> +collating-symbol <CYR-CHE> +collating-symbol <CYR-DCHE> +collating-symbol <CYR-SHA> +collating-symbol <CYR-SHTSHA> +collating-symbol <CYR-SIGDUR> +collating-symbol <CYR-YEROU> +collating-symbol <CYR-SIGMOUIL> +collating-symbol <CYR-E> +collating-symbol <CYR-YOU> +collating-symbol <CYR-YA> + +# Ordre des symboles internes / Order of internal symbols +# +# SYMB. N° +# +<RES-1> +<MIN> +# forme de base (bas de casse, arabe intrinsèque, +# hébreu intrinsèque, etc. +# basic form (lower case, intrinsic Arabic +# intrinsic Hebrew and so on) +# +# <ARABINT>/<ARABFOR> +# +# +<ANO> # voir +<AIS> # isol. 
+# 3 +<AFI> # final +# 4 +<AII> # initial +# 5 +<AME> # medial/m<e'>dian +# 6 +# +<IMI> # 7 +<EMI> # 8 +<CAP> # 9 +<ICA> # 10 +<ECA> # 11 +<AMI> +#alternate lower case/ +# 12 +# +#minuscules spéciales après majuscules +# <ARABINT>/<ARABFOR> +# +<AMA> # accent madda #13 +<AHA> # accent hamza #14 +<AHW> # accent hamza/waw #14 1 +<AHS> # accent hamza under / hamza souscrit #14 2 +<AYE> # accent under yeh / accent souscrit du ya' #14 3 +<YBA> # accent hamza/yeh barree #14 4 +# +<BAS> # 15 +# +<PCL> # 16 +<LIG> # 17 +<ACA> # 18 +<GRA> # 19 +<BRE> # 20 +<CIR> # 21 +<CAR> # 22 +<RNE> # 23 +<REU> # 24 +<DAC> # 25 +<TIL> # 26 +<PCT> # 27 +<OBL> # 28 +<CDI> # 29 +<OGO> # 30 +<MAC> # 31 +# +# GREC +# +<TNS> # accent aigu/tonos/acute accent +<DLT> # tr<e'>ma/dialytica/diaeresis +<DTT> # dialytika tonos +# +<0> # 48 +<1> # 49 +<2> # 50 +<3> # 51 +<4> # 52 +<5> # 53 +<6> # 54 +<7> # 55 +<8> # 56 +<9> # 57 +# +<a> # 97 +<b> # 98 +<c> # 99 +<d> # 100 +<e> # 101 +<f> # 102 +<g> # 103 +<h> # 104 +<i> # 105 +<j> # 106 +<k> # 107 +<l> # 108 +<m> # 109 +<n> # 110 +<o> # 111 +<p> # 112 +<q> # 113 +<r> # 114 +<s> # 115 +<t> # 116 +<u> # 117 +<v> # 118 +<w> # 119 +<x> # 120 +<y> # 121 +<z> # 122 +<th># 122b +# +# <ARABINT>/<ARABFOR> +# +<hamza> +<alef> +<beh> +<peh> +<teh_marbuta> +<teh> +<tteh> +<theh> +<jeem> +<tcheh> +<hah> +<khah> +<dal> +<ddal> +<thal> +<reh> +<rreh> +<zain> +<jeh> +<seen> +<sheen> +<sad> +<dad> +<tah> +<zah> +<ain> +<ghain> +<feh> +<qaf> +<kaf> +<keheh> +<gaf> +<lam> +<meem> +<noon> +<noon_ghunna> +<heh> +<heh_yeh> +<waw> +<alef_maksura> +<yeh_barree> +# +# <HEBREU> +# +<alef_heb> +<bet> +<gimel> +<dalet> +<he> +<vav> +<zayin> +<het> +<tet> +<yod> +<kaf_fin> +<kaf_heb> +<lamed> +<mem_fin> +<mem> +<nun_fin> +<nun> +<samekh> +<ayin> +<pe_fin> +<pe> +<tsadi_fin> +<tsadi> +<qof> +<resh> +<shin> +<tav> +# +#GREC +# +<ALPHA> +<BETA> +<GAMMA> +<DELTA> +<EPSILON> +<ZETA> +<ETA> +<THETA> +<IOTA> +<KAPPA> +<LAMBDA> +<MU> +<NU> +<XI> +<OMICRON> +<PI> +<RHO> +<SIGMA> +<TAU> 
+<UPSILON> +<PHI> +<CHI> +<PSI> +<OMEGA> +# +#CYRIL +# +<CYR-A> +<CYR-BE> +<CYR-VE> +<CYR-GHE> +<CYR-DE> +<CYR-GZHE> +<CYR-DJE> +<CYR-IE> +<UKR-IE> +<CYR-IO> +<CYR-ZHE> +<CYR-ZE> +<CYR-DZE> +<CYR-I> +<UKR-I> +<UKR-YI> +<CYR-IBRE> +<CYR-JE> +<CYR-KA> +<CYR-EL> +<CYR-LJE> +<CYR-EM> +<CYR-EN> +<CYR-NJE> +<CYR-O> +<CYR-PE> +<CYR-ER> +<CYR-ES> +<CYR-TE> +<CYR-KJE> +<CYR-TSHE> +<CYR-OU> +<CYR-OUBRE> +<CYR-EF> +<CYR-HA> +<CYR-TSE> +<CYR-CHE> +<CYR-DCHE> +<CYR-SHA> +<CYR-SHTSHA> +<CYR-SIGDUR> +<CYR-YEROU> +<CYR-SIGMOUIL> +<CYR-E> +<CYR-YOU> +<CYR-YA> + +order_start <SPECIAL>;forward;backward;forward;forward,position +# +# Tout caractère non précisément défini sera considéré comme caractère spécial +# et considéré uniquement au dernier niveau. +# +# Any character not precisely specified will be considered as a special +# character and considered only at the last level. +# <U0000>......<U7FFFFFFF> IGNORE;IGNORE;IGNORE;<U0000>......<U7FFFFFFF> +# +# SYMB. N° GLY +# +<U0020> IGNORE;IGNORE;IGNORE;<U0020> # 32 <SP> +<U005F> IGNORE;IGNORE;IGNORE;<U005F> # 33 _ +<U0332> IGNORE;IGNORE;IGNORE;<U0332> # 34 <"_> +<U00AF> IGNORE;IGNORE;IGNORE;<U00AF> # 35 - (MACRON) +<U00AD> IGNORE;IGNORE;IGNORE;<U00AD> # 36 <SHY> +<U002D> IGNORE;IGNORE;IGNORE;<U002D> # 37 - +<U002C> IGNORE;IGNORE;IGNORE;<U002C> # 38 , +<U003B> IGNORE;IGNORE;IGNORE;<U003B> # 39 ; +<U003A> IGNORE;IGNORE;IGNORE;<U003A> # 40 : +<U0021> IGNORE;IGNORE;IGNORE;<U0021> # 41 ! +<U00A1> IGNORE;IGNORE;IGNORE;<U00A1> # 42 ¡ +<U003F> IGNORE;IGNORE;IGNORE;<U003F> # 43 ? +<U00BF> IGNORE;IGNORE;IGNORE;<U00BF> # 44 ¿ +<U002F> IGNORE;IGNORE;IGNORE;<U002F> # 45 / +<U0338> IGNORE;IGNORE;IGNORE;<U0338> # 46 <"/> +<U002E> IGNORE;IGNORE;IGNORE;<U002E> # 47 . 
+<U00B7> IGNORE;IGNORE;IGNORE;<U00B7> # 58 ·
+<U00B8> IGNORE;IGNORE;IGNORE;<U00B8> # 59 ¸
+<U0328> IGNORE;IGNORE;IGNORE;<U0328> # 60 <";>
+<U0027> IGNORE;IGNORE;IGNORE;<U0027> # 61 '
+<U2018> IGNORE;IGNORE;IGNORE;<U2018> # 62 <'6>
+<U2019> IGNORE;IGNORE;IGNORE;<U2019> # 63 <'9>
+<U0022> IGNORE;IGNORE;IGNORE;<U0022> # 64 "
+<U201C> IGNORE;IGNORE;IGNORE;<U201C> # 65 <"6>
+<U201D> IGNORE;IGNORE;IGNORE;<U201D> # 66 <"9>
+<U00AB> IGNORE;IGNORE;IGNORE;<U00AB> # 67 «
+<U00BB> IGNORE;IGNORE;IGNORE;<U00BB> # 68 »
+<U0028> IGNORE;IGNORE;IGNORE;<U0028> # 69 (
+<U207D> IGNORE;IGNORE;IGNORE;<U207D> # 70 <(S>
+<U0029> IGNORE;IGNORE;IGNORE;<U0029> # 71 )
+<U207E> IGNORE;IGNORE;IGNORE;<U207E> # 72 <)S>
+<U005B> IGNORE;IGNORE;IGNORE;<U005B> # 73 [
+<U005D> IGNORE;IGNORE;IGNORE;<U005D> # 74 ]
+<U007B> IGNORE;IGNORE;IGNORE;<U007B> # 75 {
+<U007D> IGNORE;IGNORE;IGNORE;<U007D> # 76 }
+<U00A7> IGNORE;IGNORE;IGNORE;<U00A7> # 77 §
+<U00B6> IGNORE;IGNORE;IGNORE;<U00B6> # 78 ¶
+<U00A9> IGNORE;IGNORE;IGNORE;<U00A9> # 79 ©
+<U00AE> IGNORE;IGNORE;IGNORE;<U00AE> # 80 ®
+<U2122> IGNORE;IGNORE;IGNORE;<U2122> # 81 <TM>
+<U0040> IGNORE;IGNORE;IGNORE;<U0040> # 82 @
+<U00A4> IGNORE;IGNORE;IGNORE;<U00A4> # 83 ¤
+<U00A2> IGNORE;IGNORE;IGNORE;<U00A2> # 84 ¢
+<U0024> IGNORE;IGNORE;IGNORE;<U0024> # 85 $
+<U00A3> IGNORE;IGNORE;IGNORE;<U00A3> # 86 £
+<U00A5> IGNORE;IGNORE;IGNORE;<U00A5> # 87 ¥
+<U20A0> IGNORE;IGNORE;IGNORE;<U20A0> # ecu
+<U20A1> IGNORE;IGNORE;IGNORE;<U20A1> # colon
+<U20A2> IGNORE;IGNORE;IGNORE;<U20A2> # cruzeiro
+<U20A3> IGNORE;IGNORE;IGNORE;<U20A3> # french franc
+<U20A4> IGNORE;IGNORE;IGNORE;<U20A4> # lira
+<U20A5> IGNORE;IGNORE;IGNORE;<U20A5> # mill
+<U20A6> IGNORE;IGNORE;IGNORE;<U20A6> # naira
+<U20A7> IGNORE;IGNORE;IGNORE;<U20A7> # peseta
+<U20A8> IGNORE;IGNORE;IGNORE;<U20A8> # rupee
+<U20A9> IGNORE;IGNORE;IGNORE;<U20A9> # won
+<U20AA> IGNORE;IGNORE;IGNORE;<U20AA> # new sheqel
+<U20AB> IGNORE;IGNORE;IGNORE;<U20AB> # dong
+<U20AC> IGNORE;IGNORE;IGNORE;<U20AC> # euro
+<U20AD> IGNORE;IGNORE;IGNORE;<U20AD> # kip
+<U20AE> IGNORE;IGNORE;IGNORE;<U20AE> # tugrik
+<U20AF> IGNORE;IGNORE;IGNORE;<U20AF> # drachma
+<U002A> IGNORE;IGNORE;IGNORE;<U002A> # 88 *
+<U005C> IGNORE;IGNORE;IGNORE;<U005C> # 89
+<U0026> IGNORE;IGNORE;IGNORE;<U0026> # 90 &
+<U0023> IGNORE;IGNORE;IGNORE;<U0023> # 91 #
+<U0025> IGNORE;IGNORE;IGNORE;<U0025> # 92 %
+<U207B> IGNORE;IGNORE;IGNORE;<U207B> # 93 <-S>
+<U002B> IGNORE;IGNORE;IGNORE;<U002B> # 94 +
+<U207A> IGNORE;IGNORE;IGNORE;<U207A> # 95 <+S>
+<U00B1> IGNORE;IGNORE;IGNORE;<U00B1> # 96 ±
+<U00B4> IGNORE;IGNORE;IGNORE;<0> # 123 ´
+<U0060> IGNORE;IGNORE;IGNORE;<1> # 124 `
+<U0306> IGNORE;IGNORE;IGNORE;<2> # 125 <"(>
+<U005E> IGNORE;IGNORE;IGNORE;<3> # 126 ^
+<U030C> IGNORE;IGNORE;IGNORE;<4> # 127 <"<>
+<U030A> IGNORE;IGNORE;IGNORE;<5> # 128 <"0>
+<U00A8> IGNORE;IGNORE;IGNORE;<6> # 129 ¨
+<U030B> IGNORE;IGNORE;IGNORE;<7> # 130 <"">
+<U007E> IGNORE;IGNORE;IGNORE;<8> # 131 ~
+<U0307> IGNORE;IGNORE;IGNORE;<9> # 132 <".>
+<U00F7> IGNORE;IGNORE;IGNORE;<a> # 133 ÷
+<U00D7> IGNORE;IGNORE;IGNORE;<b> # 134 ×
+<U2260> IGNORE;IGNORE;IGNORE;<c> # 135 <!=>
+<U003C> IGNORE;IGNORE;IGNORE;<d> # 136 <
+<U2264> IGNORE;IGNORE;IGNORE;<e> # 137 <=<>
+<U003D> IGNORE;IGNORE;IGNORE;<f> # 138 =
+<U2265> IGNORE;IGNORE;IGNORE;<g> # 139 </>=>
+<U003E> IGNORE;IGNORE;IGNORE;<h> # 140 >
+<U00AC> IGNORE;IGNORE;IGNORE;<i> # 141 ¬
+<U007C> IGNORE;IGNORE;IGNORE;<j> # 142 |
+<U00A6> IGNORE;IGNORE;IGNORE;<k> # 143 ¦
+<U00B0> IGNORE;IGNORE;IGNORE;<l> # 144 °
+<U00B5> IGNORE;IGNORE;IGNORE;<m> # 145 µ
+<U2126> IGNORE;IGNORE;IGNORE;<n> # 146 <Om>
+<U220E> IGNORE;IGNORE;IGNORE;<o> # 147 <FP>
+<U250C> IGNORE;IGNORE;IGNORE;<p> # 148 <_V/>>
+<U252C> IGNORE;IGNORE;IGNORE;<q> # 149 <_V->
+<U2510> IGNORE;IGNORE;IGNORE;<r> # 150 <_V<w>
+<U251C> IGNORE;IGNORE;IGNORE;<s> # 151 <_!/>>
+<U253C> IGNORE;IGNORE;IGNORE;<t> # 152 <_!->
+<U2524> IGNORE;IGNORE;IGNORE;<u> # 153 <_!<>
+<U2514> IGNORE;IGNORE;IGNORE;<v> # 154 <_A/>>
+<U2534> IGNORE;IGNORE;IGNORE;<w> # 155 <_-A>
+<U2518> IGNORE;IGNORE;IGNORE;<x> # 156 <_A<> +<U2502> IGNORE;IGNORE;IGNORE;<y> # 157 <_!> +<U2500> IGNORE;IGNORE;IGNORE;<z> # 158 <_-> # +<U2501> IGNORE;IGNORE;IGNORE;<U2501> # 159 <_=> +<U2190> IGNORE;IGNORE;IGNORE;<U2190> # 160 <<-> +<U2192> IGNORE;IGNORE;IGNORE;<U2192> # 161 <-/>> +<U20D1> IGNORE;IGNORE;IGNORE;<U20D1> # 162 <"7> +<U2191> IGNORE;IGNORE;IGNORE;<U2191> # 163 <-!> +<U2193> IGNORE;IGNORE;IGNORE;<U2193> # 164 <-v> +<U266A> IGNORE;IGNORE;IGNORE;<U266A> # 165 <_d!> +<U2571> IGNORE;IGNORE;IGNORE;<U2571> # 166 <_/>//> +<U2572> IGNORE;IGNORE;IGNORE;<U2572> # 167 <_<\> +<U25E2> IGNORE;IGNORE;IGNORE;<U25E2> # 168 <_./>//> +<U25E3> IGNORE;IGNORE;IGNORE;<U25E3> # 169 <_.<\> # # <ARABINT>/<ARABFOR> # +<U060C> IGNORE;IGNORE;IGNORE;<U060C> +<U061B> IGNORE;IGNORE;IGNORE;<U061B> +<U061F> IGNORE;IGNORE;IGNORE;<U061F> +<U0640> IGNORE;IGNORE;IGNORE;<U0640> +<U066A> IGNORE;IGNORE;IGNORE;<U066A> +<U066B> IGNORE;IGNORE;IGNORE;<U066B> +<U066C> IGNORE;IGNORE;IGNORE;<U066C> +<U066D> IGNORE;IGNORE;IGNORE;<U066D> +<U064B> IGNORE;IGNORE;IGNORE;<U064B> #<fathatan_no> +<UFE70> IGNORE;IGNORE;IGNORE;<UFE70> #<fathatan_is> +<UFE71> IGNORE;IGNORE;IGNORE;<UFE71> #<fathatan_me> +<U064C> IGNORE;IGNORE;IGNORE;<U064C> #<dammatan_no> +<UFE72> IGNORE;IGNORE;IGNORE;<UFE72> #<dammatan_is> +<U064D> IGNORE;IGNORE;IGNORE;<U064D> #<kasratan_no> +<UFE74> IGNORE;IGNORE;IGNORE;<UFE74> #<kasratan_is> +<U064E> IGNORE;IGNORE;IGNORE;<U064E> #<fatha_no> +<UFE76> IGNORE;IGNORE;IGNORE;<UFE76> #<fatha_is> +<UFE77> IGNORE;IGNORE;IGNORE;<UFE77> #<fatha_me> +<U064F> IGNORE;IGNORE;IGNORE;<U064F> #<damma_no> +<UFE78> IGNORE;IGNORE;IGNORE;<UFE78> #<damma_is> +<UFE79> IGNORE;IGNORE;IGNORE;<UFE79> #<damma_me> +<U0650> IGNORE;IGNORE;IGNORE;<U0650> #<kasra_no> +<UFE7A> IGNORE;IGNORE;IGNORE;<UFE7A> #<kasra_is> +<UFE7B> IGNORE;IGNORE;IGNORE;<UFE7B> #<kasra_me> +<U0651> IGNORE;IGNORE;IGNORE;<U0651> #<shadda_no> +<UFE7C> IGNORE;IGNORE;IGNORE;<UFE7C> #<shadda_is> +<UFE7D> IGNORE;IGNORE;IGNORE;<UFE7D> #<shadda_me> 
+<U0652> IGNORE;IGNORE;IGNORE;<U0652> #<sukun_no> +<UFE7E> IGNORE;IGNORE;IGNORE;<UFE7E> #<sukun_is> +<UFE7F> IGNORE;IGNORE;IGNORE;<UFE7F> #<sukun_me> # # <HEBREU> # +<U05B0> IGNORE;IGNORE;IGNORE;<U05B0> #point_sheva +<U05B1> IGNORE;IGNORE;IGNORE;<U05B1> #point_hataf_segol +<U05B2> IGNORE;IGNORE;IGNORE;<U05B2> #point_hataf_patah +<U05B3> IGNORE;IGNORE;IGNORE;<U05B3> #point_hataf_qamats +<U05B4> IGNORE;IGNORE;IGNORE;<U05B4> #point_hiriq +<U05B5> IGNORE;IGNORE;IGNORE;<U05B5> #point_tsere +<U05B6> IGNORE;IGNORE;IGNORE;<U05B6> #point_segol +<U05B7> IGNORE;IGNORE;IGNORE;<U05B7> #point_patah +<U05B8> IGNORE;IGNORE;IGNORE;<U05B8> #point_qamats +<U05B9> IGNORE;IGNORE;IGNORE;<U05B9> #point_holam +<U05BB> IGNORE;IGNORE;IGNORE;<U05BB> #point_qubuts +<U05BC> IGNORE;IGNORE;IGNORE;<U05BC> #point_dagesh +<U05BD> IGNORE;IGNORE;IGNORE;<U05BD> #point_meteg +<U05BE> IGNORE;IGNORE;IGNORE;<U05BE> #maqaf +<U05BF> IGNORE;IGNORE;IGNORE;<U05BF> #point_rafe +<U05C0> IGNORE;IGNORE;IGNORE;<U05C0> #paseq +<U05C1> IGNORE;IGNORE;IGNORE;<U05C1> #point_shin_dot +<U05C2> IGNORE;IGNORE;IGNORE;<U05C2> #point_sin_dot +<U05C3> IGNORE;IGNORE;IGNORE;<U05C3> #sof pasuq + +# The comment at the beginning of this section mentions characters which +# are not otherwise covered. But this description cannot express this. +# Therefore we add here a few entries which are used in older implementations +# to be compatible. 
--drepper +<U0001> IGNORE;IGNORE;IGNORE;<U0001> +<U0002> IGNORE;IGNORE;IGNORE;<U0002> +<U0003> IGNORE;IGNORE;IGNORE;<U0003> +<U0004> IGNORE;IGNORE;IGNORE;<U0004> +<U0005> IGNORE;IGNORE;IGNORE;<U0005> +<U0006> IGNORE;IGNORE;IGNORE;<U0006> +<U0007> IGNORE;IGNORE;IGNORE;<U0007> +<U0008> IGNORE;IGNORE;IGNORE;<U0008> +<U0009> IGNORE;IGNORE;IGNORE;<U0009> +<U000A> IGNORE;IGNORE;IGNORE;<U000A> +<U000B> IGNORE;IGNORE;IGNORE;<U000B> +<U000C> IGNORE;IGNORE;IGNORE;<U000C> +<U000D> IGNORE;IGNORE;IGNORE;<U000D> +<U000E> IGNORE;IGNORE;IGNORE;<U000E> +<U000F> IGNORE;IGNORE;IGNORE;<U000F> +<U0010> IGNORE;IGNORE;IGNORE;<U0010> +<U0011> IGNORE;IGNORE;IGNORE;<U0011> +<U0012> IGNORE;IGNORE;IGNORE;<U0012> +<U0013> IGNORE;IGNORE;IGNORE;<U0013> +<U0014> IGNORE;IGNORE;IGNORE;<U0014> +<U0015> IGNORE;IGNORE;IGNORE;<U0015> +<U0016> IGNORE;IGNORE;IGNORE;<U0016> +<U0017> IGNORE;IGNORE;IGNORE;<U0017> +<U0018> IGNORE;IGNORE;IGNORE;<U0018> +<U0019> IGNORE;IGNORE;IGNORE;<U0019> +<U001A> IGNORE;IGNORE;IGNORE;<U001A> +<U001B> IGNORE;IGNORE;IGNORE;<U001B> +<U001C> IGNORE;IGNORE;IGNORE;<U001C> +<U001D> IGNORE;IGNORE;IGNORE;<U001D> +<U001E> IGNORE;IGNORE;IGNORE;<U001E> +<U001F> IGNORE;IGNORE;IGNORE;<U001F> +<U007F> IGNORE;IGNORE;IGNORE;<U007F> +<U0080> IGNORE;IGNORE;IGNORE;<U0080> +<U0081> IGNORE;IGNORE;IGNORE;<U0081> +<U0082> IGNORE;IGNORE;IGNORE;<U0082> +<U0083> IGNORE;IGNORE;IGNORE;<U0083> +<U0084> IGNORE;IGNORE;IGNORE;<U0084> +<U0085> IGNORE;IGNORE;IGNORE;<U0085> +<U0086> IGNORE;IGNORE;IGNORE;<U0086> +<U0087> IGNORE;IGNORE;IGNORE;<U0087> +<U0088> IGNORE;IGNORE;IGNORE;<U0088> +<U0089> IGNORE;IGNORE;IGNORE;<U0089> +<U008A> IGNORE;IGNORE;IGNORE;<U008A> +<U008B> IGNORE;IGNORE;IGNORE;<U008B> +<U008C> IGNORE;IGNORE;IGNORE;<U008C> +<U008D> IGNORE;IGNORE;IGNORE;<U008D> +<U008E> IGNORE;IGNORE;IGNORE;<U008E> +<U008F> IGNORE;IGNORE;IGNORE;<U008F> +<U0090> IGNORE;IGNORE;IGNORE;<U0090> +<U0091> IGNORE;IGNORE;IGNORE;<U0091> +<U0092> IGNORE;IGNORE;IGNORE;<U0092> +<U0093> IGNORE;IGNORE;IGNORE;<U0093> +<U0094> 
IGNORE;IGNORE;IGNORE;<U0094> +<U0095> IGNORE;IGNORE;IGNORE;<U0095> +<U0096> IGNORE;IGNORE;IGNORE;<U0096> +<U0097> IGNORE;IGNORE;IGNORE;<U0097> +<U0098> IGNORE;IGNORE;IGNORE;<U0098> +<U0099> IGNORE;IGNORE;IGNORE;<U0099> +<U009A> IGNORE;IGNORE;IGNORE;<U009A> +<U009B> IGNORE;IGNORE;IGNORE;<U009B> +<U009C> IGNORE;IGNORE;IGNORE;<U009C> +<U009D> IGNORE;IGNORE;IGNORE;<U009D> +<U009E> IGNORE;IGNORE;IGNORE;<U009E> +<U009F> IGNORE;IGNORE;IGNORE;<U009F> + +order_start <LATIN>;forward;backward;forward;forward,position +# +<U00A0> <U0020>;<BAS>;<MIN>;IGNORE # 170<NBSP> +# +<U0030> <0>;<BAS>;<MIN>;IGNORE # 171 0 +<U0031> <1>;<BAS>;<MIN>;IGNORE # 172 1 +<U0032> <2>;<BAS>;<MIN>;IGNORE # 173 2 +<U0033> <3>;<BAS>;<MIN>;IGNORE # 174 3 +<U0034> <4>;<BAS>;<MIN>;IGNORE # 175 4 +<U0035> <5>;<BAS>;<MIN>;IGNORE # 176 5 +<U0036> <6>;<BAS>;<MIN>;IGNORE # 177 6 +<U0037> <7>;<BAS>;<MIN>;IGNORE # 178 7 +<U0038> <8>;<BAS>;<MIN>;IGNORE # 179 8 +<U0039> <9>;<BAS>;<MIN>;IGNORE # 180 9 +# +<U215B> <0>;<GRA>;<MIN>;IGNORE # 181 <18> +<U00BC> <0>;<BRE>;<MIN>;IGNORE # 182 ¼ +<U215C> <0>;<CIR>;<MIN>;IGNORE # 183 <38> +<U215D> <0>;<RNE>;<MIN>;IGNORE # 184 <58> +<U215E> <0>;<DAC>;<MIN>;IGNORE # 185 <78> +<U00BD> <0>;<CAR>;<MIN>;IGNORE # 186 ½ +<U00BE> <0>;<REU>;<MIN>;IGNORE # 187 ¾ +<U2070> <0>;<BAS>;<EMI>;IGNORE # 188 <0S> +<U00B9> <1>;<BAS>;<EMI>;IGNORE # 189 ¹ +<U00B2> <2>;<BAS>;<EMI>;IGNORE # 190 ² +<U00B3> <3>;<BAS>;<EMI>;IGNORE # 191 ³ +<U2074> <4>;<BAS>;<EMI>;IGNORE # 192 <4S> +<U2075> <5>;<BAS>;<EMI>;IGNORE # 193 <5S> +<U2076> <6>;<BAS>;<EMI>;IGNORE # 194 <6S> +<U2077> <7>;<BAS>;<EMI>;IGNORE # 195 <7S> +<U2078> <8>;<BAS>;<EMI>;IGNORE # 196 <8S> +<U2079> <9>;<BAS>;<EMI>;IGNORE # 197 <9S> +# +<U0061> <a>;<BAS>;<MIN>;IGNORE # 198 a +<U00AA> <a>;<PCL>;<EMI>;IGNORE # 199 ª +<U00E1> <a>;<ACA>;<MIN>;IGNORE # 200 á +<U00E0> <a>;<GRA>;<MIN>;IGNORE # 201 à +<U00E2> <a>;<CIR>;<MIN>;IGNORE # 202 â +<U00E3> <a>;<TIL>;<MIN>;IGNORE # 203 ã +<U00E4> <a>;<REU>;<MIN>;IGNORE # 204 ä +<U00E5> <a>;<RNE>;<MIN>;IGNORE # 
205 å +<U0103> <a>;<BRE>;<MIN>;IGNORE # 206 <a(> +<U0105> <a>;<OGO>;<MIN>;IGNORE # 207 <a;> +<U0101> <a>;<MAC>;<MIN>;IGNORE # 208 <a-> +<U00E6> "<a><e>";"<LIG><LIG>";"<MIN><MIN>";IGNORE # 209 æ +<U0062> <b>;<BAS>;<MIN>;IGNORE # 210 b +<U0063> <c>;<BAS>;<MIN>;IGNORE # 211 c +<U00E7> <c>;<CDI>;<MIN>;IGNORE # 212 ç +<U0107> <c>;<ACA>;<MIN>;IGNORE # 213 <c'> +<U0109> <c>;<CIR>;<MIN>;IGNORE # 214 <c/>> +<U010D> <c>;<CAR>;<MIN>;IGNORE # 215 <c<> +<U010B> <c>;<PCT>;<MIN>;IGNORE # 216 <c.> +<U0064> <d>;<BAS>;<MIN>;IGNORE # 217 d +<U00F0> <d>;<PCL>;<MIN>;IGNORE # 218 ð +<U010F> <d>;<CAR>;<MIN>;IGNORE # 219 <d<> +<U0111> <d>;<OBL>;<MIN>;IGNORE # 220 <d//> +<U0065> <e>;<BAS>;<MIN>;IGNORE # 221 e +<U00E9> <e>;<ACA>;<MIN>;IGNORE # 222 é +<U00E8> <e>;<GRA>;<MIN>;IGNORE # 223 è +<U00EA> <e>;<CIR>;<MIN>;IGNORE # 224 ê +<U00EB> <e>;<REU>;<MIN>;IGNORE # 225 ë +<U011B> <e>;<CAR>;<MIN>;IGNORE # 226 <e<> +<U0117> <e>;<PCT>;<MIN>;IGNORE # 227 <e.> +<U0119> <e>;<OGO>;<MIN>;IGNORE # 228 <e;> +<U0113> <e>;<MAC>;<MIN>;IGNORE # 229 <e-> +<U0066> <f>;<BAS>;<MIN>;IGNORE # 230 f +<U0067> <g>;<BAS>;<MIN>;IGNORE # 231 g +<U011F> <g>;<BRE>;<MIN>;IGNORE # 232 <g(> +<U011D> <g>;<CIR>;<MIN>;IGNORE # 233 <g/>> +<U0121> <g>;<PCT>;<MIN>;IGNORE # 234 <g.> +<U0123> <g>;<CDI>;<MIN>;IGNORE # 235 <g,> +<U0068> <h>;<BAS>;<MIN>;IGNORE # 236 h +<U0125> <h>;<CIR>;<MIN>;IGNORE # 237 <h/>> +<U0127> <h>;<OBL>;<MIN>;IGNORE # 238 <h//> +<U0069> <i>;<BAS>;<MIN>;IGNORE # 239 i +<U00ED> <i>;<ACA>;<MIN>;IGNORE # 240 í +<U00EC> <i>;<GRA>;<MIN>;IGNORE # 241 ì +<U00EE> <i>;<CIR>;<MIN>;IGNORE # 242 î +<U00EF> <i>;<REU>;<MIN>;IGNORE # 243 ï +<U0131> <i>;<PCL>;<MIN>;IGNORE # 244 <i.> +<U0129> <i>;<TIL>;<MIN>;IGNORE # 245 <i?> +<U012F> <i>;<OGO>;<MIN>;IGNORE # 246 <i;> +<U012B> <i>;<MAC>;<MIN>;IGNORE # 247 <i-> +<U0133> "<i><j>";"<LIG><LIG>";"<MIN><MIN>";IGNORE # 248 <ij> +<U006A> <j>;<BAS>;<MIN>;IGNORE # 249 j +<U0135> <j>;<CIR>;<MIN>;IGNORE # 250 <j/>> +<U006B> <k>;<BAS>;<MIN>;IGNORE # 251 k +<U0138> <k>;<PCL>;<MIN>;IGNORE # 
252 <kk> +<U0137> <k>;<CDI>;<MIN>;IGNORE # 253 <k,> +<U006C> <l>;<BAS>;<MIN>;IGNORE # 254 l +<U013A> <l>;<ACA>;<MIN>;IGNORE # 255 <l'> +<U013E> <l>;<CAR>;<MIN>;IGNORE # 256 <l<> +<U0142> <l>;<OBL>;<MIN>;IGNORE # 257 <l//> +<U013C> <l>;<CDI>;<MIN>;IGNORE # 258 <l,> +<U0140> <l>;<PCT>;<MIN>;IGNORE # 259 <l.> +<U006D> <m>;<BAS>;<MIN>;IGNORE # 260 m +<U006E> <n>;<BAS>;<MIN>;IGNORE # 261 n +<U00F1> <n>;<TIL>;<MIN>;IGNORE # 262 ñ +<U0149> <n>;<PCL>;<MIN>;IGNORE # 263 <'n> +<U0144> <n>;<ACA>;<MIN>;IGNORE # 264 <n'> +<U0148> <n>;<CAR>;<MIN>;IGNORE # 265 <n<> +<U0146> <n>;<CDI>;<MIN>;IGNORE # 266 <n,> +<U014B> "<n><g>";"<LIG><LIG>";"<MIN><MIN>";IGNORE # 267 <ng> +<U006F> <o>;<BAS>;<MIN>;IGNORE # 268 o +<U00BA> <o>;<PCL>;<EMI>;IGNORE # 269 º +<U00F3> <o>;<ACA>;<MIN>;IGNORE # 270 ó +<U00F2> <o>;<GRA>;<MIN>;IGNORE # 271 ò +<U00F4> <o>;<CIR>;<MIN>;IGNORE # 272 ô +<U00F5> <o>;<TIL>;<MIN>;IGNORE # 273 õ +<U00F6> <o>;<REU>;<MIN>;IGNORE # 274 ö +<U00F8> <o>;<OBL>;<MIN>;IGNORE # 275 ø +<U0151> <o>;<DAC>;<MIN>;IGNORE # 276 <o"> +<U014D> <o>;<MAC>;<MIN>;IGNORE # 277 <o-> +<U0153> "<o><e>";"<LIG><LIG>";"<MIN><MIN>";IGNORE # 278 <oe> +<U0070> <p>;<BAS>;<MIN>;IGNORE # 279 p +<U0071> <q>;<BAS>;<MIN>;IGNORE # 280 q +<U0072> <r>;<BAS>;<MIN>;IGNORE # 281 r +<U0155> <r>;<ACA>;<MIN>;IGNORE # 282 <r'> +<U0159> <r>;<CAR>;<MIN>;IGNORE # 283 <r<> +<U0157> <r>;<CDI>;<MIN>;IGNORE # 284 <r,> +<U0073> <s>;<BAS>;<MIN>;IGNORE # 285 s +<U015B> <s>;<ACA>;<MIN>;IGNORE # 286 <s'> +<U015D> <s>;<CIR>;<MIN>;IGNORE # 287 <s/>> +<U0161> <s>;<CAR>;<MIN>;IGNORE # 288 <s<> +<U015F> <s>;<CDI>;<MIN>;IGNORE # 289 <s,> +<U00DF> "<s><s>";"<LIG><LIG>";"<MIN><MIN>";IGNORE # 290 ß +<U0074> <t>;<BAS>;<MIN>;IGNORE # 291 t +<U0165> <t>;<CAR>;<MIN>;IGNORE # 292 <t<> +<U0167> <t>;<OBL>;<MIN>;IGNORE # 293 <t//> +<U0163> <t>;<CDI>;<MIN>;IGNORE # 294 <t,> +<U0075> <u>;<BAS>;<MIN>;IGNORE # 296 u +<U00FA> <u>;<ACA>;<MIN>;IGNORE # 297 ú +<U00F9> <u>;<GRA>;<MIN>;IGNORE # 298 ù +<U00FB> <u>;<CIR>;<MIN>;IGNORE # 299 û +<U00FC> 
<u>;<REU>;<MIN>;IGNORE # 300 ü +<U016D> <u>;<BRE>;<MIN>;IGNORE # 301 <u(> +<U016F> <u>;<RNE>;<MIN>;IGNORE # 302 <u0> +<U0171> <u>;<DAC>;<MIN>;IGNORE # 303 <u"> +<U0169> <u>;<TIL>;<MIN>;IGNORE # 304 <u?> +<U0173> <u>;<OGO>;<MIN>;IGNORE # 305 <u;> +<U016B> <u>;<MAC>;<MIN>;IGNORE # 306 <u-> +<U0076> <v>;<BAS>;<MIN>;IGNORE # 307 v +<U0077> <w>;<BAS>;<MIN>;IGNORE # 308 w +<U0175> <w>;<CIR>;<MIN>;IGNORE # 309 <w/>> +<U0078> <x>;<BAS>;<MIN>;IGNORE # 310 x +<U0079> <y>;<BAS>;<MIN>;IGNORE # 311 y +<U00FD> <y>;<ACA>;<MIN>;IGNORE # 312 ý +<U00FF> <y>;<REU>;<MIN>;IGNORE # 313 _ +<U0177> <y>;<CIR>;<MIN>;IGNORE # 314 <y/>> +<U007A> <z>;<BAS>;<MIN>;IGNORE # 315 z +<U017A> <z>;<ACA>;<MIN>;IGNORE # 316 <z'> +<U017E> <z>;<CAR>;<MIN>;IGNORE # 317 <z<> +<U017C> <z>;<PCT>;<MIN>;IGNORE # 318 <z.> +<U00FE> <th>;<BAS>;<MIN>;IGNORE # 318b Þ # +<U0041> <a>;<BAS>;<CAP>;IGNORE # 319 A +<U00C1> <a>;<ACA>;<CAP>;IGNORE # 320 Á +<U00C0> <a>;<GRA>;<CAP>;IGNORE # 321 À +<U00C2> <a>;<CIR>;<CAP>;IGNORE # 322 Â +<U00C3> <a>;<TIL>;<CAP>;IGNORE # 323 Ã +<U00C4> <a>;<REU>;<CAP>;IGNORE # 324 Ä +<U00C5> <a>;<RNE>;<CAP>;IGNORE # 325 Å +<U0102> <a>;<BRE>;<CAP>;IGNORE # 326 <A(> +<U0104> <a>;<OGO>;<CAP>;IGNORE # 327 <A;> +<U0100> <a>;<MAC>;<CAP>;IGNORE # 328 <A-> +<U00C6> "<a><e>";"<LIG><LIG>";"<CAP><CAP>";IGNORE # 329 Æ +<U0042> <b>;<BAS>;<CAP>;IGNORE # 330 B +<U0043> <c>;<BAS>;<CAP>;IGNORE # 331 C +<U00C7> <c>;<CDI>;<CAP>;IGNORE # 332 Ç +<U0106> <c>;<ACA>;<CAP>;IGNORE # 333 <C'> +<U0108> <c>;<CIR>;<CAP>;IGNORE # 334 <C/>> +<U010C> <c>;<CAR>;<CAP>;IGNORE # 335 <C>> +<U010A> <c>;<PCT>;<CAP>;IGNORE # 336 <C.> +<U0044> <d>;<BAS>;<CAP>;IGNORE # 337 D +<U00D0> <d>;<PCL>;<CAP>;IGNORE # 338 Ð +<U010E> <d>;<CAR>;<CAP>;IGNORE # 339 <D<> +<U0110> <d>;<OBL |