about summary refs log tree commit diff
diff options
context:
space:
mode:
-rw-r--r-- localedata/ChangeLog | 4
-rw-r--r-- localedata/locales/iso14651_t1_common | 221
-rw-r--r-- localedata/locales/ta_IN | 93
3 files changed, 225 insertions, 93 deletions
diff --git a/localedata/ChangeLog b/localedata/ChangeLog
index 46e25638e0..0ee187fe67 100644
--- a/localedata/ChangeLog
+++ b/localedata/ChangeLog
@@ -1,5 +1,9 @@
 2010-02-03  Ulrich Drepper  <drepper@redhat.com>
 
+	* locales/ta_IN: Move collation data...
+	* locales/iso14651_t1_common: ...here.
+	Patch by Pravin Satpute <psatpute@redhat.com>.
+
 	* locales/as_IN: Use iso14651_t1 instead of local collation data.
 	Patch by Pravin Satpute <psatpute@redhat.com>.
 
diff --git a/localedata/locales/iso14651_t1_common b/localedata/locales/iso14651_t1_common
index edbe9e0f32..5dc39de9dc 100644
--- a/localedata/locales/iso14651_t1_common
+++ b/localedata/locales/iso14651_t1_common
@@ -65,6 +65,7 @@ script <GUJARATI>
 script <TELUGU>
 script <GURUMUKHI>
 script <KANNADA>
+script <TAMIL>
 script <SINHALA>
 script <MALAYALAM>
 script <BENGALI>
@@ -914,6 +915,87 @@ collating-symbol <k-halant>
 collating-symbol <k-lenght_mark>
 collating-symbol <k-ai_lenght_mark>
 #
+# <TAMIL>
+#
+collating-element <ta_split_o> from "<U0BC6><U0BBE>"
+collating-element <ta_split_oo> from "<U0BC7><U0BBE>"
+collating-element <ta_split_au> from "<U0BC6><U0BD7>"
+collating-element <tagl_KSHA> from "<U0B95><U0BCD><U0BB7>"
+collating-element <tagl_SHRI> from "<U0BB8><U0BCD><U0BB0><U0BC0>"
+# defining collating elements for sorting <consonant + virama> before <consonant>
+collating-element <pure-ta-k> from "<U0B95><U0BCD>" 
+collating-element <pure-ta-ng> from "<U0B99><U0BCD>"
+collating-element <pure-ta-c> from "<U0B9A><U0BCD>"
+collating-element <pure-ta-j> from "<U0B9C><U0BCD>"
+collating-element <pure-ta-ny> from "<U0B9E><U0BCD>"
+collating-element <pure-ta-tt> from "<U0B9F><U0BCD>"
+collating-element <pure-ta-nn> from "<U0BA3><U0BCD>"
+collating-element <pure-ta-t> from "<U0BA4><U0BCD>"
+collating-element <pure-ta-n> from "<U0BA8><U0BCD>"
+collating-element <pure-ta-nnn> from "<U0BA9><U0BCD>"
+collating-element <pure-ta-p> from "<U0BAA><U0BCD>"
+collating-element <pure-ta-m> from "<U0BAE><U0BCD>"
+collating-element <pure-ta-y> from "<U0BAF><U0BCD>"
+collating-element <pure-ta-r> from "<U0BB0><U0BCD>"
+collating-element <pure-ta-rr> from "<U0BB1><U0BCD>"
+collating-element <pure-ta-l> from "<U0BB2><U0BCD>"
+collating-element <pure-ta-ll> from "<U0BB3><U0BCD>"
+collating-element <pure-ta-lll> from "<U0BB4><U0BCD>"
+collating-element <pure-ta-v> from "<U0BB5><U0BCD>"
+collating-element <pure-ta-sh> from "<U0BB6><U0BCD>"
+collating-element <pure-ta-ss> from "<U0BB7><U0BCD>"
+collating-element <pure-ta-s> from "<U0BB8><U0BCD>"
+collating-element <pure-ta-h> from "<U0BB9><U0BCD>"
+# defining symbols
+collating-symbol <ta-pulli> #virama
+collating-symbol <tavw-a>
+collating-symbol <tavw-aa>
+collating-symbol <tavw-i>
+collating-symbol <tavw-ii>
+collating-symbol <tavw-u>
+collating-symbol <tavw-uu>
+collating-symbol <tavw-e>
+collating-symbol <tavw-ee>
+collating-symbol <tavw-ai>
+collating-symbol <tavw-o>
+collating-symbol <tavw-oo>
+collating-symbol <tavw-au>
+collating-symbol <ta-aytham> #visarga
+collating-symbol <ta-k>
+collating-symbol <ta-ng>
+collating-symbol <ta-c>
+collating-symbol <ta-ny>
+collating-symbol <ta-tt>
+collating-symbol <ta-nn>
+collating-symbol <ta-t>
+collating-symbol <ta-n>
+collating-symbol <ta-p>
+collating-symbol <ta-m>
+collating-symbol <ta-y>
+collating-symbol <ta-r>
+collating-symbol <ta-l>
+collating-symbol <ta-v>
+collating-symbol <ta-zh>
+collating-symbol <ta-ll>
+collating-symbol <ta-rr>
+collating-symbol <ta-nnn>
+collating-symbol <ta-j>
+collating-symbol <ta-sh>
+collating-symbol <ta-ss>
+collating-symbol <ta-s>
+collating-symbol <ta-h>
+collating-symbol <tavs-aa>
+collating-symbol <tavs-i>
+collating-symbol <tavs-ii>
+collating-symbol <tavs-u>
+collating-symbol <tavs-uu>
+collating-symbol <tavs-e>
+collating-symbol <tavs-ee>
+collating-symbol <tavs-ai>
+collating-symbol <tavs-o>
+collating-symbol <tavs-oo>
+collating-symbol <tavs-au>
+#
 # <MALAYALAM>
 # mlvs-  denotes Malayalam vowel sign
 # mlvw- denotes Malayalam vowel
@@ -3546,6 +3628,58 @@ collating-symbol  <MMSTACK>
 <k-lenght_mark>
 <k-ai_lenght_mark>
 #
+#<TAMIL>
+#
+# collation weights in order
+<tavw-a>
+<tavw-aa>
+<tavw-i>
+<tavw-ii>
+<tavw-u>
+<tavw-uu>
+<tavw-e>
+<tavw-ee>
+<tavw-ai>
+<tavw-o>
+<tavw-oo>
+<tavw-au>
+<ta-aytham> #visarga
+<ta-k>
+<ta-ng>
+<ta-c>
+<ta-ny>
+<ta-tt>
+<ta-nn>
+<ta-t>
+<ta-n>
+<ta-p>
+<ta-m>
+<ta-y>
+<ta-r>
+<ta-l>
+<ta-v>
+<ta-zh>
+<ta-ll>
+<ta-rr>
+<ta-nnn>
+<ta-j>
+<ta-sh>
+<ta-ss>
+<ta-s>
+<ta-h>
+<ta-pulli> #virama
+<tavs-aa>
+<tavs-i>
+<tavs-ii>
+<tavs-u>
+<tavs-uu>
+<tavs-e>
+<tavs-ee>
+<tavs-ai>
+<tavs-o>
+<tavs-oo>
+<tavs-au>
+#
 # <MALAYALAM>
 #
 # collation weights in order
@@ -6123,6 +6257,93 @@ order_start  <KANNADA>;forward;forward;forward;forward,position
 <U0CD5> <k-lenght_mark>;<BAS>;<MIN>;IGNORE
 <U0CD6> <k-ai_lenght_mark>;<BAS>;<MIN>;IGNORE
 <U0CBC> IGNORE;<KNKT>;<MIN>;IGNORE
+order_start <TAMIL>;forward;forward;forward;forward,position
+<U0BE6> <0>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BE7> <1>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BE8> <2>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BE9> <3>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BEA> <4>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BEB> <5>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BEC> <6>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BED> <7>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BEE> <8>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0BEF> <9>;"<BAS><NUM>";"<MIN><MIN>";IGNORE
+<U0B85> <tavw-a>;<BAS>;<MIN>;IGNORE
+<U0B86> <tavw-aa>;<BAS>;<MIN>;IGNORE
+<U0B87> <tavw-i>;<BAS>;<MIN>;IGNORE
+<U0B88> <tavw-ii>;<BAS>;<MIN>;IGNORE
+<U0B89> <tavw-u>;<BAS>;<MIN>;IGNORE
+<U0B8A> <tavw-uu>;<BAS>;<MIN>;IGNORE
+<U0B8E> <tavw-e>;<BAS>;<MIN>;IGNORE
+<U0B8F> <tavw-ee>;<BAS>;<MIN>;IGNORE
+<U0B90> <tavw-ai>;<BAS>;<MIN>;IGNORE
+<U0B92> <tavw-o>;<BAS>;<MIN>;IGNORE
+<U0B93> <tavw-oo>;<BAS>;<MIN>;IGNORE
+<U0B94> <tavw-au>;<BAS>;<MIN>;IGNORE
+<U0B83> <ta-aytham>;<BAS>;<MIN>;IGNORE
+<pure-ta-k> <ta-k>;<BAS>;<MIN>;IGNORE
+<U0B95> "<ta-k><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-ng> <ta-ng>;<BAS>;<MIN>;IGNORE
+<U0B99> "<ta-ng><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-c> <ta-c>;<BAS>;<MIN>;IGNORE
+<U0B9A> "<ta-c><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-ny> <ta-ny>;<BAS>;<MIN>;IGNORE
+<U0B9E> "<ta-ny><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-tt> <ta-tt>;<BAS>;<MIN>;IGNORE
+<U0B9F> "<ta-tt><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-nn> <ta-nn>;<BAS>;<MIN>;IGNORE
+<U0BA3> "<ta-nn><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-t> <ta-t>;<BAS>;<MIN>;IGNORE
+<U0BA4> "<ta-t><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-n> <ta-n>;<BAS>;<MIN>;IGNORE
+<U0BA8> "<ta-n><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-p> <ta-p>;<BAS>;<MIN>;IGNORE
+<U0BAA> "<ta-p><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-m> <ta-m>;<BAS>;<MIN>;IGNORE
+<U0BAE> "<ta-m><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-y> <ta-y>;<BAS>;<MIN>;IGNORE
+<U0BAF> "<ta-y><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-r> <ta-r>;<BAS>;<MIN>;IGNORE
+<U0BB0> "<ta-r><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-l> <ta-l>;<BAS>;<MIN>;IGNORE
+<U0BB2> "<ta-l><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-v> <ta-v>;<BAS>;<MIN>;IGNORE
+<U0BB5> "<ta-v><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-lll> <ta-zh>;<BAS>;<MIN>;IGNORE
+<U0BB4> "<ta-zh><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-ll> <ta-ll>;<BAS>;<MIN>;IGNORE
+<U0BB3> "<ta-ll><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-rr> <ta-rr>;<BAS>;<MIN>;IGNORE
+<U0BB1> "<ta-rr><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-nnn> <ta-nnn>;<BAS>;<MIN>;IGNORE
+<U0BA9> "<ta-nnn><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-j> <ta-j>;<BAS>;<MIN>;IGNORE
+<U0B9C> "<ta-j><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-sh> <ta-sh>;<BAS>;<MIN>;IGNORE
+<U0BB6> "<ta-sh><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-ss> <ta-ss>;<BAS>;<MIN>;IGNORE
+<U0BB7> "<ta-ss><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-s> <ta-s>;<BAS>;<MIN>;IGNORE
+<U0BB8> "<ta-s><tavw-a>";<BAS>;<MIN>;IGNORE
+<pure-ta-h> <ta-h>;<BAS>;<MIN>;IGNORE
+<U0BB9> "<ta-h><tavw-a>";<BAS>;<MIN>;IGNORE
+<tagl_KSHA> "<U0B95><U0BCD><U0BB7>";<BAS>;<MIN>;IGNORE
+<U0BCD> <ta-pulli>;<BAS>;<MIN>;IGNORE
+<U0BBE> <tavs-aa>;<BAS>;<MIN>;IGNORE
+<U0BBF> <tavs-i>;<BAS>;<MIN>;IGNORE
+<U0BC0> <tavs-ii>;<BAS>;<MIN>;IGNORE
+<U0BC1> <tavs-u>;<BAS>;<MIN>;IGNORE
+<U0BC2> <tavs-uu>;<BAS>;<MIN>;IGNORE
+<U0BC6> <tavs-e>;<BAS>;<MIN>;IGNORE
+<U0BC7> <tavs-ee>;<BAS>;<MIN>;IGNORE
+<U0BC8> <tavs-ai>;<BAS>;<MIN>;IGNORE
+<U0BCA> <tavs-o>;<BAS>;<MIN>;IGNORE
+<U0BCB> <tavs-oo>;<BAS>;<MIN>;IGNORE
+<U0BCC> <tavs-au>;<BAS>;<MIN>;IGNORE
+<tagl_SHRI> "<U0BB6><U0BCD><U0BB0><U0BC0>";<BAS>;<MIN>;IGNORE
+<ta_split_o> <tavs-o>;<BAS>;<MIN>;IGNORE
+<ta_split_oo> <tavs-oo>;<BAS>;<MIN>;IGNORE
+<ta_split_au> <tavs-au>;<BAS>;<MIN>;IGNORE
 
 order_start <SINHALA>;forward;forward;forward;forward,position
 # SCCII Part 1 : Collation Sequence (SLS1134)
diff --git a/localedata/locales/ta_IN b/localedata/locales/ta_IN
index 51a4fff35f..68bcf4ab85 100644
--- a/localedata/locales/ta_IN
+++ b/localedata/locales/ta_IN
@@ -63,100 +63,7 @@ LC_COLLATE
 
 % Copy the template from ISO/IEC 14651
 copy "iso14651_t1"
-% Tamil Collation Order as defined in The Madras Tamil Lexicon
-% Ref: http://www.uni-koeln.de/phil-fak/indologie/tamil/otl.html
-% Contact: T. Vaseehran <t_vasee@yahoo.com>
-% Last Updated:  Feb. 12, 2004
-% ChangeLog:
-%  - Added split forms of o, oo, au
-%  - Moved Tamil Symbols above numbers
-%  - Added TAMIL LETTER SHA (U0BB6)
-%    Ref: http://wwwold.dkuug.dk/JTC1/SC2/WG2/docs/n2617
-%       : http://wwwold.dkuug.dk/JTC1/SC2/WG2/docs/n2618
-% Initial version: Feb. 10, 2004.
 
-collating-element <split_o> from "<U0BC6><U0BBE>"
-collating-element <split_oo> from "<U0BC7><U0BBE>"
-collating-element <split_au> from "<U0BC6><U0BD7>"
-collating-element <tagl_KSHA> from "<U0B95><U0BCD><U0BB7>"
-collating-element <tagl_SHRI> from "<U0BB8><U0BCD><U0BB0><U0BC0>"
-
-reorder-after <U00DE>
-<U0BF3> % TAMIL SIGN DAY
-<U0BF4> % TAMIL SIGN MONTH
-<U0BF5> % TAMIL SIGN YEAR
-<U0BF6> % TAMIL SIGN DEBIT
-<U0BF7> % TAMIL SIGN CREDIT
-<U0BF8> % TAMIL SIGN AS ABOVE
-<U0BF9> % TAMIL SIGN RUPEE
-<U0BE6> % TAMIL DIGIT ZERO
-<U0BE7> % TAMIL DIGIT ONE
-<U0BE8> % TAMIL DIGIT TWO
-<U0BE9> % TAMIL DIGIT THREE
-<U0BEA> % TAMIL DIGIT FOUR
-<U0BEB> % TAMIL DIGIT FIVE
-<U0BEC> % TAMIL DIGIT SIX
-<U0BED> % TAMIL DIGIT SEVEN
-<U0BEE> % TAMIL DIGIT EIGHT
-<U0BEF> % TAMIL DIGIT NINE
-<U0BF0> % TAMIL NUMBER TEN
-<U0BF1> % TAMIL NUMBER ONE HUNDRED
-<U0BF2> % TAMIL NUMBER ONE THOUSAND
-<U0B85> % TAMIL LETTER A
-<U0B86> % TAMIL LETTER AA
-<U0B87> % TAMIL LETTER I
-<U0B88> % TAMIL LETTER II
-<U0B89> % TAMIL LETTER U
-<U0B8A> % TAMIL LETTER UU
-<U0B8E> % TAMIL LETTER E
-<U0B8F> % TAMIL LETTER EE
-<U0B90> % TAMIL LETTER AI
-<U0B92> % TAMIL LETTER O
-<U0B93> % TAMIL LETTER OO
-<U0B94> % TAMIL LETTER AU
-<U0B83> % TAMIL SIGN VISARGA (AYTHAM)
-<U0B95> % TAMIL LETTER K
-<U0B99> % TAMIL LETTER NG
-<U0B9A> % TAMIL LETTER C
-<U0B9E> % TAMIL LETTER NY
-<U0B9F> % TAMIL LETTER TT
-<U0BA3> % TAMIL LETTER NNN
-<U0BA4> % TAMIL LETTER T
-<U0BA8> % TAMIL LETTER N
-<U0BAA> % TAMIL LETTER P
-<U0BAE> % TAMIL LETTER M
-<U0BAF> % TAMIL LETTER Y
-<U0BB0> % TAMIL LETTER R
-<U0BB2> % TAMIL LETTER L
-<U0BB5> % TAMIL LETTER V
-<U0BB4> % TAMIL LETTER LLL
-<U0BB3> % TAMIL LETTER LL
-<U0BB1> % TAMIL LETTER RR
-<U0BA9> % TAMIL LETTER NN
-<U0B9C> % TAMIL LETTER JA
-<U0BB6> % TAMIL LETTER SHA
-<U0BB7> % TAMIL LETTER SSA
-<U0BB8> % TAMIL LETTER SA
-<U0BB9> % TAMIL LETTER HA
-<tagl_KSHA>
-<U0BCD> % TAMIL SIGN VIRAMA (PULLI)
-<U0BBE> % TAMIL VOWEL SIGN AA
-<U0BBF> % TAMIL VOWEL SIGN I
-<U0BC0> % TAMIL VOWEL SIGN II
-<U0BC1> % TAMIL VOWEL SIGN U
-<U0BC2> % TAMIL VOWEL SIGN UU
-<U0BC6> % TAMIL VOWEL SIGN E
-<U0BC7> % TAMIL VOWEL SIGN EE
-<U0BC8> % TAMIL VOWEL SIGN AI
-<U0BCA> % TAMIL VOWEL SIGN O
-<U0BCB> % TAMIL VOWEL SIGN OO
-<U0BCC> % TAMIL VOWEL SIGN AU
-<U0BD7> % TAMIL AU LENGTH MARK
-<tagl_SHRI> "<U0BB6><U0BCD><U0BB0><U0BC0>"
-<split_o>  <U0BCA>
-<split_oo> <U0BCB>
-<split_au> <U0BCC>
-reorder-end
 END LC_COLLATE