summary refs log tree commit diff
path: root/iconvdata/TESTS
blob: 8d6df22432825d26389893dbb98fdbd6160d8959 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
# Available tests for iconv(1) (and therefore iconv(3)) in GNU libc.
# Copyright (C) 1998-2002 Free Software Foundation, Inc.
# This file is part of the GNU C Library.
# Contributed by Ulrich Drepper <drepper@cygnus.com>, 1998.
#

# The GNU C Library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.

# The GNU C Library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# Lesser General Public License for more details.

# You should have received a copy of the GNU Lesser General Public
# License along with the GNU C Library; if not, write to the Free
# Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
# 02111-1307 USA.

# Each line consists of at least four entries:
# 1.  input file name.
# 2.  output file name; this is different from the input file name only for
#     conversions which do not produce the same output when the transformation
#     is applied back and forth.
# 3.  Y or N, depending on whether or not the character set contains ASCII
#     as a subset.
# 4.
# ...
# N.  target coded character sets (one or more per line).

ISO-8859-1		ISO-8859-1		Y	UTF8
ISO-8859-2		ISO-8859-2		Y	UCS4 UTF8
ISO-8859-3		ISO-8859-3		Y	UTF8
ISO-8859-4		ISO-8859-4		Y	UTF8
ISO-8859-5		ISO-8859-5		Y	UTF8
ISO-8859-6		ISO-8859-6		Y	UTF8
ISO-8859-7		ISO-8859-7		Y	UTF8
ISO-8859-8		ISO-8859-8		Y	UTF8
ISO-8859-9		ISO-8859-9		Y	UTF8
ISO-8859-10		ISO-8859-10		Y	UCS-2BE UTF8
ISO-8859-14		ISO-8859-14		Y	UTF8
ISO-8859-15		ISO-8859-15		Y	UTF8
ANSI_X3.4-1968		ANSI_X3.4-1968		Y	UTF8
BS_4730			BS_4730			Y	UTF8
CSA_Z243.4-1985-1	CSA_Z243.4-1985-1	Y	UCS-2BE
CSA_Z243.4-1985-2	CSA_Z243.4-1985-2	Y	UCS4
DIN_66003		DIN_66003		Y	UTF8
DS_2089			DS_2089			Y	UTF8
ES			ES			Y	UTF8
ES2			ES2			Y	UTF8
GB_1988-80		GB_1988-80		Y	UTF8
IT			IT			Y	UTF8
JIS_C6220-1969-RO	JIS_C6220-1969-RO	Y	UTF8
JIS_C6229-1984-B	JIS_C6229-1984-B	Y	UTF8
JUS_I.B1.002		JUS_I.B1.002		Y	UTF8
KSC5636			KSC5636			Y	UTF8
MSZ_7795.3		MSZ_7795.3		Y	UTF8
NC_NC00-10		NC_NC00-10		Y	UTF8
NF_Z_62-010		NF_Z_62-010		Y	UTF8
NF_Z_62-010_1973	NF_Z_62-010_1973	Y	UTF8
NS_4551-1		NS_4551-1		Y	UTF8
NS_4551-2		NS_4551-2		Y	UTF8
PT			PT			Y	UTF8
PT2			PT2			Y	UTF8
SEN_850200_B		SEN_850200_B		Y	UTF8
SEN_850200_C		SEN_850200_C		Y	UTF8
KOI-8			KOI-8			Y	UTF8
KOI8-R			KOI8-R			Y	UTF8
CP1250			CP1250			Y	UTF8
CP1251			CP1251			Y	UTF8
CP1252			CP1252			Y	UTF8
CP1253			CP1253			Y	UTF8
CP1254			CP1254			Y	UTF8
# CP1255 and WINDOWS-1255 are two names for the same encoding. The first
# entry's test works with the charmap as well. The second entry tests
# character composition/decomposition.
CP1255			CP1255			Y	UTF8
WINDOWS-1255		WINDOWS-1255		N	UTF8
CP1256			CP1256			Y	UTF8
CP1257			CP1257			Y	UTF8
# CP1258 and WINDOWS-1258 are two names for the same encoding. The first
# entry's test works with the charmap as well. The second entry tests
# character composition/decomposition.
CP1258			CP1258			Y	UTF8
WINDOWS-1258		WINDOWS-1258		N	UTF8
ISO-2022-JP		ISO-2022-JP		N	UTF8
ISO-2022-JP-2		ISO-2022-JP-2		N	UTF8
ISO-2022-KR		ISO-2022-KR		N	UTF8
ISO-2022-CN		ISO-2022-CN		N	UTF8
ISO-2022-CN-EXT		ISO-2022-CN-EXT		N	UTF8
EUC-KR			EUC-KR			Y	UTF8
EUC-JP			EUC-JP			Y	UTF8
EUC-CN			EUC-CN			Y	UTF8
EUC-TW			EUC-TW			Y	UTF8
GBK			GBK			Y	UTF8
BIG5HKSCS		BIG5HKSCS		Y	UTF8
UTF-7			UTF-7			N	UTF8
IBM856			IBM856			N	UTF8
IBM922			IBM922			Y	UTF8
IBM930			IBM930			N	UTF8
IBM933			IBM933			N	UTF8
IBM935			IBM935			N	UTF8
IBM937			IBM937			N	UTF8
IBM939			IBM939			N	UTF8
IBM932			IBM932			Y	UTF8
IBM943			IBM943			Y	UTF8
IBM1046			IBM1046			Y	UTF8
IBM1124			IBM1124			Y	UTF8
IBM1129			IBM1129			Y	UTF8
IBM1160			IBM1160			N	UTF8
IBM1161			IBM1161			Y	UTF8
IBM1132			IBM1132			N	UTF8
IBM1133			IBM1133			Y	UTF8
IBM1162			IBM1162			Y	UTF8
IBM1163			IBM1163			Y	UTF8
IBM1164			IBM1164			N	UTF8
TCVN-5712		TCVN-5712		Y	UTF8
EUC-JISX0213		EUC-JISX0213		Y	UTF8
SHIFT_JISX0213		SHIFT_JISX0213		Y	UTF8
ISO-2022-JP-3		ISO-2022-JP-3		N	UTF8