blob: f58ec349221a2d3a6f8bbc05bbed79aead93d732 [file] [log] [blame]
kpriceef160682006-08-29 18:08:31 +00001<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
2<html lang="en-us" xml:lang="en-us">
syeshinbefd53e2005-07-27 18:16:40 +00003<head>
kpriceef160682006-08-29 18:08:31 +00004<meta content="text/html; charset=utf-8" http-equiv="Content-Type" />
kpriceb59c9f62008-04-02 21:24:37 +00005<meta name="copyright" content="Copyright (c) 2000, 2008 IBM Corporation and others. All rights reserved. This program and the accompanying materials are made available under the terms of the Eclipse Public License v1.0 which accompanies this distribution, and is available at http://www.eclipse.org/legal/epl-v10.html. Contributors: IBM Corporation - initial API and implementation" />
6<meta name="DC.rights.owner" content="(C) Copyright 2000, 2008" />
kpriceef160682006-08-29 18:08:31 +00007<meta content="public" name="security" />
8<meta content="index,follow" name="Robots" />
9<meta http-equiv="PICS-Label" content='(PICS-1.1 "http://www.icra.org/ratingsv02.html" l gen true r (cz 1 lz 1 nz 1 oz 1 vz 1) "http://www.rsac.org/ratingsv01.html" l gen true r (n 0 s 0 v 0 l 0) "http://www.classify.org/safesurf/" l gen true r (SS~~000 1))' />
10<meta content="concept" name="DC.Type" />
11<meta name="DC.Title" content="XML and HTML encodings" />
12<meta name="abstract" content="Encodings enable you to specify what character encoding your text is in." />
13<meta name="description" content="Encodings enable you to specify what character encoding your text is in." />
kpriceb59c9f62008-04-02 21:24:37 +000014<meta content="character encoding, text in files, encodings, supported character sets" name="DC.subject" />
15<meta content="character encoding, text in files, encodings, supported character sets" name="keywords" />
kpriceef160682006-08-29 18:08:31 +000016<meta content="XHTML" name="DC.Format" />
17<meta content="cxmlenc" name="DC.Identifier" />
18<meta content="en-us" name="DC.Language" />
19<link href="../../org.eclipse.wst.doc.user/common.css" type="text/css" rel="stylesheet" />
syeshinbefd53e2005-07-27 18:16:40 +000020<title>XML and HTML encodings</title>
syeshin66078272005-09-20 16:53:38 +000021</head>
syeshinbefd53e2005-07-27 18:16:40 +000022<body id="cxmlenc"><a name="cxmlenc"><!-- --></a>
23
kpriceef160682006-08-29 18:08:31 +000024
syeshinbefd53e2005-07-27 18:16:40 +000025<h1 class="topictitle1">XML and HTML encodings</h1>
kpriceef160682006-08-29 18:08:31 +000026
27
28
29
syeshind0bdb8e2005-10-27 17:44:14 +000030<div><p>Encodings enable you to specify what character encoding your text
31is in.</p>
kpriceef160682006-08-29 18:08:31 +000032
syeshind0bdb8e2005-10-27 17:44:14 +000033<p>The IANA name is used in the encoding declaration of an XML file, or in the charset
34directive of an HTML file.</p>
kpriceef160682006-08-29 18:08:31 +000035
syeshind0bdb8e2005-10-27 17:44:14 +000036<p>The HTML and XML editors support the following encodings:</p>
37
kpriceef160682006-08-29 18:08:31 +000038
39<div class="tablenoborder"><table summary="" cellspacing="0" cellpadding="4" frame="border" border="1" rules="all">
40<thead align="left">
41<tr>
kpriceb59c9f62008-04-02 21:24:37 +000042<th valign="top" class="firstcol" id="N1007C"> <p><strong>XML Encoding (IANA Name)</strong></p>
syeshinbefd53e2005-07-27 18:16:40 +000043 </th>
kpriceef160682006-08-29 18:08:31 +000044
kpriceb59c9f62008-04-02 21:24:37 +000045<th valign="top" id="N1008E"> <p><strong>Description</strong></p>
syeshinbefd53e2005-07-27 18:16:40 +000046 </th>
kpriceef160682006-08-29 18:08:31 +000047
syeshinbefd53e2005-07-27 18:16:40 +000048</tr>
kpriceef160682006-08-29 18:08:31 +000049
syeshinbefd53e2005-07-27 18:16:40 +000050</thead>
kpriceef160682006-08-29 18:08:31 +000051
52<tbody>
53<tr>
kpriceb59c9f62008-04-02 21:24:37 +000054<th valign="top" class="firstcol" id="N100AC" headers="N1007C "> <p>BIG5</p>
kpriceef160682006-08-29 18:08:31 +000055 </th>
56
kpriceb59c9f62008-04-02 21:24:37 +000057<td valign="top" headers="N100AC N1008E "> <p>Big5, Traditional Chinese</p>
syeshinbefd53e2005-07-27 18:16:40 +000058 </td>
kpriceef160682006-08-29 18:08:31 +000059
syeshinbefd53e2005-07-27 18:16:40 +000060</tr>
kpriceef160682006-08-29 18:08:31 +000061
62<tr>
kpriceb59c9f62008-04-02 21:24:37 +000063<th valign="top" class="firstcol" id="N100CC" headers="N1007C "> <p>EUC-JP</p>
kpriceef160682006-08-29 18:08:31 +000064 </th>
65
kpriceb59c9f62008-04-02 21:24:37 +000066<td valign="top" headers="N100CC N1008E "> <p>EUC encoding, Japanese</p>
syeshinbefd53e2005-07-27 18:16:40 +000067 </td>
kpriceef160682006-08-29 18:08:31 +000068
syeshinbefd53e2005-07-27 18:16:40 +000069</tr>
kpriceef160682006-08-29 18:08:31 +000070
71<tr>
kpriceb59c9f62008-04-02 21:24:37 +000072<th valign="top" class="firstcol" id="N100EC" headers="N1007C "> <p>EUC-KR</p>
kpriceef160682006-08-29 18:08:31 +000073 </th>
74
kpriceb59c9f62008-04-02 21:24:37 +000075<td valign="top" headers="N100EC N1008E "> <p>EUC encoding, Korean</p>
syeshinbefd53e2005-07-27 18:16:40 +000076 </td>
kpriceef160682006-08-29 18:08:31 +000077
syeshinbefd53e2005-07-27 18:16:40 +000078</tr>
kpriceef160682006-08-29 18:08:31 +000079
80<tr>
kpriceb59c9f62008-04-02 21:24:37 +000081<th valign="top" class="firstcol" id="N1010C" headers="N1007C ">GB18030</th>
82
83<td valign="top" headers="N1010C N1008E ">National Standard, Chinese</td>
84
85</tr>
86
87<tr>
88<th valign="top" class="firstcol" id="N10120" headers="N1007C "> <p>ISO-2022-JP</p>
kpriceef160682006-08-29 18:08:31 +000089 </th>
90
kpriceb59c9f62008-04-02 21:24:37 +000091<td valign="top" headers="N10120 N1008E "> <p>ISO 2022, Japanese</p>
syeshinbefd53e2005-07-27 18:16:40 +000092 </td>
kpriceef160682006-08-29 18:08:31 +000093
syeshinbefd53e2005-07-27 18:16:40 +000094</tr>
kpriceef160682006-08-29 18:08:31 +000095
96<tr>
kpriceb59c9f62008-04-02 21:24:37 +000097<th valign="top" class="firstcol" id="N10140" headers="N1007C "> <p>ISO-2022-KR</p>
kpriceef160682006-08-29 18:08:31 +000098 </th>
99
kpriceb59c9f62008-04-02 21:24:37 +0000100<td valign="top" headers="N10140 N1008E "> <p>ISO 2022, Korean</p>
syeshinbefd53e2005-07-27 18:16:40 +0000101 </td>
kpriceef160682006-08-29 18:08:31 +0000102
syeshinbefd53e2005-07-27 18:16:40 +0000103</tr>
kpriceef160682006-08-29 18:08:31 +0000104
105<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000106<th valign="top" class="firstcol" id="N10160" headers="N1007C "> <p>ISO-8859-1</p>
kpriceef160682006-08-29 18:08:31 +0000107 </th>
108
kpriceb59c9f62008-04-02 21:24:37 +0000109<td valign="top" headers="N10160 N1008E "> <p>ISO Latin-1</p>
syeshinbefd53e2005-07-27 18:16:40 +0000110 </td>
kpriceef160682006-08-29 18:08:31 +0000111
syeshinbefd53e2005-07-27 18:16:40 +0000112</tr>
kpriceef160682006-08-29 18:08:31 +0000113
114<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000115<th valign="top" class="firstcol" id="N10180" headers="N1007C ">ISO-8859-2</th>
116
117<td valign="top" headers="N10180 N1008E ">Central/East European (Slavic)</td>
118
119</tr>
120
121<tr>
122<th valign="top" class="firstcol" id="N10194" headers="N1007C ">ISO-8859-3</th>
123
124<td valign="top" headers="N10194 N1008E ">Southern European</td>
125
126</tr>
127
128<tr>
129<th valign="top" class="firstcol" id="N101A8" headers="N1007C ">ISO-8859-4</th>
130
131<td valign="top" headers="N101A8 N1008E ">ISO 8859-4, North European (Baltic)</td>
132
133</tr>
134
135<tr>
136<th valign="top" class="firstcol" id="N101BC" headers="N1007C ">ISO-8859-5</th>
137
138<td valign="top" headers="N101BC N1008E ">ISO 8859-5, Cyrillic</td>
139
140</tr>
141
142<tr>
143<th valign="top" class="firstcol" id="N101D0" headers="N1007C "> <p>ISO-8859-6</p>
kpriceef160682006-08-29 18:08:31 +0000144 </th>
145
kpriceb59c9f62008-04-02 21:24:37 +0000146<td valign="top" headers="N101D0 N1008E "> <p>Arabic (Logical)</p>
syeshinbefd53e2005-07-27 18:16:40 +0000147 </td>
kpriceef160682006-08-29 18:08:31 +0000148
syeshinbefd53e2005-07-27 18:16:40 +0000149</tr>
kpriceef160682006-08-29 18:08:31 +0000150
151<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000152<th valign="top" class="firstcol" id="N101F0" headers="N1007C ">ISO-8859-7</th>
kpriceef160682006-08-29 18:08:31 +0000153
kpriceb59c9f62008-04-02 21:24:37 +0000154<td valign="top" headers="N101F0 N1008E ">Greek</td>
kpriceef160682006-08-29 18:08:31 +0000155
syeshinbefd53e2005-07-27 18:16:40 +0000156</tr>
kpriceef160682006-08-29 18:08:31 +0000157
158<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000159<th valign="top" class="firstcol" id="N10204" headers="N1007C "> <p>ISO-8859-8</p>
kpriceef160682006-08-29 18:08:31 +0000160 </th>
161
kpriceb59c9f62008-04-02 21:24:37 +0000162<td valign="top" headers="N10204 N1008E "> <p>Hebrew (Visual). This encoding is supported, but not by the Page
kpriceef160682006-08-29 18:08:31 +0000163Designer Design page.</p>
syeshinbefd53e2005-07-27 18:16:40 +0000164 </td>
kpriceef160682006-08-29 18:08:31 +0000165
syeshinbefd53e2005-07-27 18:16:40 +0000166</tr>
kpriceef160682006-08-29 18:08:31 +0000167
168<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000169<th valign="top" class="firstcol" id="N10224" headers="N1007C ">ISO-8859-9</th>
kpriceef160682006-08-29 18:08:31 +0000170
kpriceb59c9f62008-04-02 21:24:37 +0000171<td valign="top" headers="N10224 N1008E ">Turkish</td>
kpriceef160682006-08-29 18:08:31 +0000172
syeshinbefd53e2005-07-27 18:16:40 +0000173</tr>
kpriceef160682006-08-29 18:08:31 +0000174
175<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000176<th valign="top" class="firstcol" id="N10238" headers="N1007C "> <p>SHIFT_JIS</p>
kpriceef160682006-08-29 18:08:31 +0000177 </th>
178
kpriceb59c9f62008-04-02 21:24:37 +0000179<td valign="top" headers="N10238 N1008E "> <p>Shift-JIS, Japanese</p>
syeshinbefd53e2005-07-27 18:16:40 +0000180 </td>
kpriceef160682006-08-29 18:08:31 +0000181
syeshinbefd53e2005-07-27 18:16:40 +0000182</tr>
kpriceef160682006-08-29 18:08:31 +0000183
184<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000185<th valign="top" class="firstcol" id="N10258" headers="N1007C ">TIS-620</th>
kpriceef160682006-08-29 18:08:31 +0000186
kpriceb59c9f62008-04-02 21:24:37 +0000187<td valign="top" headers="N10258 N1008E ">TISI, Thai</td>
kpriceef160682006-08-29 18:08:31 +0000188
syeshinbefd53e2005-07-27 18:16:40 +0000189</tr>
kpriceef160682006-08-29 18:08:31 +0000190
191<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000192<th valign="top" class="firstcol" id="N1026C" headers="N1007C "> <p>US-ASCII</p>
kpriceef160682006-08-29 18:08:31 +0000193 </th>
194
kpriceb59c9f62008-04-02 21:24:37 +0000195<td valign="top" headers="N1026C N1008E "> <p>US ASCII</p>
syeshinbefd53e2005-07-27 18:16:40 +0000196 </td>
kpriceef160682006-08-29 18:08:31 +0000197
syeshinbefd53e2005-07-27 18:16:40 +0000198</tr>
kpriceef160682006-08-29 18:08:31 +0000199
200<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000201<th valign="top" class="firstcol" id="N1028C" headers="N1007C "> <p>UTF-8</p>
kpriceef160682006-08-29 18:08:31 +0000202 </th>
203
kpriceb59c9f62008-04-02 21:24:37 +0000204<td valign="top" headers="N1028C N1008E "> <p>ISO 10646/Unicode, variable-length (one- to four-byte) encoding</p>
syeshinbefd53e2005-07-27 18:16:40 +0000205 </td>
kpriceef160682006-08-29 18:08:31 +0000206
syeshinbefd53e2005-07-27 18:16:40 +0000207</tr>
kpriceef160682006-08-29 18:08:31 +0000208
209<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000210<th valign="top" class="firstcol" id="N102AC" headers="N1007C "> <p>UTF-16</p>
kpriceef160682006-08-29 18:08:31 +0000211 </th>
212
kpriceb59c9f62008-04-02 21:24:37 +0000213<td valign="top" headers="N102AC N1008E "> <p>ISO 10646/Unicode, two- or four-byte encoding</p>
syeshinbefd53e2005-07-27 18:16:40 +0000214 </td>
kpriceef160682006-08-29 18:08:31 +0000215
syeshinbefd53e2005-07-27 18:16:40 +0000216</tr>
kpriceef160682006-08-29 18:08:31 +0000217
218<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000219<th valign="top" class="firstcol" id="N102CC" headers="N1007C "> <p>UTF-16BE</p>
kpriceef160682006-08-29 18:08:31 +0000220 </th>
221
kpriceb59c9f62008-04-02 21:24:37 +0000222<td valign="top" headers="N102CC N1008E "> <p>Unicode BigEndian</p>
syeshinbefd53e2005-07-27 18:16:40 +0000223 </td>
kpriceef160682006-08-29 18:08:31 +0000224
syeshinbefd53e2005-07-27 18:16:40 +0000225</tr>
kpriceef160682006-08-29 18:08:31 +0000226
227<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000228<th valign="top" class="firstcol" id="N102EC" headers="N1007C "> <p>UTF-16LE</p>
kpriceef160682006-08-29 18:08:31 +0000229 </th>
230
kpriceb59c9f62008-04-02 21:24:37 +0000231<td valign="top" headers="N102EC N1008E "> <p>Unicode LittleEndian</p>
syeshinbefd53e2005-07-27 18:16:40 +0000232 </td>
kpriceef160682006-08-29 18:08:31 +0000233
syeshinbefd53e2005-07-27 18:16:40 +0000234</tr>
kpriceef160682006-08-29 18:08:31 +0000235
236<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000237<th valign="top" class="firstcol" id="N1030C" headers="N1007C "><p>WINDOWS-31J</p>
238</th>
kpriceef160682006-08-29 18:08:31 +0000239
kpriceb59c9f62008-04-02 21:24:37 +0000240<td valign="top" headers="N1030C N1008E "><p>Japanese, Windows-31J</p>
241</td>
kpriceef160682006-08-29 18:08:31 +0000242
syeshinbefd53e2005-07-27 18:16:40 +0000243</tr>
kpriceef160682006-08-29 18:08:31 +0000244
245<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000246<th valign="top" class="firstcol" id="N10328" headers="N1007C "> <p>WINDOWS-1255</p>
kpriceef160682006-08-29 18:08:31 +0000247 </th>
248
kpriceb59c9f62008-04-02 21:24:37 +0000249<td valign="top" headers="N10328 N1008E "> <p>Hebrew</p>
syeshinbefd53e2005-07-27 18:16:40 +0000250 </td>
kpriceef160682006-08-29 18:08:31 +0000251
syeshinbefd53e2005-07-27 18:16:40 +0000252</tr>
kpriceef160682006-08-29 18:08:31 +0000253
254<tr>
kpriceb59c9f62008-04-02 21:24:37 +0000255<th valign="top" class="firstcol" id="N10348" headers="N1007C "> <p>WINDOWS-1256</p>
kpriceef160682006-08-29 18:08:31 +0000256 </th>
257
kpriceb59c9f62008-04-02 21:24:37 +0000258<td valign="top" headers="N10348 N1008E "> <p>Arabic</p>
syeshinbefd53e2005-07-27 18:16:40 +0000259 </td>
kpriceef160682006-08-29 18:08:31 +0000260
261</tr>
262
syeshinbefd53e2005-07-27 18:16:40 +0000263</tbody>
kpriceef160682006-08-29 18:08:31 +0000264
syeshinbefd53e2005-07-27 18:16:40 +0000265</table>
266</div>
kpriceef160682006-08-29 18:08:31 +0000267
syeshinbefd53e2005-07-27 18:16:40 +0000268</div>
kpriceef160682006-08-29 18:08:31 +0000269
270<div />
271
syeshinbefd53e2005-07-27 18:16:40 +0000272</body>
273</html>