<?xml version="1.0" encoding="utf-8"?> | |
<!--Arbortext, Inc., 1988-2005, v.4002--> | |
<!DOCTYPE concept PUBLIC "-//OASIS//DTD DITA Concept//EN" "concept.dtd"> | |
<?Pub Inc?> | |
<concept id="cxmlenc" xml:lang="en-us"> | |
<title>XML and HTML encodings</title> | |
<titlealts> | |
<searchtitle>XML and HTML encodings</searchtitle> | |
</titlealts> | |
<shortdesc>An encoding setting identifies the character encoding in which your | |
text is stored.</shortdesc> | |
<prolog><metadata> | |
<keywords><indexterm>character encoding<indexterm>text in files</indexterm></indexterm> | |
<indexterm>encodings<indexterm>supported character sets</indexterm></indexterm> | |
</keywords> | |
</metadata></prolog> | |
<conbody> | |
<p>The IANA name is used in the encoding declaration of an XML file, or in the | |
charset directive of an HTML file.</p> | |
<p>The HTML and XML editors support the following encodings:</p> | |
<table rowheader="firstcol"> | |
<tgroup cols="2"><colspec colname="COLSPEC0"/><colspec colname="COLSPEC1"/> | |
<thead> | |
<row> | |
<entry colname="COLSPEC0" valign="top"> <p><b>XML Encoding (IANA Name)</b></p> </entry> | |
<entry colname="COLSPEC1" valign="top"> <p><b>Description</b></p> </entry> | |
</row> | |
</thead> | |
<tbody> | |
<row> | |
<entry> <p>BIG5</p> </entry> | |
<entry> <p>Big5, Traditional Chinese</p> </entry> | |
</row> | |
<row> | |
<entry> <p>EUC-JP</p> </entry> | |
<entry> <p>EUC encoding, Japanese</p> </entry> | |
</row> | |
<row> | |
<entry> <p>EUC-KR</p> </entry> | |
<entry> <p>EUC encoding, Korean</p> </entry> | |
</row> | |
<row> | |
<entry> <p>GB2312</p> </entry> | |
<entry> <p>GBK, Simplified Chinese</p> </entry> | |
</row> | |
<row> | |
<entry>GB18030</entry> | |
<entry>National Standard, Chinese</entry> | |
</row> | |
<row> | |
<entry>IBM864</entry> | |
<entry>PC Arabic (encoding not supported by the Page Designer Design page)</entry> | |
</row> | |
<row> | |
<entry> <p>ISO-2022-JP</p> </entry> | |
<entry> <p>ISO 2022, Japanese</p> </entry> | |
</row> | |
<row> | |
<entry> <p>ISO-2022-KR</p> </entry> | |
<entry> <p>ISO 2022, Korean</p> </entry> | |
</row> | |
<row> | |
<entry> <p>ISO-8859-1</p> </entry> | |
<entry> <p>ISO Latin-1</p> </entry> | |
</row> | |
<row> | |
<entry>ISO-8859-2</entry> | |
<entry>Central/East European (Slavic)</entry> | |
</row> | |
<row> | |
<entry>ISO-8859-3</entry> | |
<entry>Southern European</entry> | |
</row> | |
<row> | |
<entry>ISO-8859-4</entry> | |
<entry>ISO 8859-4, Baltic (Latin-4)</entry> | |
</row> | |
<row> | |
<entry>ISO-8859-5</entry> | |
<entry>ISO 8859-5, Cyrillic</entry> | |
</row> | |
<row> | |
<entry> <p>ISO-8859-6</p> </entry> | |
<entry> <p>Arabic (Logical)</p> </entry> | |
</row> | |
<row> | |
<entry>ISO-8859-7</entry> | |
<entry>Greek</entry> | |
</row> | |
<row> | |
<entry> <p>ISO-8859-8-I</p> </entry> | |
<entry> <p>Hebrew (Logical)</p> </entry> | |
</row> | |
<row> | |
<entry> <p>ISO-8859-8</p> </entry> | |
<entry> <p>Hebrew (Visual) (encoding supported, but not supported by the Page | |
Designer Design page)</p> </entry> | |
</row> | |
<row> | |
<entry>ISO-8859-9</entry> | |
<entry>Turkish</entry> | |
</row> | |
<row> | |
<entry> <p>SHIFT_JIS</p> </entry> | |
<entry> <p>Shift-JIS, Japanese</p> </entry> | |
</row> | |
<row> | |
<entry>TIS-620</entry> | |
<entry>TISI, Thai</entry> | |
</row> | |
<row> | |
<entry> <p>US-ASCII</p> </entry> | |
<entry> <p>US ASCII</p> </entry> | |
</row> | |
<row> | |
<entry> <p>UTF-8</p> </entry> | |
<entry> <p>ISO 10646/Unicode, variable-width encoding (8-bit code units)</p> </entry> | |
</row> | |
<row> | |
<entry> <p>UTF-16</p> </entry> | |
<entry> <p>ISO 10646/Unicode, variable-width encoding (16-bit code units)</p> </entry> | |
</row> | |
<row> | |
<entry> <p>UTF-16BE</p> </entry> | |
<entry> <p>Unicode BigEndian</p> </entry> | |
</row> | |
<row> | |
<entry> <p>UTF-16LE</p> </entry> | |
<entry> <p>Unicode LittleEndian</p> </entry> | |
</row> | |
<row> | |
<entry>WINDOWS-874</entry> | |
<entry>Thai, <tm tmclass="special" tmowner="Microsoft Corporation" tmtype="reg" | |
trademark="Microsoft">Microsoft</tm></entry> | |
</row> | |
<row> | |
<entry> <p>WINDOWS-1252</p> </entry> | |
<entry> <p>Windows Latin-1 (superset of ISO Latin-1)</p> </entry> | |
</row> | |
<row> | |
<entry> <p>WINDOWS-1255</p> </entry> | |
<entry> <p>Hebrew</p> </entry> | |
</row> | |
<row> | |
<entry> <p>WINDOWS-1256</p> </entry> | |
<entry> <p>Arabic</p> </entry> | |
</row> | |
<row> | |
<entry>X-EUC-JP</entry> | |
<entry>EUC encoding, Japanese (alias for EUC-JP)</entry> | |
</row> | |
<row> | |
<entry>X-SJIS</entry> | |
<entry>Shift-JIS, Japanese (alias for SHIFT_JIS)</entry> | |
</row> | |
</tbody> | |
</tgroup> | |
</table> | |
</conbody> | |
</concept> | |
<?Pub *0000003991?> |