blob: ee7563a92cb501e081c5dcf2bc0a55d17f8ee923 [file] [log] [blame]
<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html
PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html>
<head>
<!-- /*******************************************************************************
* Copyright (c) 2000, 2005 IBM Corporation and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/legal/epl-v10.html
*
* Contributors:
* IBM Corporation - initial API and implementation
*******************************************************************************/ -->
<link rel="stylesheet" type="text/css" href="../../org.eclipse.wst.doc.user/common.css" />
<title>XML and HTML encodings</title>
</head>
<body id="cxmlenc"><a name="cxmlenc"><!-- --></a>
<h1 class="topictitle1">XML and HTML encodings</h1>
<div><p>Encodings enable you to specify what character encoding your text
is in.</p>
<p>The IANA name is used in the encoding statement of an XML file, or charset
directive in an HTML file.</p>
<p>The HTML and XML editors support the following encodings:</p>
<div class="tablenoborder"><table cellpadding="4" cellspacing="0" summary="" frame="border" border="1" rules="all"><thead align="left"><tr><th valign="top" class="firstcol" id="d0e20"> <p><strong>XML Encoding (IANA Name)</strong></p>
</th>
<th valign="top" id="d0e26"> <p><b>Description</b></p>
</th>
</tr>
</thead>
<tbody><tr><td valign="top" class="firstcol" id="d0e34" headers="d0e20 "> <p>BIG5</p>
</td>
<td valign="top" headers="d0e34 d0e26 "> <p>Big5, Traditional Chinese</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e45" headers="d0e20 "> <p>EUC-JP</p>
</td>
<td valign="top" headers="d0e45 d0e26 "> <p>EUC encoding, Japanese</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e56" headers="d0e20 "> <p>EUC-KR</p>
</td>
<td valign="top" headers="d0e56 d0e26 "> <p>EUC encoding, Korean</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e67" headers="d0e20 "> <p>GB2312</p>
</td>
<td valign="top" headers="d0e67 d0e26 "> <p>GBK, Simplified Chinese</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e78" headers="d0e20 ">GB18030</td>
<td valign="top" headers="d0e78 d0e26 ">National Standard, Chinese</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e83" headers="d0e20 ">IBM864</td>
<td valign="top" headers="d0e83 d0e26 ">PC Arabic
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e88" headers="d0e20 "> <p>ISO-2022-JP</p>
</td>
<td valign="top" headers="d0e88 d0e26 "> <p>ISO 2022, Japanese</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e99" headers="d0e20 "> <p>ISO-2022-KR</p>
</td>
<td valign="top" headers="d0e99 d0e26 "> <p>ISO 2022, Korean</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e110" headers="d0e20 "> <p>ISO-8859-1</p>
</td>
<td valign="top" headers="d0e110 d0e26 "> <p>ISO Latin-1</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e121" headers="d0e20 ">ISO-8859-2</td>
<td valign="top" headers="d0e121 d0e26 ">Central/East European (Slavic)</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e126" headers="d0e20 ">ISO-8859-3</td>
<td valign="top" headers="d0e126 d0e26 ">Southern European</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e131" headers="d0e20 ">ISO-8859-4</td>
<td valign="top" headers="d0e131 d0e26 ">ISO 8859-4, North European (Baltic)</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e136" headers="d0e20 ">ISO-8859-5</td>
<td valign="top" headers="d0e136 d0e26 ">ISO 8859-5, Cyrillic</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e141" headers="d0e20 "> <p>ISO-8859-6</p>
</td>
<td valign="top" headers="d0e141 d0e26 ">Arabic (Logical)</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e152" headers="d0e20 ">ISO-8859-7</td>
<td valign="top" headers="d0e152 d0e26 ">Greek</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e157" headers="d0e20 "> <p>ISO-8859-8-I</p>
</td>
<td valign="top" headers="d0e157 d0e26 "> <p>Hebrew (Logical)</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e168" headers="d0e20 "> <p>ISO-8859-8</p>
</td>
<td valign="top" headers="d0e168 d0e26 "> <p>Hebrew (Visual)</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e179" headers="d0e20 ">ISO-8859-9</td>
<td valign="top" headers="d0e179 d0e26 ">Turkish</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e184" headers="d0e20 "> <p>SHIFT_JIS</p>
</td>
<td valign="top" headers="d0e184 d0e26 "> <p>Shift-JIS, Japanese</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e195" headers="d0e20 ">TIS-620</td>
<td valign="top" headers="d0e195 d0e26 ">TISI, Thai</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e200" headers="d0e20 "> <p>US-ASCII</p>
</td>
<td valign="top" headers="d0e200 d0e26 "> <p>US ASCII</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e211" headers="d0e20 "> <p>UTF-8</p>
</td>
<td valign="top" headers="d0e211 d0e26 "> <p>ISO 10646/Unicode, variable-length encoding (8-bit code units)</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e222" headers="d0e20 "> <p>UTF-16</p>
</td>
<td valign="top" headers="d0e222 d0e26 "> <p>ISO 10646/Unicode, 16-bit code unit encoding</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e233" headers="d0e20 "> <p>UTF-16BE</p>
</td>
<td valign="top" headers="d0e233 d0e26 "> <p>Unicode BigEndian</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e244" headers="d0e20 "> <p>UTF-16LE</p>
</td>
<td valign="top" headers="d0e244 d0e26 "> <p>Unicode LittleEndian</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e255" headers="d0e20 ">WINDOWS-874</td>
<td valign="top" headers="d0e255 d0e26 ">Thai, Microsoft<sup>®</sup></td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e262" headers="d0e20 "> <p>WINDOWS-1252</p>
</td>
<td valign="top" headers="d0e262 d0e26 "> <p>ISO Latin-1</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e273" headers="d0e20 "> <p>WINDOWS-1255</p>
</td>
<td valign="top" headers="d0e273 d0e26 "> <p>Hebrew</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e284" headers="d0e20 "> <p>WINDOWS-1256</p>
</td>
<td valign="top" headers="d0e284 d0e26 "> <p>Arabic</p>
</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e295" headers="d0e20 ">X-EUC-JP</td>
<td valign="top" headers="d0e295 d0e26 ">EUC encoding, Japanese (alias for EUC-JP)</td>
</tr>
<tr><td valign="top" class="firstcol" id="d0e300" headers="d0e20 ">X-SJIS</td>
<td valign="top" headers="d0e300 d0e26 ">Shift-JIS, Japanese (alias for SHIFT_JIS)</td>
</tr>
</tbody>
</table>
</div>
</div>
</body>
</html>