<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html lang="en-us" xml:lang="en-us">
<head>
<meta content="text/html; charset=utf-8" http-equiv="Content-Type" />
<meta name="copyright" content="Copyright (c) 2000, 2006 IBM Corporation and others. All rights reserved. This program and the accompanying materials are made available under the terms of the Eclipse Public License v1.0 which accompanies this distribution, and is available at http://www.eclipse.org/legal/epl-v10.html. Contributors: IBM Corporation - initial API and implementation" />
<meta name="DC.rights.owner" content="(C) Copyright 2000, 2006" />
<meta content="public" name="security" />
<meta content="index,follow" name="Robots" />
<meta http-equiv="PICS-Label" content='(PICS-1.1 "http://www.icra.org/ratingsv02.html" l gen true r (cz 1 lz 1 nz 1 oz 1 vz 1) "http://www.rsac.org/ratingsv01.html" l gen true r (n 0 s 0 v 0 l 0) "http://www.classify.org/safesurf/" l gen true r (SS~~000 1))' />
<meta content="concept" name="DC.Type" />
<meta name="DC.Title" content="XML and HTML encodings" />
<meta name="abstract" content="Encodings enable you to specify what character encoding your text is in." />
<meta name="description" content="Encodings enable you to specify what character encoding your text is in." />
<meta content="Encodings, HTML, XML" name="DC.subject" />
<meta content="Encodings, HTML, XML" name="keywords" />
<meta content="XHTML" name="DC.Format" />
<meta content="cxmlenc" name="DC.Identifier" />
<meta content="en-us" name="DC.Language" />
<link href="../../org.eclipse.wst.doc.user/common.css" type="text/css" rel="stylesheet" />
<title>XML and HTML encodings</title>
</head>
<body id="cxmlenc"><a name="cxmlenc"><!-- --></a>


<h1 class="topictitle1">XML and HTML encodings</h1>




<div><p>Encodings enable you to specify what character encoding your text
is in.</p>

<p>The IANA name is used in the encoding declaration of an XML file, or in the
charset directive of an HTML file.</p>

<p>The HTML and XML editors support the following encodings:</p>


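<div class="tablenoborder"><table summary="Character encodings supported by the HTML and XML editors, listed by IANA name with a description of each" cellspacing="0" cellpadding="4" frame="border" border="1" rules="all">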
<thead align="left">
<tr>
<th valign="top" class="firstcol" id="N1007B"> <p><strong>XML Encoding (IANA Name)</strong></p>
 </th>

<th valign="top" id="N1008D"> <p><strong>Description</strong></p>
 </th>

</tr>

</thead>

<tbody>
<tr>
<th valign="top" class="firstcol" id="N100AB" headers="N1007B "> <p>BIG5</p>
 </th>

<td valign="top" headers="N100AB N1008D "> <p>Big5, Traditional Chinese</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N100CB" headers="N1007B "> <p>EUC-JP</p>
 </th>

<td valign="top" headers="N100CB N1008D "> <p>EUC encoding, Japanese</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N100EB" headers="N1007B "> <p>EUC-KR</p>
 </th>

<td valign="top" headers="N100EB N1008D "> <p>EUC encoding, Korean</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1010B" headers="N1007B "> <p>GB2312</p>
 </th>

<td valign="top" headers="N1010B N1008D "> <p>GBK, Simplified Chinese</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1012B" headers="N1007B ">GB18030</th>

<td valign="top" headers="N1012B N1008D ">National Standard, Chinese</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1013F" headers="N1007B ">IBM864</th>

<td valign="top" headers="N1013F N1008D ">PC Arabic (encoding not supported by the Page Designer Design page)</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10153" headers="N1007B "> <p>ISO-2022-JP</p>
 </th>

<td valign="top" headers="N10153 N1008D "> <p>ISO 2022, Japanese</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10173" headers="N1007B "> <p>ISO-2022-KR</p>
 </th>

<td valign="top" headers="N10173 N1008D "> <p>ISO 2022, Korean</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10193" headers="N1007B "> <p>ISO-8859-1</p>
 </th>

<td valign="top" headers="N10193 N1008D "> <p>ISO Latin-1</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N101B3" headers="N1007B ">ISO-8859-2</th>

<td valign="top" headers="N101B3 N1008D ">Central/East European (Slavic)</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N101C7" headers="N1007B ">ISO-8859-3</th>

<td valign="top" headers="N101C7 N1008D ">Southern European</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N101DB" headers="N1007B ">ISO-8859-4</th>

<td valign="top" headers="N101DB N1008D ">ISO 8859-4, Latin-4 (North European)</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N101EF" headers="N1007B ">ISO-8859-5</th>

<td valign="top" headers="N101EF N1008D ">ISO 8859-5, Cyrillic</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10203" headers="N1007B "> <p>ISO-8859-6</p>
 </th>

<td valign="top" headers="N10203 N1008D "> <p>Arabic (Logical)</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10223" headers="N1007B ">ISO-8859-7</th>

<td valign="top" headers="N10223 N1008D ">Greek</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10237" headers="N1007B "> <p>ISO-8859-8-I</p>
 </th>

<td valign="top" headers="N10237 N1008D "> <p>Hebrew (Logical)</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10257" headers="N1007B "> <p>ISO-8859-8</p>
 </th>

<td valign="top" headers="N10257 N1008D "> <p>Hebrew (Visual) (encoding supported, but not supported by the Page
Designer Design page)</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N10277" headers="N1007B ">ISO-8859-9</th>

<td valign="top" headers="N10277 N1008D ">Turkish</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1028B" headers="N1007B "> <p>SHIFT_JIS</p>
 </th>

<td valign="top" headers="N1028B N1008D "> <p>Shift-JIS, Japanese</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N102AB" headers="N1007B ">TIS-620</th>

<td valign="top" headers="N102AB N1008D ">TISI, Thai</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N102BF" headers="N1007B "> <p>US-ASCII</p>
 </th>

<td valign="top" headers="N102BF N1008D "> <p>US ASCII</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N102DF" headers="N1007B "> <p>UTF-8</p>
 </th>

<td valign="top" headers="N102DF N1008D "> <p>ISO 10646/Unicode, 8-bit variable-length encoding</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N102FF" headers="N1007B "> <p>UTF-16</p>
 </th>

<td valign="top" headers="N102FF N1008D "> <p>ISO 10646/Unicode, 16-bit variable-length encoding</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1031F" headers="N1007B "> <p>UTF-16BE</p>
 </th>

<td valign="top" headers="N1031F N1008D "> <p>Unicode BigEndian</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1033F" headers="N1007B "> <p>UTF-16LE</p>
 </th>

<td valign="top" headers="N1033F N1008D "> <p>Unicode LittleEndian</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1035F" headers="N1007B ">WINDOWS-874</th>

<td valign="top" headers="N1035F N1008D ">Thai, Microsoft<sup>®</sup></td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1037C" headers="N1007B "> <p>WINDOWS-1252</p>
 </th>

<td valign="top" headers="N1037C N1008D "> <p>Windows Latin-1 (Western European)</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N1039C" headers="N1007B "> <p>WINDOWS-1255</p>
 </th>

<td valign="top" headers="N1039C N1008D "> <p>Hebrew</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N103BC" headers="N1007B "> <p>WINDOWS-1256</p>
 </th>

<td valign="top" headers="N103BC N1008D "> <p>Arabic</p>
 </td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N103DC" headers="N1007B ">X-EUC-JP</th>

<td valign="top" headers="N103DC N1008D ">EUC encoding, Japanese (alias for EUC-JP)</td>

</tr>

<tr>
<th valign="top" class="firstcol" id="N103F0" headers="N1007B ">X-SJIS</th>

<td valign="top" headers="N103F0 N1008D ">Shift-JIS, Japanese (alias for SHIFT_JIS)</td>

</tr>

</tbody>

</table>
</div>

</div>

<div></div>

</body>
</html>