CINXE.COM
Web Encodings - WHATWG Wiki
<!DOCTYPE html> <html class="client-nojs" lang="en" dir="ltr"> <head> <meta charset="UTF-8"/> <title>Web Encodings - WHATWG Wiki</title> <script>document.documentElement.className="client-js";RLCONF={"wgBreakFrames":false,"wgSeparatorTransformTable":["",""],"wgDigitTransformTable":["",""],"wgDefaultDateFormat":"dmy","wgMonthNames":["","January","February","March","April","May","June","July","August","September","October","November","December"],"wgRequestId":"2dd9afb376a93b12b428e079","wgCSPNonce":false,"wgCanonicalNamespace":"","wgCanonicalSpecialPageName":false,"wgNamespaceNumber":0,"wgPageName":"Web_Encodings","wgTitle":"Web Encodings","wgCurRevisionId":8675,"wgRevisionId":8675,"wgArticleId":1849,"wgIsArticle":true,"wgIsRedirect":false,"wgAction":"view","wgUserName":null,"wgUserGroups":["*"],"wgCategories":["Obsolete documents","Obsolete specifications","Spec coordination","Registries"],"wgPageContentLanguage":"en","wgPageContentModel":"wikitext","wgRelevantPageName":"Web_Encodings","wgRelevantArticleId":1849,"wgIsProbablyEditable":false,"wgRelevantPageIsProbablyEditable":false,"wgRestrictionEdit":[],"wgRestrictionMove":[], "wgVector2022PreviewPages":[]};RLSTATE={"ext.gadget.WatchlistChangesBold":"ready","ext.gadget.widensearch":"ready","site.styles":"ready","user.styles":"ready","user":"ready","user.options":"loading","skins.vector.styles.legacy":"ready"};RLPAGEMODULES=["site","mediawiki.page.ready","mediawiki.toc","skins.vector.legacy.js","ext.gadget.exlinks","ext.gadget.charinsert","ext.gadget.edittop","ext.gadget.PrettyLog"];</script> <script>(RLQ=window.RLQ||[]).push(function(){mw.loader.implement("user.options@12s5i",function($,jQuery,require,module){mw.user.tokens.set({"patrolToken":"+\\","watchToken":"+\\","csrfToken":"+\\"});});});</script> <link rel="stylesheet" href="/load.php?lang=en&modules=skins.vector.styles.legacy&only=styles&skin=vector"/> <script async="" src="/load.php?lang=en&modules=startup&only=scripts&raw=1&skin=vector"></script> <meta 
name="ResourceLoaderDynamicStyles" content=""/> <link rel="stylesheet" href="/load.php?lang=en&modules=ext.gadget.WatchlistChangesBold%2Cwidensearch&only=styles&skin=vector"/> <link rel="stylesheet" href="/load.php?lang=en&modules=site.styles&only=styles&skin=vector"/> <meta name="generator" content="MediaWiki 1.39.3"/> <meta name="format-detection" content="telephone=no"/> <meta name="viewport" content="width=1000"/> <link rel="apple-touch-icon" href="https://resources.whatwg.org/logo.png"/> <link rel="icon" href="https://resources.whatwg.org/logo.svg"/> <link rel="search" type="application/opensearchdescription+xml" href="/opensearch_desc.php" title="WHATWG Wiki (en)"/> <link rel="EditURI" type="application/rsd+xml" href="https://wiki.whatwg.org/api.php?action=rsd"/> <link rel="license" href="/wiki/WHATWG_Wiki:Copyrights"/> <link rel="alternate" type="application/atom+xml" title="WHATWG Wiki Atom feed" href="/index.php?title=Special:RecentChanges&feed=atom"/> </head> <body class="mediawiki ltr sitedir-ltr mw-hide-empty-elt ns-0 ns-subject page-Web_Encodings rootpage-Web_Encodings skin-vector action-view skin-vector-legacy vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-language-alert-in-sidebar-disabled vector-feature-sticky-header-disabled vector-feature-sticky-header-edit-disabled vector-feature-table-of-contents-disabled vector-feature-visual-enhancement-next-disabled"><div id="mw-page-base" class="noprint"></div> <div id="mw-head-base" class="noprint"></div> <div id="content" class="mw-body" role="main"> <a id="top"></a> <div id="siteNotice"><div id="localNotice"><div class="anonnotice" lang="en" dir="ltr"><div id="anonNotice"> <div style="margin: 0.5em auto; border: 1px solid #333333; background-color: #EEEEEE; padding: 0.5em; font-size: larger; text-align: center;"> <p>A user account is required in order to edit this wiki, but we've had to disable public user registrations due to spam. 
</p><p>To request an account, ask an autoconfirmed user on <a rel="nofollow" class="external text" href="https://whatwg.org/chat">Chat</a> (such as one of <span class="plainlinks"><a rel="nofollow" class="external text" href="https://wiki.whatwg.org/index.php?title=Special:ListUsers&group=autoconfirmed">these permanent autoconfirmed members</a></span>). </p> </div> </div></div></div></div> <div class="mw-indicators"> </div> <h1 id="firstHeading" class="firstHeading mw-first-heading"><span class="mw-page-title-main">Web Encodings</span></h1> <div id="bodyContent" class="vector-body"> <div id="siteSub" class="noprint">From WHATWG Wiki</div> <div id="contentSub"></div> <div id="contentSub2"></div> <div id="jump-to-nav"></div> <a class="mw-jump-link" href="#mw-head">Jump to navigation</a> <a class="mw-jump-link" href="#searchInput">Jump to search</a> <div id="mw-content-text" class="mw-body-content mw-content-ltr" lang="en" dir="ltr"><div class="mw-parser-output"><div style="background-color: pink; color: maroon; border: 1px solid maroon; padding: 0.5em; text-align: center;"> <p style="font-size: larger;">This document is obsolete.</p><p>For the current specification, see: <a rel="nofollow" class="external text" href="http://encoding.spec.whatwg.org/">Encoding Standard</a></p> </div> <p><br /> </p> <div id="toc" class="toc" role="navigation" aria-labelledby="mw-toc-heading"><input type="checkbox" role="button" id="toctogglecheckbox" class="toctogglecheckbox" style="display:none" /><div class="toctitle" lang="en" dir="ltr"><h2 id="mw-toc-heading">Contents</h2><span class="toctogglespan"><label class="toctogglelabel" for="toctogglecheckbox"></label></span></div> <ul> <li class="toclevel-1 tocsection-1"><a href="#Goals"><span class="tocnumber">1</span> <span class="toctext">Goals</span></a></li> <li class="toclevel-1 tocsection-2"><a href="#Current_Implementations"><span class="tocnumber">2</span> <span class="toctext">Current Implementations</span></a> <ul> <li 
class="toclevel-2 tocsection-3"><a href="#Data"><span class="tocnumber">2.1</span> <span class="toctext">Data</span></a></li> <li class="toclevel-2 tocsection-4"><a href="#Opera"><span class="tocnumber">2.2</span> <span class="toctext">Opera</span></a> <ul> <li class="toclevel-3 tocsection-5"><a href="#Matching"><span class="tocnumber">2.2.1</span> <span class="toctext">Matching</span></a></li> <li class="toclevel-3 tocsection-6"><a href="#Encodings"><span class="tocnumber">2.2.2</span> <span class="toctext">Encodings</span></a></li> </ul> </li> <li class="toclevel-2 tocsection-7"><a href="#Firefox"><span class="tocnumber">2.3</span> <span class="toctext">Firefox</span></a> <ul> <li class="toclevel-3 tocsection-8"><a href="#Matching_2"><span class="tocnumber">2.3.1</span> <span class="toctext">Matching</span></a></li> <li class="toclevel-3 tocsection-9"><a href="#Encodings_2"><span class="tocnumber">2.3.2</span> <span class="toctext">Encodings</span></a></li> </ul> </li> <li class="toclevel-2 tocsection-10"><a href="#Internet_Explorer"><span class="tocnumber">2.4</span> <span class="toctext">Internet Explorer</span></a> <ul> <li class="toclevel-3 tocsection-11"><a href="#Matching_3"><span class="tocnumber">2.4.1</span> <span class="toctext">Matching</span></a></li> <li class="toclevel-3 tocsection-12"><a href="#Encodings_3"><span class="tocnumber">2.4.2</span> <span class="toctext">Encodings</span></a></li> <li class="toclevel-3 tocsection-13"><a href="#Data_2"><span class="tocnumber">2.4.3</span> <span class="toctext">Data</span></a></li> </ul> </li> <li class="toclevel-2 tocsection-14"><a href="#Safari"><span class="tocnumber">2.5</span> <span class="toctext">Safari</span></a> <ul> <li class="toclevel-3 tocsection-15"><a href="#Matching_4"><span class="tocnumber">2.5.1</span> <span class="toctext">Matching</span></a></li> <li class="toclevel-3 tocsection-16"><a href="#Encodings_4"><span class="tocnumber">2.5.2</span> <span 
class="toctext">Encodings</span></a></li> <li class="toclevel-3 tocsection-17"><a href="#Data_3"><span class="tocnumber">2.5.3</span> <span class="toctext">Data</span></a></li> </ul> </li> <li class="toclevel-2 tocsection-18"><a href="#Chrome"><span class="tocnumber">2.6</span> <span class="toctext">Chrome</span></a></li> </ul> </li> <li class="toclevel-1 tocsection-19"><a href="#Thoughts"><span class="tocnumber">3</span> <span class="toctext">Thoughts</span></a> <ul> <li class="toclevel-2 tocsection-20"><a href="#Anne"><span class="tocnumber">3.1</span> <span class="toctext">Anne</span></a></li> <li class="toclevel-2 tocsection-21"><a href="#E-mails"><span class="tocnumber">3.2</span> <span class="toctext">E-mails</span></a></li> <li class="toclevel-2 tocsection-22"><a href="#Spec_notes"><span class="tocnumber">3.3</span> <span class="toctext">Spec notes</span></a></li> <li class="toclevel-2 tocsection-23"><a href="#ICU_in_Chrome_and_Safari"><span class="tocnumber">3.4</span> <span class="toctext">ICU in Chrome and Safari</span></a></li> </ul> </li> <li class="toclevel-1 tocsection-24"><a href="#Misc."><span class="tocnumber">4</span> <span class="toctext">Misc.</span></a></li> </ul> </div> <h2><span class="mw-headline" id="Goals">Goals</span></h2> <ul><li>Document existing practices by describing for each browser <ul><li>The list of supported encodings.</li> <li>The list of supported labels for those encodings.</li> <li>The matching algorithm for labels.</li></ul></li> <li>Converge the various used algorithms by <ul><li>Defining a list of encodings everyone has to support. Browsers must not support more encodings than on that list.</li> <li>Defining a list of supported labels for those encodings. Browsers must not support more labels than on that list.</li> <li>Defining the matching algorithm. 
(HTML5 has been updated with a better one now.)</li></ul></li> <li>Get the new rules implemented</li></ul> <p>Documenting more exactly the encoding (Unicode stream + encoding -&gt; byte stream) and decoding (byte stream + encoding -&gt; Unicode stream) algorithms for each encoding and getting that implemented interoperably would also be great. </p> <h2><span class="mw-headline" id="Current_Implementations">Current Implementations</span></h2> <p>Does this differ per platform? Opera might differ a bit on Mac. </p> <h3><span class="mw-headline" id="Data">Data</span></h3> <p>Integrate this awesome data somehow: </p> <ul><li><a rel="nofollow" class="external free" href="http://coq.no/character-tables/mime/en">http://coq.no/character-tables/mime/en</a></li> <li><a rel="nofollow" class="external free" href="http://coq.no/character-tables/mime/iso-2022/en">http://coq.no/character-tables/mime/iso-2022/en</a></li> <li><a rel="nofollow" class="external free" href="http://coq.no/character-tables/mime/euc/en">http://coq.no/character-tables/mime/euc/en</a></li> <li><a rel="nofollow" class="external free" href="http://coq.no/character-tables/mime/locale-specific/en">http://coq.no/character-tables/mime/locale-specific/en</a></li></ul> <h3><span class="mw-headline" id="Opera">Opera</span></h3> <h4><span class="mw-headline" id="Matching">Matching</span></h4> <p>Uses UTS22 matching and strips leading x characters. (That is the behaviour for now; the plan is to switch in the future to stripping leading and trailing whitespace and then matching ASCII case-insensitively.) 
</p> <h4><span class="mw-headline" id="Encodings">Encodings</span></h4> <table border="1" cellpadding="4" cellspacing="0"> <tbody><tr> <th colspan="2">Encoding </th> <th>Labels </th> <th>Decoded As </th> <th>Notes </th></tr> <tr> <td style="text-align:center">7-bit </td> <td>us-ascii </td> <td>ansix341968, ansix341986, ascii, cp367, csascii, csinvariant, csiso646basic1983, ibm367, invariant, iso646basic1983, iso646irv1991, iso646us, isoir6, ref, us, usascii </td> <td>windows-1252 </td> <td> </td></tr> <tr> <td style="text-align:center">DOS </td> <td>ibm866 </td> <td>866, cp866, csibm866, ibm866 </td> <td> </td> <td> </td></tr> <tr> <td rowspan="16" style="text-align:center">ISO </td> <td>iso-8859-1 </td> <td>cp819, csisolatin1, ibm819, iso88591, iso885911987, isoir100, l1, latin1 </td> <td>windows-1252 </td> <td> </td></tr> <tr> <td>iso-8859-2 </td> <td>csisolatin2, iso88592, iso885921987, isoir101, l2, latin2 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-3 </td> <td>csisolatin3, iso88593, iso885931988, isoir109, l3, latin3 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-4 </td> <td>csisolatin4, iso88594, iso885941988, isoir110, l4, latin4 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-5 </td> <td>csisolatincyrillic, cyrillic, iso88595, iso885951988, isoir144 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-6 </td> <td>arabic, asmo708, csiso88596e, csisolatinarabic, ecma114, iso88596, iso885961987, iso88596e, isoir127 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-6-i </td> <td>csiso88596i, iso88596i </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-7 </td> <td>csisolatingreek, ecma118, elot928, greek, greek8, iso88597, iso885971987, isoir126 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-8 </td> <td>csiso88598e, csisolatinhebrew, hebrew, iso88598, iso885981988, iso88598e, isoir138, visual </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-8-i </td> <td>csiso88598i, iso88598i </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-9 </td> 
<td>csisolatin5, iso88599, iso885991989, isoir148, l5, latin5 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-10 </td> <td>csisolatin6, iso885910, iso8859101992, isoir157, l6, latin6 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-13 </td> <td>iso885913 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-14 </td> <td>iso885914, iso8859141998, isoceltic, isoir199, l8, latin8 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-15 </td> <td>iso885915, latin9 </td> <td> </td> <td> </td></tr> <tr> <td>iso-8859-16 </td> <td>iso885916, iso8859162001, isoir226, l10, latin10 </td> <td> </td> <td> </td></tr> <tr> <td rowspan="11" style="text-align:center">Win </td> <td>iso-8859-11 </td> <td>iso885911, tis620, tis6202533, windows874 </td> <td> </td> <td>Actually implemented as windows-874 </td></tr> <tr> <td>windows-1250 </td> <td>cp1250, microsoftcp1250, windows1250 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1251 </td> <td>cp1251, microsoftcp1251, windows1251 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1252 </td> <td>cp1252, microsoftcp1252, windows1252 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1253 </td> <td>cp1253, microsoftcp1253, windows1253 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1254 </td> <td>cp1254, microsoftcp1254, windows1254 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1255 </td> <td>cp1255, microsoftcp1255, windows1255 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1256 </td> <td>cp1256, microsoftcp1256, windows1256 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1257 </td> <td>cp1257, microsoftcp1257, windows1257 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1258 </td> <td>cp1258, microsoftcp1258, windows1258 </td> <td> </td> <td> </td></tr> <tr> <td>windows-sami-2 </td> <td>samiws2, windowssami2, ws2 </td> <td> </td> <td> </td></tr> <tr> <td rowspan="5" style="text-align:center">Mac </td> <td>macintosh </td> <td>csmacintosh, mac, macintosh, macroman </td> <td> </td> <td>Likely disabled. 
</td></tr> <tr> <td>x-mac-ce </td> <td>macce </td> <td> </td> <td>Likely disabled. </td></tr> <tr> <td>x-mac-cyrillic </td> <td>maccyrillic </td> <td> </td> <td>Likely disabled. </td></tr> <tr> <td>x-mac-greek </td> <td>macgreek </td> <td> </td> <td>Likely disabled. </td></tr> <tr> <td>x-mac-turkish </td> <td>macturkish </td> <td> </td> <td>Likely disabled. </td></tr> <tr> <td rowspan="5" style="text-align:center">Misc. </td> <td>koi8-r </td> <td>cskoi8r, koi8r </td> <td> </td> <td> </td></tr> <tr> <td>koi8-u </td> <td>koi8u </td> <td> </td> <td> </td></tr> <tr> <td>tcvn </td> <td>tcvn, viettcvn </td> <td> </td> <td> </td></tr> <tr> <td>viscii </td> <td>csviscii, viscii </td> <td> </td> <td> </td></tr> <tr> <td>x-vps </td> <td>vps </td> <td> </td> <td> </td></tr> <tr> <td rowspan="13" style="font-size:200%; line-height:100%; text-align:center">中<br />日<br />韓 </td> <td>big5 </td> <td>big5, cnbig5, csbig5 </td> <td> </td> <td> </td></tr> <tr> <td>big5-hkscs </td> <td>big5hkscs </td> <td> </td> <td> </td></tr> <tr> <td>euc-jp </td> <td>cseucpkdfmtjapanese, eucjp, extendedunixcodepackedformatforjapanese </td> <td> </td> <td> </td></tr> <tr> <td>euc-kr </td> <td>cseuckr, csksc56011987, euckr, isoir149, korean, ksc5601, ksc56011987, ksc56011989, windows949 </td> <td> </td> <td> </td></tr> <tr> <td>euc-tw </td> <td>euctw </td> <td> </td> <td> </td></tr> <tr> <td>gb18030 </td> <td>gb18030 </td> <td> </td> <td> </td></tr> <tr> <td>gbk </td> <td>chinese, cngb, cp936, csgb2312, csiso58gb231280, euccn, gb2312, gb231280, gbk, isoir58, ms936, windows936 </td> <td> </td> <td> </td></tr> <tr> <td>hz-gb-2312 </td> <td>hzgb2312 </td> <td> </td> <td> </td></tr> <tr> <td>iso-2022-cn </td> <td>iso2022cn </td> <td> </td> <td> </td></tr> <tr> <td>iso-2022-jp </td> <td>csiso2022jp, iso2022jp </td> <td> </td> <td> </td></tr> <tr> <td>iso-2022-jp-1 </td> <td>iso2022jp1 </td> <td> </td> <td> </td></tr> <tr> <td>iso-2022-kr </td> <td>csiso2022kr, iso2022kr </td> <td> </td> <td> </td></tr> 
<tr> <td>shift_jis </td> <td>cp932, csshiftjis, cswindows31j, ms932, mskanji, shiftjis, sjis, windows31j </td> <td> </td> <td> </td></tr> <tr> <td rowspan="4" style="font-size:200%; text-align:center">� </td> <td>utf-16 </td> <td>csunicode, csunicode11, csunicodeascii, iso10646j1, iso10646ucs2, iso10646ucsbasic, utf16 </td> <td> </td> <td> </td></tr> <tr> <td>utf-16be </td> <td>utf16be </td> <td> </td> <td> </td></tr> <tr> <td>utf-16le </td> <td>utf16le </td> <td> </td> <td> </td></tr> <tr> <td>utf-8 </td> <td>utf8 </td> <td> </td> <td> </td></tr></tbody></table> <h3><span class="mw-headline" id="Firefox">Firefox</span></h3> <h4><span class="mw-headline" id="Matching_2">Matching</span></h4> <p>ASCII lowercasing. </p> <h4><span class="mw-headline" id="Encodings_2">Encodings</span></h4> <p>See <a rel="nofollow" class="external free" href="https://wiki.mozilla.org/I18n:Charset_Aliases">https://wiki.mozilla.org/I18n:Charset_Aliases</a> </p> <table class="wikitable"> <tbody><tr> <th colspan="2">Encoding </th> <th>Labels </th> <th>Decoded As </th> <th>Notes </th></tr> <tr> <td style="text-align:center">7-bit </td> <td>us-ascii </td> <td>646, ansi_x3.4-1968, ascii, us-ascii </td> <td>windows-1252 </td> <td> </td></tr> <tr> <td rowspan="8" style="text-align:center">DOS </td> <td>IBM850 </td> <td>850, cp850, csIBM850, ibm850 </td> <td> </td> <td>csIBM850 not recognised. </td></tr> <tr> <td>IBM852 </td> <td>852, cp852, csIBM852, ibm852 </td> <td> </td> <td>csIBM852 not recognised. </td></tr> <tr> <td>IBM855 </td> <td>855, cp855, csIBM855, ibm855 </td> <td> </td> <td>csIBM855 not recognised. </td></tr> <tr> <td>IBM857 </td> <td>857, cp857, csIBM857, ibm857 </td> <td> </td> <td>csIBM857 not recognised. </td></tr> <tr> <td>IBM862 </td> <td>862, cp862, csIBM862, ibm862 </td> <td> </td> <td>csIBM862 not recognised. </td></tr> <tr> <td>IBM864 </td> <td>864, cp864, csIBM864, ibm-864, ibm864 </td> <td> </td> <td>csIBM864 not recognised. 
</td></tr> <tr> <td>IBM864i </td> <td>864i, cp864i, csibm864i, ibm-864i, ibm864i </td> <td> </td> <td> </td></tr> <tr> <td>IBM866 </td> <td>866, cp-866, cp866, csIBM866, ibm866 </td> <td> </td> <td>csIBM866 not recognised. </td></tr> <tr> <td rowspan="19" style="text-align:center">ISO </td> <td>ISO-8859-1 </td> <td>cp819, csisolatin1, ibm819, iso-8859-1, iso-ir-100, iso8859-1, iso88591, iso_8859-1, l1, latin1 </td> <td>windows-1252 </td> <td> </td></tr> <tr> <td>ISO-8859-2 </td> <td>csisolatin2, iso-8859-2, iso-ir-101, iso8859-2, iso88592, iso_8859-2, l2, latin2 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-3 </td> <td>csisolatin3, iso-8859-3, iso-ir-109, iso8859-3, iso88593, iso_8859-3, l3, latin3 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-4 </td> <td>csisolatin4, iso-8859-4, iso-ir-110, iso8859-4, iso88594, iso_8859-4, l4, latin4 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-5 </td> <td>csisolatincyrillic, cyrillic, iso-8859-5, iso-ir-144, iso8859-5, iso88595, iso_8859-5 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-6 </td> <td>arabic, asmo-708, csisolatinarabic, ecma-114, iso-8859-6, iso-ir-127, iso8859-6, iso88596, iso_8859-6 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-6-E </td> <td>csiso88596e, iso-8859-6-e </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-6-I </td> <td>csiso88596i, iso-8859-6-i </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-7 </td> <td>csisolatingreek, ecma-118, elot_928, greek, greek8, iso-8859-7, iso-ir-126, iso8859-7, iso88597, iso_8859-7, sun_eu_greek </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-8 </td> <td>csisolatinhebrew, hebrew, iso-8859-8, iso-ir-138, iso8859-8, iso88598, iso_8859-8, visual </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-8-E </td> <td>csiso88598e, iso-8859-8-e </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-8-I </td> <td>csiso88598i, iso-8859-8-i, iso-8859-8i </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-9 </td> <td>csisolatin5, iso-8859-9, iso-ir-148, iso8859-9, 
iso88599, iso_8859-9, l5, latin5 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-10 </td> <td>csisolatin6, iso-8859-10, iso-ir-157, iso8859-10, iso885910, l6, latin6 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-11 </td> <td>iso-8859-11, iso8859-11, iso885911 </td> <td>windows-874 </td> <td> </td></tr> <tr> <td>ISO-8859-13 </td> <td>iso-8859-13, iso8859-13, iso885913 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-14 </td> <td>iso-8859-14, iso8859-14, iso885914 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-15 </td> <td>iso-8859-15, iso8859-15, iso885915, iso_8859-15 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-8859-16 </td> <td>iso-8859-16 </td> <td> </td> <td> </td></tr> <tr> <td rowspan="10" style="text-align:center">Win </td> <td>windows-874 </td> <td>ibm874, windows-874 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1250 </td> <td>cp1250, windows-1250, x-cp1250 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1251 </td> <td>ansi-1251, cp1251, windows-1251, x-cp1251 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1252 </td> <td>cp1252, windows-1252, x-cp1252 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1253 </td> <td>cp1253, windows-1253, x-cp1253 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1254 </td> <td>cp1254, windows-1254, x-cp1254 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1255 </td> <td>cp1255, windows-1255, x-cp1255 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1256 </td> <td>cp1256, windows-1256, x-cp1256 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1257 </td> <td>cp1257, windows-1257, x-cp1257 </td> <td> </td> <td> </td></tr> <tr> <td>windows-1258 </td> <td>cp1258, windows-1258, x-cp1258 </td> <td> </td> <td> </td></tr> <tr> <td rowspan="15" style="text-align:center">Mac </td> <td>x-mac-arabic </td> <td>x-mac-arabic </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-ce </td> <td>x-mac-ce </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-croatian </td> <td>x-mac-croatian </td> <td> </td> <td> </td></tr> <tr> 
<td>x-mac-cyrillic </td> <td>x-mac-cyrillic </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-devanagari </td> <td>x-mac-devanagari </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-farsi </td> <td>x-mac-farsi </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-greek </td> <td>x-mac-greek </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-gujarati </td> <td>x-mac-gujarati </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-gurmukhi </td> <td>x-mac-gurmukhi </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-hebrew </td> <td>x-mac-hebrew </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-icelandic </td> <td>x-mac-icelandic </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-roman </td> <td>csMacintosh, mac, macintosh, x-mac-roman </td> <td> </td> <td>csMacintosh not recognised. </td></tr> <tr> <td>x-mac-romanian </td> <td>x-mac-romanian </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-turkish </td> <td>x-mac-turkish </td> <td> </td> <td> </td></tr> <tr> <td>x-mac-ukrainian </td> <td>x-mac-ukrainian </td> <td> </td> <td> </td></tr> <tr> <td rowspan="11" style="text-align:center">Misc. </td> <td>armscii-8 </td> <td>armscii-8 </td> <td> </td> <td> </td></tr> <tr> <td>GEOSTD8 </td> <td>geostd8 </td> <td> </td> <td>Does not seem to work. 
</td></tr> <tr> <td>ISO-IR-111 </td> <td>csiso111ecmacyrillic, ecma-cyrillic, iso-ir-111 </td> <td> </td> <td> </td></tr> <tr> <td>KOI8-R </td> <td>koi8-r </td> <td> </td> <td> </td></tr> <tr> <td>KOI8-U </td> <td>koi8-u </td> <td> </td> <td> </td></tr> <tr> <td>T.61-8bit </td> <td>csiso103t618bit, iso-ir-103, t.61, t.61-8bit </td> <td> </td> <td> </td></tr> <tr> <td>TIS-620 </td> <td>tis-620, tis620 </td> <td>windows-874 </td> <td> </td></tr> <tr> <td>VISCII </td> <td>csviscii, viscii </td> <td> </td> <td> </td></tr> <tr> <td>x-user-defined </td> <td>x-user-defined </td> <td> </td> <td> </td></tr> <tr> <td>x-viet-tcvn5712 </td> <td>x-viet-tcvn5712 </td> <td> </td> <td> </td></tr> <tr> <td>x-viet-vps </td> <td>x-viet-vps </td> <td> </td> <td> </td></tr> <tr> <td rowspan="16" style="font-size:200%; line-height:100%; text-align:center">中<br />日<br />韓 </td> <td>Big5 </td> <td>big5, csbig5, x-x-big5, zh_tw-big5 </td> <td> </td> <td> </td></tr> <tr> <td>Big5-HKSCS </td> <td>big5-hkscs </td> <td> </td> <td> </td></tr> <tr> <td>EUC-JP </td> <td>cseucpkdfmtjapanese, euc-jp, x-euc-jp </td> <td> </td> <td> </td></tr> <tr> <td>EUC-KR </td> <td>5601, csksc56011987, cseuckr, euc-kr, iso-ir-149, korean, ks_c_5601-1989, ksc5601, ksc_5601 </td> <td>x-windows-949 </td> <td>This converter is asymmetric. In the ToUnicode direction, it is generous and acts as Windows-949. It also supports 8-byte sequences for 8,822 Hangul syllables not encoded as precomposed forms in KS X 1001. In the FromUnicode direction, it is strict and generates 8-byte sequences for those 8,822 Hangul syllables instead of 2-byte sequences in windows-949. 
</td></tr> <tr> <td>gb18030 </td> <td>gb18030 </td> <td> </td> <td> </td></tr> <tr> <td>GB2312 </td> <td>chinese, csgb2312, csiso58gb231280, gb2312, gb_2312, gb_2312-80, iso-ir-58, zh_cn.euc </td> <td>x-gbk </td> <td> </td></tr> <tr> <td>HZ-GB-2312 </td> <td>hz-gb-2312 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-2022-CN </td> <td>iso-2022-cn, iso-2022-cn-ext </td> <td> </td> <td> </td></tr> <tr> <td>ISO-2022-JP </td> <td>csiso2022jp, csiso2022jp2, iso-2022-jp, iso-2022-jp-2 </td> <td> </td> <td> </td></tr> <tr> <td>ISO-2022-KR </td> <td>csiso2022kr, iso-2022-kr </td> <td> </td> <td> </td></tr> <tr> <td>Shift_JIS </td> <td>csshiftjis, ms_kanji, shift-jis, shift_jis, windows-31j, x-sjis </td> <td> </td> <td> </td></tr> <tr> <td>windows-936 </td> <td>windows-936 </td> <td> </td> <td> </td></tr> <tr> <td>x-euc-tw </td> <td>cns11643, x-euc-tw, zh_tw-euc </td> <td> </td> <td> </td></tr> <tr> <td>x-gbk </td> <td>gbk, x-gbk </td> <td> </td> <td> </td></tr> <tr> <td>x-johab </td> <td>x-johab </td> <td> </td> <td> </td></tr> <tr> <td>x-windows-949 </td> <td>ks_c_5601-1987, x-windows-949 </td> <td> </td> <td> </td></tr> <tr> <td rowspan="9" style="font-size:200%; text-align:center">� </td> <td>UTF-16 </td> <td>utf-16 </td> <td> </td> <td>Recognized as BE or LE by BOM or byte sniffing </td></tr> <tr> <td>UTF-16BE </td> <td>csunicode, csunicode11, csunicodeascii, csunicodelatin1, iso-10646, iso-10646-j-1, iso-10646-ucs-2, iso-10646-ucs-basic, iso-10646-unicode-latin1, utf-16be, x-iso-10646-ucs-2-be </td> <td> </td> <td> </td></tr> <tr> <td>UTF-16LE </td> <td>utf-16le, x-iso-10646-ucs-2-le </td> <td> </td> <td> </td></tr> <tr> <td>UTF-32 </td> <td>utf-32 </td> <td> </td> <td>Recognized as BE or LE by BOM or byte sniffing </td></tr> <tr> <td>UTF-32BE </td> <td>iso-10646-ucs-4, utf-32be, x-iso-10646-ucs-4-be </td> <td> </td> <td> </td></tr> <tr> <td>UTF-32LE </td> <td>utf-32le, x-iso-10646-ucs-4-le </td> <td> </td> <td> </td></tr> <tr> <td>UTF-7 </td> <td>csunicode11utf7, 
unicode-1-1-utf-7, unicode-2-0-utf-7, utf-7, x-unicode-2-0-utf-7 </td> <td> </td> <td> </td></tr> <tr> <td>UTF-8 </td> <td>unicode-1-1-utf-8, utf-8, utf8 </td> <td> </td> <td> </td></tr> <tr> <td>x-imap4-modified-utf7 </td> <td>x-imap4-modified-utf7 </td> <td> </td> <td> </td></tr></tbody></table> <p>Table generated from &lt;<a rel="nofollow" class="external free" href="http://mxr.mozilla.org/mozilla1.9.1/source/intl/uconv/src/charsetalias.properties">http://mxr.mozilla.org/mozilla1.9.1/source/intl/uconv/src/charsetalias.properties</a>&gt; (corresponds to Firefox 3.5.2). </p><p>Aliases (used for parsing, apparently not for serialisation) are scattered around in a large number of files; cf. &lt;<a rel="nofollow" class="external free" href="http://mxr.mozilla.org/firefox/source/intl/uconv/ucvlatin/nsISO885911ToUnicode.cpp">http://mxr.mozilla.org/firefox/source/intl/uconv/ucvlatin/nsISO885911ToUnicode.cpp</a>&gt; for the mapping from ISO-8859-11 to windows-874. </p><p>8-bit encodings (excluding UTFs, CJK encodings and T.61) were tested using &lt;<a rel="nofollow" class="external free" href="http://coq.no/X/charset5/tests8bit.html">http://coq.no/X/charset5/tests8bit.html</a>&gt; (fail/pass should not be taken too seriously yet, especially not for more obscure encodings), Firefox version 3.5.1, OS X. </p><p><b>Bugs:</b> Filed &lt;<a rel="nofollow" class="external free" href="https://bugzilla.mozilla.org/show_bug.cgi?id=512060">https://bugzilla.mozilla.org/show_bug.cgi?id=512060</a>&gt; for the labels marked 'not recognised' in the table above since the lack of support for these is clearly accidental rather than deliberate (though it seems to suggest that these particular labels are not particularly widely used). In most other cases, research and deliberation will be needed to distinguish between bugs and features. 
</p> <h3><span class="mw-headline" id="Internet_Explorer">Internet Explorer</span></h3> <h4><span class="mw-headline" id="Matching_3">Matching</span></h4> <p>Strips leading and trailing whitespace and then does ASCII(?) case-insensitive matching. (Matches HTML5.) </p> <h4><span class="mw-headline" id="Encodings_3">Encodings</span></h4> <table border="1" cellpadding="4" cellspacing="0"> <tbody><tr> <th colspan="2">Encoding </th> <th>Labels </th> <th>Decoded As </th> <th>Notes </th></tr> <tr> <td rowspan="5" style="text-align:center">7-bit </td> <td>us-ascii </td> <td>ansi_x3.4-1968, ansi_x3.4-1986, ascii, cp367, csascii, ibm367, iso-ir-6, iso646-us, iso_646.irv:1991, us, us-ascii </td> <td> </td> <td>(code page: 20127) </td></tr> <tr> <td>x-ia5 </td> <td>irv, x-ia5 </td> <td> </td> <td>(code page: 20105) Most significant bit ignored. </td></tr> <tr> <td>x-ia5-german </td> <td>din_66003, german, x-ia5-german </td> <td> </td> <td>(code page: 20106) Most significant bit ignored. </td></tr> <tr> <td>x-ia5-norwegian </td> <td>norwegian, ns_4551-1, x-ia5-norwegian </td> <td> </td> <td>(code page: 20108) Most significant bit ignored. Actually decoded as NS 4551-2, not NS 4551-1. </td></tr> <tr> <td>x-ia5-swedish </td> <td>sen_850200_b, swedish, x-ia5-swedish </td> <td> </td> <td>(code page: 20107) Most significant bit ignored. Actually decoded as SEN 85 02 00 Annex C, not SEN 85 02 00 Annex B. 
</td></tr> <tr> <td rowspan="17" style="text-align:center">DOS </td> <td>cp866 </td> <td>cp866, ibm866 </td> <td> </td> <td>(code page: 866) </td></tr> <tr> <td>dos-720 </td> <td>dos-720 </td> <td> </td> <td>(code page: 720) </td></tr> <tr> <td>dos-862 </td> <td>cp862, dos-862, ibm862 </td> <td> </td> <td>(code page: 862) </td></tr> <tr> <td>ibm00858 </td> <td>ccsid00858, cp00858, cp858, ibm00858, pc-multilingual-850+euro </td> <td> </td> <td>(code page: 858) </td></tr> <tr> <td>ibm437 </td> <td>437, cp437, cspc8codepage437, ibm437 </td> <td> </td> <td>(code page: 437) </td></tr> <tr> <td>ibm737 </td> <td>ibm737 </td> <td> </td> <td>(code page: 737) </td></tr> <tr> <td>ibm775 </td> <td>ibm775 </td> <td> </td> <td>(code page: 775) </td></tr> <tr> <td>ibm850 </td> <td>cp850, ibm850 </td> <td> </td> <td>(code page: 850) </td></tr> <tr> <td>ibm852 </td> <td>cp852, ibm852 </td> <td> </td> <td>(code page: 852) </td></tr> <tr> <td>ibm855 </td> <td>cp855, ibm855 </td> <td> </td> <td>(code page: 855) </td></tr> <tr> <td>ibm857 </td> <td>cp857, ibm857 </td> <td> </td> <td>(code page: 857) </td></tr> <tr> <td>ibm860 </td> <td>cp860, ibm860 </td> <td> </td> <td>(code page: 860) </td></tr> <tr> <td>ibm861 </td> <td>cp861, ibm861 </td> <td> </td> <td>(code page: 861) </td></tr> <tr> <td>ibm863 </td> <td>cp863, ibm863 </td> <td> </td> <td>(code page: 863) </td></tr> <tr> <td>ibm864 </td> <td>cp864, ibm864 </td> <td> </td> <td>(code page: 864) </td></tr> <tr> <td>ibm865 </td> <td>cp865, ibm865 </td> <td> </td> <td>(code page: 865) </td></tr> <tr> <td>ibm869 </td> <td>cp869, ibm869 </td> <td> </td> <td>(code page: 869) </td></tr> <tr> <td rowspan="12" style="text-align:center">ISO </td> <td>iso-8859-1 </td> <td>cp819, csisolatin1, ibm819, iso-8859-1, iso-ir-100, iso8859-1, iso_8859-1, iso_8859-1:1987, l1, latin1 </td> <td>windows-1252 </td> <td>(code page: 28591) </td></tr> <tr> <td>iso-8859-2 </td> <td>csisolatin2, iso-8859-2, iso-ir-101, iso8859-2, iso_8859-2, iso_8859-2:1987, 
l2, latin2 </td> <td> </td> <td>(code page: 28592) </td></tr> <tr> <td>iso-8859-3 </td> <td>csisolatin3, iso-8859-3, iso-ir-109, iso_8859-3, iso_8859-3:1988, l3, latin3 </td> <td> </td> <td>(code page: 28593) </td></tr> <tr> <td>iso-8859-4 </td> <td>csisolatin4, iso-8859-4, iso-ir-110, iso_8859-4, iso_8859-4:1988, l4, latin4 </td> <td> </td> <td>(code page: 28594) </td></tr> <tr> <td>iso-8859-5 </td> <td>csisolatincyrillic, cyrillic, iso-8859-5, iso-ir-144, iso_8859-5, iso_8859-5:1988 </td> <td> </td> <td>(code page: 28595) </td></tr> <tr> <td>iso-8859-6 </td> <td>arabic, csisolatinarabic, ecma-114, iso-8859-6, iso-ir-127, iso_8859-6, iso_8859-6:1987 </td> <td> </td> <td>(code page: 28596) </td></tr> <tr> <td>iso-8859-7 </td> <td>csisolatingreek, ecma-118, elot_928, greek, greek8, iso-8859-7, iso-ir-126, iso_8859-7, iso_8859-7:1987 </td> <td> </td> <td>(code page: 28597) </td></tr> <tr> <td>iso-8859-8 </td> <td>csisolatinhebrew, hebrew, iso-8859-8, iso-8859-8 visual, iso-ir-138, iso_8859-8, iso_8859-8:1988, logical, visual </td> <td> </td> <td>(code page: 28598) </td></tr> <tr> <td>iso-8859-8-i </td> <td>iso-8859-8-i </td> <td> </td> <td>(code page: 38598) </td></tr> <tr> <td>iso-8859-9 </td> <td>csisolatin5, iso-8859-9, iso-ir-148, iso_8859-9, iso_8859-9:1989, l5, latin5 </td> <td>windows-1254 </td> <td>(code page: 28599) </td></tr> <tr> <td>iso-8859-13 </td> <td>iso-8859-13 </td> <td> </td> <td>(code page: 28603) </td></tr> <tr> <td>iso-8859-15 </td> <td>csisolatin9, iso-8859-15, iso_8859-15, l9, latin9 </td> <td> </td> <td>(code page: 28605) </td></tr> <tr> <td rowspan="10" style="text-align:center">Win </td> <td>windows-874 </td> <td>dos-874, iso-8859-11, tis-620, windows-874 </td> <td> </td> <td>(code page: 874) </td></tr> <tr> <td>windows-1250 </td> <td>windows-1250, x-cp1250 </td> <td> </td> <td>(code page: 1250) </td></tr> <tr> <td>windows-1251 </td> <td>windows-1251, x-cp1251 </td> <td> </td> <td>(code page: 1251) </td></tr> <tr> <td>windows-1252 </td> 
<td>windows-1252, x-ansi </td> <td> </td> <td>(code page: 1252) </td></tr> <tr> <td>windows-1253 </td> <td>windows-1253 </td> <td> </td> <td>(code page: 1253) </td></tr> <tr> <td>windows-1254 </td> <td>windows-1254 </td> <td> </td> <td>(code page: 1254) </td></tr> <tr> <td>windows-1255 </td> <td>windows-1255 </td> <td> </td> <td>(code page: 1255) </td></tr> <tr> <td>windows-1256 </td> <td>cp1256, windows-1256 </td> <td> </td> <td>(code page: 1256) </td></tr> <tr> <td>windows-1257 </td> <td>windows-1257 </td> <td> </td> <td>(code page: 1257) </td></tr> <tr> <td>windows-1258 </td> <td>windows-1258 </td> <td> </td> <td>(code page: 1258) </td></tr> <tr> <td rowspan="12" style="text-align:center">Mac </td> <td>macintosh </td> <td>macintosh </td> <td> </td> <td>(code page: 10000) </td></tr> <tr> <td>x-mac-arabic </td> <td>x-mac-arabic </td> <td> </td> <td>(code page: 10004) </td></tr> <tr> <td>x-mac-ce </td> <td>x-mac-ce </td> <td> </td> <td>(code page: 10029) </td></tr> <tr> <td>x-mac-croatian </td> <td>x-mac-croatian </td> <td> </td> <td>(code page: 10082) </td></tr> <tr> <td>x-mac-cyrillic </td> <td>x-mac-cyrillic </td> <td> </td> <td>(code page: 10007) </td></tr> <tr> <td>x-mac-greek </td> <td>x-mac-greek </td> <td> </td> <td>(code page: 10006) </td></tr> <tr> <td>x-mac-hebrew </td> <td>x-mac-hebrew </td> <td> </td> <td>(code page: 10005) </td></tr> <tr> <td>x-mac-icelandic </td> <td>x-mac-icelandic </td> <td> </td> <td>(code page: 10079) </td></tr> <tr> <td>x-mac-romanian </td> <td>x-mac-romanian </td> <td> </td> <td>(code page: 10010) </td></tr> <tr> <td>x-mac-thai </td> <td>x-mac-thai </td> <td> </td> <td>(code page: 10021) </td></tr> <tr> <td>x-mac-turkish </td> <td>x-mac-turkish </td> <td> </td> <td>(code page: 10081) </td></tr> <tr> <td>x-mac-ukrainian </td> <td>x-mac-ukrainian </td> <td> </td> <td>(code page: 10017) </td></tr> <tr> <td rowspan="16" style="text-align:center">Misc. 
</td> <td>asmo-708 </td> <td>asmo-708 </td> <td> </td> <td>(code page: 708) </td></tr> <tr> <td>koi8-r </td> <td>cskoi8r, koi, koi8, koi8-r, koi8r </td> <td> </td> <td>(code page: 20866) </td></tr> <tr> <td>koi8-u </td> <td>koi8-ru, koi8-u </td> <td> </td> <td>(code page: 21866) </td></tr> <tr> <td>x-cp20261 </td> <td>x-cp20261 </td> <td> </td> <td>(code page: 20261) T.61 / ISO/IEC_6937 </td></tr> <tr> <td>x-cp20269 </td> <td>x-cp20269 </td> <td> </td> <td>(code page: 20269) T.61 / ISO/IEC_6937 (non-combining accents?) </td></tr> <tr> <td>x-europa </td> <td>x-europa </td> <td> </td> <td>(code page: 29001) What is this? </td></tr> <tr> <td>x-iscii-as </td> <td>x-iscii-as </td> <td> </td> <td>(code page: 57006) </td></tr> <tr> <td>x-iscii-be </td> <td>x-iscii-be </td> <td> </td> <td>(code page: 57003) </td></tr> <tr> <td>x-iscii-de </td> <td>x-iscii-de </td> <td> </td> <td>(code page: 57002) </td></tr> <tr> <td>x-iscii-gu </td> <td>x-iscii-gu </td> <td> </td> <td>(code page: 57010) </td></tr> <tr> <td>x-iscii-ka </td> <td>x-iscii-ka </td> <td> </td> <td>(code page: 57008) </td></tr> <tr> <td>x-iscii-ma </td> <td>x-iscii-ma </td> <td> </td> <td>(code page: 57009) </td></tr> <tr> <td>x-iscii-or </td> <td>x-iscii-or </td> <td> </td> <td>(code page: 57007) </td></tr> <tr> <td>x-iscii-pa </td> <td>x-iscii-pa </td> <td> </td> <td>(code page: 57011) </td></tr> <tr> <td>x-iscii-ta </td> <td>x-iscii-ta </td> <td> </td> <td>(code page: 57004) </td></tr> <tr> <td>x-iscii-te </td> <td>x-iscii-te </td> <td> </td> <td>(code page: 57005) </td></tr> <tr> <td rowspan="27" style="font-size:200%; line-height:100%; text-align:center">中<br />日<br />韓 </td> <td>big5 </td> <td>big5, big5-hkscs, cn-big5, csbig5, x-x-big5 </td> <td> </td> <td>(code page: 950) </td></tr> <tr> <td>csiso2022jp </td> <td>csiso2022jp </td> <td> </td> <td>(code page: 50221) </td></tr> <tr> <td>euc-cn </td> <td>euc-cn, x-euc-cn </td> <td> </td> <td>(code page: 51936) </td></tr> <tr> <td>euc-jp </td> 
<td>cseucpkdfmtjapanese, euc-jp, extended_unix_code_packed_format_for_japanese, iso-2022-jpeuc, x-euc, x-euc-jp </td> <td> </td> <td>(code page: 51932) </td></tr> <tr> <td>euc-kr </td> <td>cseuckr, euc-kr, iso-2022-kr-8, iso-2022-kr-8bit </td> <td> </td> <td>(code page: 51949) </td></tr> <tr> <td>gb18030 </td> <td>gb18030 </td> <td> </td> <td>(code page: 54936) </td></tr> <tr> <td>gb2312 </td> <td>chinese, cn-gb, csgb2312, csgb231280, csiso58gb231280, gb2312, gb2312-80, gb231280, gbk, gb_2312-80, iso-ir-58 </td> <td> </td> <td>(code page: 936) GBK superset. The "gb2312-80" label does not seem to work in IE8. </td></tr> <tr> <td>hz-gb-2312 </td> <td>hz-gb-2312 </td> <td> </td> <td>(code page: 52936) </td></tr> <tr> <td>iso-2022-jp </td> <td>iso-2022-jp </td> <td> </td> <td>(code page: 50220) </td></tr> <tr> <td>iso-2022-kr </td> <td>csiso2022kr, iso-2022-kr, iso-2022-kr-7, iso-2022-kr-7bit </td> <td> </td> <td>(code page: 50225) </td></tr> <tr> <td>johab </td> <td>johab </td> <td> </td> <td>(code page: 1361) </td></tr> <tr> <td>ks_c_5601-1987 </td> <td>csksc56011987, iso-ir-149, korean, ks-c-5601, ks-c5601, ksc5601, ksc_5601, ks_c_5601, ks_c_5601-1987, ks_c_5601-1989, ks_c_5601_1987 </td> <td> </td> <td>(code page: 949) EUC-KR superset </td></tr> <tr> <td>shift_jis </td> <td>csshiftjis, cswindows31j, ms_kanji, shift-jis, shift_jis, sjis, windows-31j, x-ms-cp932, x-sjis </td> <td> </td> <td>(code page: 932) </td></tr> <tr> <td>x-chinese-cns </td> <td>x-chinese-cns </td> <td> </td> <td>(code page: 20000) EUC-TW </td></tr> <tr> <td>x-chinese-eten </td> <td>x-chinese-eten </td> <td> </td> <td>(code page: 20002) Other encoding of the Taiwanese CNS character set. 
</td></tr> <tr> <td>x-cp20001 </td> <td>x-cp20001 </td> <td> </td> <td>(code page: 20001) TW (not tested) </td></tr> <tr> <td>x-cp20003 </td> <td>x-cp20003 </td> <td> </td> <td>(code page: 20003) TW (not tested) </td></tr> <tr> <td>x-cp20004 </td> <td>x-cp20004 </td> <td> </td> <td>(code page: 20004) TW (not tested) </td></tr> <tr> <td>x-cp20005 </td> <td>x-cp20005 </td> <td> </td> <td>(code page: 20005) TW (not tested) </td></tr> <tr> <td>x-mac-chinesesimp </td> <td>x-mac-chinesesimp </td> <td> </td> <td>(code page: 10008) EUC-CN superset. Handled as plain EUC-CN? </td></tr> <tr> <td>x-mac-chinesetrad </td> <td>x-mac-chinesetrad </td> <td> </td> <td>(code page: 10002) Big5 superset. </td></tr> <tr> <td>x-mac-japanese </td> <td>x-mac-japanese </td> <td> </td> <td>(code page: 10001) Shift_JIS superset. Handled as Windows Shift_JIS? </td></tr> <tr> <td>x-mac-korean </td> <td>x-mac-korean </td> <td> </td> <td>(code page: 10003) EUC-KR superset. Handled as plain EUC-KR? </td></tr> <tr> <td>x-cp20936 </td> <td>x-cp20936 </td> <td> </td> <td>(code page: 20936) EUC-CN (not the GBK superset) </td></tr> <tr> <td>x-cp20949 </td> <td>x-cp20949 </td> <td> </td> <td>(code page: 20949) EUC-KR (not the Windows superset) </td></tr> <tr> <td>x-cp50227 </td> <td>x-cp50227 </td> <td> </td> <td>(code page: 50227) GBK, including at least some Windows extensions. </td></tr> <tr> <td>(???) </td> <td>x-cp50229 </td> <td> </td> <td>(code page: 50229) ISO-2022-CN subset? Includes GB 2312-80 (CN) and CNS 11643-1992 Plane 1 (TW). </td></tr> <tr> <td rowspan="4" style="font-size:200%; text-align:center">� </td> <td>unicodefffe </td> <td>unicodefffe, utf-16be </td> <td> </td> <td>(code page: 1201) UTF-16BE </td></tr> <tr> <td>utf-16 </td> <td>iso-10646-ucs-2, ucs-2, unicode, utf-16, utf-16le </td> <td> </td> <td>(code page: 1200) UTF-16LE. UCS-2 is not(!) taken to mean UTF-16. 
</td></tr> <tr> <td>utf-7 </td> <td>csunicode11utf7, unicode-1-1-utf-7, unicode-2-0-utf-7, utf-7, x-unicode-1-1-utf-7, x-unicode-2-0-utf-7 </td> <td> </td> <td>(code page: 65000) </td></tr> <tr> <td>utf-8 </td> <td>unicode-1-1-utf-8, unicode-2-0-utf-8, utf-8, x-unicode-1-1-utf-8, x-unicode-2-0-utf-8 </td> <td> </td> <td>(code page: 65001) </td></tr> <tr> <td rowspan="35" style="text-align:center">EBC<br />DIC </td> <td>cp875 </td> <td>cp875 </td> <td> </td> <td>(code page: 875) EBCDIC Greece </td></tr> <tr> <td>cp1025 </td> <td>cp1025 </td> <td> </td> <td>(code page: 21025) EBCDIC Cyrillic Multilingual </td></tr> <tr> <td>ibm-thai </td> <td>csibmthai, ibm-thai </td> <td> </td> <td>(code page: 20838) EBCDIC Thailand </td></tr> <tr> <td>ibm00924 </td> <td>ccsid00924, cp00924, ebcdic-latin9--euro, ibm00924 </td> <td> </td> <td>(code page: 20924) EBCDIC Latin 9 </td></tr> <tr> <td>ibm01047 </td> <td>ibm01047 </td> <td> </td> <td>(code page: 1047) EBCDIC Latin 1/Open Systems </td></tr> <tr> <td>ibm01140 </td> <td>ccsid01140, cp01140, ebcdic-us-37+euro, ibm01140 </td> <td> </td> <td>(code page: 1140) EBCDIC USA, Canada, etc. 
ECECP </td></tr> <tr> <td>ibm01141 </td> <td>ccsid01141, cp01141, ebcdic-de-273+euro, ibm01141 </td> <td> </td> <td>(code page: 1141) EBCDIC Austria, Germany ECECP </td></tr> <tr> <td>ibm01142 </td> <td>ccsid01142, cp01142, ebcdic-dk-277+euro, ebcdic-no-277+euro, ibm01142 </td> <td> </td> <td>(code page: 1142) EBCDIC Denmark, Norway ECECP </td></tr> <tr> <td>ibm01143 </td> <td>ccsid01143, cp01143, ebcdic-fi-278+euro, ebcdic-se-278+euro, ibm01143 </td> <td> </td> <td>(code page: 1143) EBCDIC Finland, Sweden ECECP </td></tr> <tr> <td>ibm01144 </td> <td>ccsid01144, cp01144, ebcdic-it-280+euro, ibm01144 </td> <td> </td> <td>(code page: 1144) EBCDIC Italy ECECP </td></tr> <tr> <td>ibm01145 </td> <td>ccsid01145, cp01145, ebcdic-es-284+euro, ibm01145 </td> <td> </td> <td>(code page: 1145) EBCDIC Spain, Latin America (Spanish) </td></tr> <tr> <td>ibm01146 </td> <td>ccsid01146, cp01146, ebcdic-gb-285+euro, ibm01146 </td> <td> </td> <td>(code page: 1146) EBCDIC UK ECECP </td></tr> <tr> <td>ibm01147 </td> <td>ccsid01147, cp01147, ebcdic-fr-297+euro, ibm01147 </td> <td> </td> <td>(code page: 1147) EBCDIC France ECECP </td></tr> <tr> <td>ibm01148 </td> <td>ccsid01148, cp01148, ebcdic-international-500+euro, ibm01148 </td> <td> </td> <td>(code page: 1148) EBCDIC International ECECP </td></tr> <tr> <td>ibm01149 </td> <td>ccsid01149, cp01149, ebcdic-is-871+euro, ibm01149 </td> <td> </td> <td>(code page: 1149) EBCDIC Iceland ECECP </td></tr> <tr> <td>ibm037 </td> <td>cp037, csibm037, ebcdic-cp-ca, ebcdic-cp-nl, ebcdic-cp-us, ebcdic-cp-wt, ibm037 </td> <td> </td> <td>(code page: 37) EBCDIC USA/Canada - CECP </td></tr> <tr> <td>ibm1026 </td> <td>cp1026, csibm1026, ibm1026 </td> <td> </td> <td>(code page: 1026) EBCDIC Latin #5 - Turkey </td></tr> <tr> <td>ibm273 </td> <td>cp273, csibm273, ibm273 </td> <td> </td> <td>(code page: 20273) EBCDIC Germany F.R./Austria - CECP </td></tr> <tr> <td>ibm277 </td> <td>csibm277, ebcdic-cp-dk, ebcdic-cp-no, ibm277 </td> <td> </td> <td>(code page: 
20277) EBCDIC Denmark, Norway - CECP </td></tr> <tr> <td>ibm278 </td> <td>cp278, csibm278, ebcdic-cp-fi, ebcdic-cp-se, ibm278 </td> <td> </td> <td>(code page: 20278) EBCDIC Finland, Sweden - CECP </td></tr> <tr> <td>ibm280 </td> <td>cp280, csibm280, ebcdic-cp-it, ibm280 </td> <td> </td> <td>(code page: 20280) EBCDIC Italy - CECP </td></tr> <tr> <td>ibm284 </td> <td>cp284, csibm284, ebcdic-cp-es, ibm284 </td> <td> </td> <td>(code page: 20284) EBCDIC Spain/Latin America - CECP </td></tr> <tr> <td>ibm285 </td> <td>cp285, csibm285, ebcdic-cp-gb, ibm285 </td> <td> </td> <td>(code page: 20285) EBCDIC United Kingdom - CECP </td></tr> <tr> <td>ibm290 </td> <td>cp290, csibm290, ebcdic-jp-kana, ibm290 </td> <td> </td> <td>(code page: 20290) EBCDIC Japanese (Katakana) Extended. Katakana replace lowercase EBCDIC. </td></tr> <tr> <td>ibm297 </td> <td>cp297, csibm297, ebcdic-cp-fr, ibm297 </td> <td> </td> <td>(code page: 20297) EBCDIC France - CECP </td></tr> <tr> <td>ibm420 </td> <td>cp420, csibm420, ebcdic-cp-ar1, ibm420 </td> <td> </td> <td>(code page: 20420) EBCDIC Arabic Bilingual </td></tr> <tr> <td>ibm423 </td> <td>cp423, csibm423, ebcdic-cp-gr, ibm423 </td> <td> </td> <td>(code page: 20423) EBCDIC Greece - 183 </td></tr> <tr> <td>ibm424 </td> <td>cp424, csibm424, ebcdic-cp-he, ibm424 </td> <td> </td> <td>(code page: 20424) EBCDIC Israel (Hebrew) </td></tr> <tr> <td>ibm500 </td> <td>cp500, csibm500, ebcdic-cp-be, ebcdic-cp-ch, ibm500 </td> <td> </td> <td>(code page: 500) EBCDIC International #5 </td></tr> <tr> <td>ibm870 </td> <td>cp870, csibm870, ebcdic-cp-roece, ebcdic-cp-yu, ibm870 </td> <td> </td> <td>(code page: 870) EBCDIC Latin 2, Multilingual </td></tr> <tr> <td>ibm871 </td> <td>cp871, csibm871, ebcdic-cp-is, ibm871 </td> <td> </td> <td>(code page: 20871) EBCDIC Iceland </td></tr> <tr> <td>ibm880 </td> <td>cp880, csibm880, ebcdic-cyrillic, ibm880 </td> <td> </td> <td>(code page: 20880) EBCDIC Cyrillic, Multilingual </td></tr> <tr> <td>ibm905 </td> <td>cp905, 
csibm905, ebcdic-cp-tr, ibm905 </td> <td> </td> <td>(code page: 20905) EBCDIC Latin 3 </td></tr> <tr> <td>x-ebcdic-koreanextended </td> <td>x-ebcdic-koreanextended </td> <td> </td> <td>(code page: 20833) EBCDIC Korean (some variant) </td></tr> <tr> <td>(???) </td> <td>x-cp21027 </td> <td> </td> <td>(code page: 21027) EBCDIC Japanese (some variant). Certain EBCDIC letters/digits decoded incorrectly. </td></tr> <tr> <td rowspan="6" style="text-align:center">¿···? </td> <td>(???) </td> <td>cp930 </td> <td> </td> <td>(code page: 50930) JAPAN MIX EBCDIC? Appears to be ASCII-compatible... </td></tr> <tr> <td>(???) </td> <td>cp933 </td> <td> </td> <td>(code page: 50933) KOREA MIX EBCDIC? Appears to be ASCII-compatible... </td></tr> <tr> <td>(???) </td> <td>cp935 </td> <td> </td> <td>(code page: 50935) S-CHINESE MIX EBCDIC? Appears to be ASCII-compatible... </td></tr> <tr> <td>(???) </td> <td>cp937 </td> <td> </td> <td>(code page: 50937) T-CHINESE MIX EBCDIC? Appears to be ASCII-compatible... </td></tr> <tr> <td>(???) </td> <td>cp939 </td> <td> </td> <td>(code page: 50939) JAPAN MIX EBCDIC? Appears to be ASCII-compatible... </td></tr> <tr> <td>(???) </td> <td>x-ebcdic-japaneseanduscanada </td> <td> </td> <td>(code page: 50931) EBCDIC? Appears to be ASCII-compatible... </td></tr> </tbody></table> <p>All EBCDIC encodings contain the letters A–Z, a–z and the digits 0–9 in EBCDIC positions (unless there is a note in the table saying otherwise). 
</p> <h4><span class="mw-headline" id="Data_2">Data</span></h4> <p>Source for the encodings and labels data: <a rel="nofollow" class="external free" href="http://lists.w3.org/Archives/Public/public-html-comments/2009Sep/att-0050/ie.encodings.txt">http://lists.w3.org/Archives/Public/public-html-comments/2009Sep/att-0050/ie.encodings.txt</a> </p><p>Labels and code pages .NET supports: <a rel="nofollow" class="external free" href="http://blogs.msdn.com/shawnste/archive/2009/08/18/alternate-encoding-names-recognized-by-net-ie.aspx">http://blogs.msdn.com/shawnste/archive/2009/08/18/alternate-encoding-names-recognized-by-net-ie.aspx</a> (there should be few, if any, differences with the above) </p><p>Different data for encodings and labels IE supports (might be more accurate): <a rel="nofollow" class="external free" href="http://html5.org/temp/2009/ie-encodings.htm">http://html5.org/temp/2009/ie-encodings.htm</a> (original: <a rel="nofollow" class="external free" href="http://web.archive.org/web/20080204211015/http://www.hitachi-to.co.jp/prod/prod_2/inter/emk/help/TextEncoder/CodePage.htm">http://web.archive.org/web/20080204211015/http://www.hitachi-to.co.jp/prod/prod_2/inter/emk/help/TextEncoder/CodePage.htm</a>) </p> <h3><span class="mw-headline" id="Safari">Safari</span></h3> <h4><span class="mw-headline" id="Matching_4">Matching</span></h4> <p>UTS22 </p> <h4><span class="mw-headline" id="Encodings_4">Encodings</span></h4> <p>FIXME </p> <h4><span class="mw-headline" id="Data_3">Data</span></h4> <p>Based on discussion with Maciej (Apple) archived here: <a rel="nofollow" class="external free" href="http://krijnhoetmer.nl/irc-logs/whatwg/20090909#l-110">http://krijnhoetmer.nl/irc-logs/whatwg/20090909#l-110</a> </p><p>Safari uses the system version of ICU on Mac (4.0 for Snow Leopard, 3.6 for Leopard and 3.2 for Tiger) and in addition supports TEC on Mac for encodings that are not in ICU. (Unclear how much of TEC is enabled.) 
</p><p>On Windows, Safari ships with ICU 4.0. </p> <hr /> <p>According to webkit/WebCore/platform/text/TextCodecICU.cpp, WebKit now uses ICU &lt;<a rel="nofollow" class="external free" href="http://site.icu-project.org/">http://site.icu-project.org/</a>&gt; with additional aliases (webkit/WebCore/platform/text/TextCodecICU.cpp), additional encodings (webkit/WebCore/platform/text/mac/mac-encodings.txt) possibly implemented using TECM at least on the Mac, a list of official IANA labels (webkit/WebCore/platform/text/mac/character-sets.txt) and probably a few more which I have not noticed. </p><p>ICU 4.2’s icu/source/data/mappings/convrtrs.txt or &lt;<a rel="nofollow" class="external free" href="http://demo.icu-project.org/icu-bin/convexp">http://demo.icu-project.org/icu-bin/convexp</a>&gt; lists encodings and labels not supported in Safari 4.0 on Leopard, and webkit/WebCore/platform/text/TextCodecICU.cpp mentions that Tiger included ICU 3.2. </p><p>See also: <a rel="nofollow" class="external free" href="http://trac.webkit.org/browser/trunk/WebCore/platform/text">http://trac.webkit.org/browser/trunk/WebCore/platform/text</a> </p> <h3><span class="mw-headline" id="Chrome">Chrome</span></h3> <p>Similar to Safari with some customizations in ICU alias tables. Chrome 3.0 has ICU 3.8 plus customizations for EUC-JP (to match IE/Firefox). For EUC-KR and GBK, we use different mapping tables than used by Safari (which just uses ICU's default tables for them). ISO-8859-16 is also added. </p><p>Chrome trunk uses ICU 4.2. </p> <h2><span class="mw-headline" id="Thoughts">Thoughts</span></h2> <h3><span class="mw-headline" id="Anne">Anne</span></h3> <p>If it can be agreed upon that all non-UTF-8 and non-UTF-16 encodings are legacy encodings I personally would not mind advocating that we should drop support for US-ASCII and ISO-8859-1 completely in favor of Windows-1252 (and do the same for similar situations). I.e. that US-ASCII and ISO-8859-1 labels simply map to Windows-1252. 
This should simplify code a little bit as well. </p><p>I also think that we should ban UTF-7, UTF-32 and all EBCDIC encodings. This is already mostly done by HTML5. </p> <hr /> <p>I wonder if we can standardize (document to start with) the encoding detection algorithm. The list of encodings is fixed. The list of legacy pages is also fairly fixed. The detection algorithms in browsers should be fairly stable. Certainly looks possible. </p> <h3><span class="mw-headline" id="E-mails">E-mails</span></h3> <p>WHATWG got these e-mails that we should make sure to cover as part of this: </p> <ul><li><a rel="nofollow" class="external free" href="http://lists.whatwg.org/htdig.cgi/whatwg-whatwg.org/2009-July/021207.html">http://lists.whatwg.org/htdig.cgi/whatwg-whatwg.org/2009-July/021207.html</a></li> <li><a rel="nofollow" class="external free" href="http://lists.whatwg.org/pipermail/whatwg-whatwg.org/2009-September/023208.html">http://lists.whatwg.org/pipermail/whatwg-whatwg.org/2009-September/023208.html</a></li></ul> <h3><span class="mw-headline" id="Spec_notes">Spec notes</span></h3> <p>This is what the spec used to say about encodings: </p> <pre> &lt;p&gt;In addition, user agents must support the aliases given in the following table for every character encoding they support, so that labels from the first column are treated as equivalent to the labels given in the corresponding cell from the second column on the same row.&lt;/p&gt; &lt;table&gt; &lt;caption&gt;Additional character encoding aliases&lt;/caption&gt; &lt;thead&gt; &lt;tr&gt; &lt;th&gt; Alias &lt;th&gt; Corresponding encoding &lt;th&gt; References &lt;tbody&gt; &lt;tr&gt; &lt;td&gt; x-sjis &lt;td&gt; windows-31J &lt;td&gt; &lt;a href="#refsSHIFTJIS"&gt;[SHIFTJIS]&lt;/a&gt; &lt;a href="#refsWIN31J"&gt;[WIN31J]&lt;/a&gt; &lt;tr&gt; &lt;td&gt; windows-932 &lt;td&gt; windows-31J &lt;td&gt; &lt;a href="#refsWIN31J"&gt;[WIN31J]&lt;/a&gt; &lt;tr&gt; &lt;td&gt; x-x-big5 &lt;td&gt; Big5 &lt;td&gt; &lt;a href="#refsBIG5"&gt;[BIG5]&lt;/a&gt; &lt;/tbody&gt; &lt;/table&gt; </pre> <h3><span class="mw-headline" id="ICU_in_Chrome_and_Safari">ICU in Chrome and Safari</span></h3> <p>Giving a link to or actually including 
the info on what Safari and Chrome support would be nice. It seems like this would be at least a subset, but it sounds like more may have been added from the text above. </p><p><a rel="nofollow" class="external free" href="http://demo.icu-project.org/icu-bin/convexp">http://demo.icu-project.org/icu-bin/convexp</a> </p> <h2><span class="mw-headline" id="Misc.">Misc.</span></h2> <p><a rel="nofollow" class="external free" href="http://philip.html5.org/data/charsets.html">http://philip.html5.org/data/charsets.html</a> </p> <!-- NewPP limit report Cached time: 20250204233442 Cache expiry: 86400 Reduced expiry: false Complications: [show‐toc] CPU time usage: 0.060 seconds Real time usage: 0.077 seconds Preprocessor visited node count: 94/1000000 Post‐expand include size: 477/2097152 bytes Template argument size: 156/2097152 bytes Highest expansion depth: 4/100 Expensive parser function count: 0/100 Unstrip recursion depth: 0/20 Unstrip post‐expand size: 985/5000000 bytes --> <!-- Transclusion expansion time report (%,ms,calls,template) 100.00% 11.612 1 Template:Obsolete 100.00% 11.612 1 -total --> <!-- Saved in parser cache with key mediawiki:pcache:idhash:1849-0!canonical and timestamp 20250204233442 and revision id 8675. 
--> </div> <div class="printfooter" data-nosnippet="">Retrieved from "<a dir="ltr" href="https://wiki.whatwg.org/index.php?title=Web_Encodings&oldid=8675">https://wiki.whatwg.org/index.php?title=Web_Encodings&oldid=8675</a>"</div></div> <div id="catlinks" class="catlinks" data-mw="interface"><div id="mw-normal-catlinks" class="mw-normal-catlinks"><a href="/wiki/Special:Categories" title="Special:Categories">Categories</a>: <ul><li><a href="/wiki/Category:Obsolete_documents" title="Category:Obsolete documents">Obsolete documents</a></li><li><a href="/wiki/Category:Obsolete_specifications" title="Category:Obsolete specifications">Obsolete specifications</a></li><li><a href="/wiki/Category:Spec_coordination" title="Category:Spec coordination">Spec coordination</a></li><li><a href="/wiki/Category:Registries" title="Category:Registries">Registries</a></li></ul></div></div> </div> </div> <div id="mw-navigation"> <h2>Navigation menu</h2> <div id="mw-head"> <nav id="p-personal" class="vector-menu mw-portlet mw-portlet-personal vector-user-menu-legacy" aria-labelledby="p-personal-label" role="navigation" > <h3 id="p-personal-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">Personal tools</span> </h3> <div class="vector-menu-content"> <ul class="vector-menu-content-list"><li id="pt-login" class="mw-list-item"><a href="/index.php?title=Special:UserLogin&returnto=Web+Encodings" title="You are encouraged to log in; however, it is not mandatory [o]" accesskey="o"><span>Log in</span></a></li></ul> </div> </nav> <div id="left-navigation"> <nav id="p-namespaces" class="vector-menu mw-portlet mw-portlet-namespaces vector-menu-tabs vector-menu-tabs-legacy" aria-labelledby="p-namespaces-label" role="navigation" > <h3 id="p-namespaces-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">Namespaces</span> </h3> <div class="vector-menu-content"> <ul class="vector-menu-content-list"><li id="ca-nstab-main" class="selected 
mw-list-item"><a href="/wiki/Web_Encodings" title="View the content page [c]" accesskey="c"><span>Page</span></a></li><li id="ca-talk" class="new mw-list-item"><a href="/index.php?title=Talk:Web_Encodings&action=edit&redlink=1" rel="discussion" title="Discussion about the content page (page does not exist) [t]" accesskey="t"><span>Discussion</span></a></li></ul> </div> </nav> <nav id="p-variants" class="vector-menu mw-portlet mw-portlet-variants emptyPortlet vector-menu-dropdown" aria-labelledby="p-variants-label" role="navigation" > <input type="checkbox" id="p-variants-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-p-variants" class="vector-menu-checkbox" aria-labelledby="p-variants-label" /> <label id="p-variants-label" aria-label="Change language variant" class="vector-menu-heading " > <span class="vector-menu-heading-label">English</span> </label> <div class="vector-menu-content"> <ul class="vector-menu-content-list"></ul> </div> </nav> </div> <div id="right-navigation"> <nav id="p-views" class="vector-menu mw-portlet mw-portlet-views vector-menu-tabs vector-menu-tabs-legacy" aria-labelledby="p-views-label" role="navigation" > <h3 id="p-views-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">Views</span> </h3> <div class="vector-menu-content"> <ul class="vector-menu-content-list"><li id="ca-view" class="selected mw-list-item"><a href="/wiki/Web_Encodings"><span>Read</span></a></li><li id="ca-viewsource" class="mw-list-item"><a href="/index.php?title=Web_Encodings&action=edit" title="This page is protected. 
You can view its source [e]" accesskey="e"><span>View source</span></a></li><li id="ca-history" class="mw-list-item"><a href="/index.php?title=Web_Encodings&action=history" title="Past revisions of this page [h]" accesskey="h"><span>View history</span></a></li></ul> </div> </nav> <nav id="p-cactions" class="vector-menu mw-portlet mw-portlet-cactions emptyPortlet vector-menu-dropdown" aria-labelledby="p-cactions-label" role="navigation" title="More options" > <input type="checkbox" id="p-cactions-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-p-cactions" class="vector-menu-checkbox" aria-labelledby="p-cactions-label" /> <label id="p-cactions-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">More</span> </label> <div class="vector-menu-content"> <ul class="vector-menu-content-list"></ul> </div> </nav> <div id="p-search" role="search" class="vector-search-box-vue vector-search-box-show-thumbnail vector-search-box-auto-expand-width vector-search-box"> <div> <h3 > <label for="searchInput">Search</label> </h3> <form action="/index.php" id="searchform" class="vector-search-box-form"> <div id="simpleSearch" class="vector-search-box-inner" data-search-loc="header-navigation"> <input class="vector-search-box-input" type="search" name="search" placeholder="Search WHATWG Wiki" aria-label="Search WHATWG Wiki" autocapitalize="sentences" title="Search WHATWG Wiki [f]" accesskey="f" id="searchInput" > <input type="hidden" name="title" value="Special:Search"> <input id="mw-searchButton" class="searchButton mw-fallbackSearchButton" type="submit" name="fulltext" title="Search the pages for this text" value="Search"> <input id="searchButton" class="searchButton" type="submit" name="go" title="Go to a page with this exact name if it exists" value="Go"> </div> </form> </div> </div> </div> </div> <div id="mw-panel"> <div id="p-logo" role="banner"> <a class="mw-wiki-logo" href="/" title="Visit the main page"></a> </div> <nav 
id="p-navigation" class="vector-menu mw-portlet mw-portlet-navigation vector-menu-portal portal" aria-labelledby="p-navigation-label" role="navigation" > <h3 id="p-navigation-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">Navigation</span> </h3> <div class="vector-menu-content"> <ul class="vector-menu-content-list"><li id="n-mainpage" class="mw-list-item"><a href="/" title="Visit the main page [z]" accesskey="z"><span>Main Page</span></a></li><li id="n-randompage" class="mw-list-item"><a href="/wiki/Special:Random" title="Load a random page [x]" accesskey="x"><span>Random page</span></a></li><li id="n-recentchanges" class="mw-list-item"><a href="/wiki/Special:RecentChanges" title="A list of recent changes in the wiki [r]" accesskey="r"><span>Recent changes</span></a></li></ul> </div> </nav> <nav id="p-WHATWG" class="vector-menu mw-portlet mw-portlet-WHATWG vector-menu-portal portal" aria-labelledby="p-WHATWG-label" role="navigation" > <h3 id="p-WHATWG-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">WHATWG</span> </h3> <div class="vector-menu-content"> <ul class="vector-menu-content-list"><li id="n-Standards" class="mw-list-item"><a href="https://spec.whatwg.org/" rel="nofollow"><span>Standards</span></a></li><li id="n-FAQ" class="mw-list-item"><a href="https://whatwg.org/faq" rel="nofollow"><span>FAQ</span></a></li><li id="n-Chat" class="mw-list-item"><a href="https://whatwg.org/chat" rel="nofollow"><span>Chat</span></a></li><li id="n-Code-of-Conduct" class="mw-list-item"><a href="https://whatwg.org/code-of-conduct" rel="nofollow"><span>Code of Conduct</span></a></li><li id="n-GitHub" class="mw-list-item"><a href="https://github.com/whatwg" rel="nofollow"><span>GitHub</span></a></li><li id="n-What-you-can-do" class="mw-list-item"><a href="/wiki/What_you_can_do"><span>What you can do</span></a></li><li id="n-To-do-list" class="mw-list-item"><a href="/wiki/Specs_todo"><span>To-do list</span></a></li></ul> 
</div> </nav> <nav id="p-Registries" class="vector-menu mw-portlet mw-portlet-Registries vector-menu-portal portal" aria-labelledby="p-Registries-label" role="navigation" > <h3 id="p-Registries-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">Registries</span> </h3> <div class="vector-menu-content"> <ul class="vector-menu-content-list"><li id="n-&lt;meta-name&gt;" class="mw-list-item"><a href="/wiki/MetaExtensions"><span>&lt;meta name&gt;</span></a></li><li id="n-rel=&quot;&quot;" class="mw-list-item"><a href="http://microformats.org/wiki/existing-rel-values" rel="nofollow"><span>rel=""</span></a></li></ul> </div> </nav> <nav id="p-tb" class="vector-menu mw-portlet mw-portlet-tb vector-menu-portal portal" aria-labelledby="p-tb-label" role="navigation" > <h3 id="p-tb-label" class="vector-menu-heading " > <span class="vector-menu-heading-label">Tools</span> </h3> <div class="vector-menu-content"> <ul class="vector-menu-content-list"><li id="t-whatlinkshere" class="mw-list-item"><a href="/wiki/Special:WhatLinksHere/Web_Encodings" title="A list of all wiki pages that link here [j]" accesskey="j"><span>What links here</span></a></li><li id="t-recentchangeslinked" class="mw-list-item"><a href="/wiki/Special:RecentChangesLinked/Web_Encodings" rel="nofollow" title="Recent changes in pages linked from this page [k]" accesskey="k"><span>Related changes</span></a></li><li id="t-specialpages" class="mw-list-item"><a href="/wiki/Special:SpecialPages" title="A list of all special pages [q]" accesskey="q"><span>Special pages</span></a></li><li id="t-print" class="mw-list-item"><a href="javascript:print();" rel="alternate" title="Printable version of this page [p]" accesskey="p"><span>Printable version</span></a></li><li id="t-permalink" class="mw-list-item"><a href="/index.php?title=Web_Encodings&oldid=8675" title="Permanent link to this revision of this page"><span>Permanent link</span></a></li><li id="t-info" class="mw-list-item"><a 
href="/index.php?title=Web_Encodings&action=info" title="More information about this page"><span>Page information</span></a></li></ul> </div> </nav> </div> </div> <footer id="footer" class="mw-footer" role="contentinfo" > <ul id="footer-info"> <li id="footer-info-lastmod"> This page was last edited on 23 October 2012, at 19:35.</li> <li id="footer-info-copyright">Content is available under <a href="/wiki/WHATWG_Wiki:Copyrights" title="WHATWG Wiki:Copyrights">a CC0 Universal Public Domain Declaration, with some restrictions</a> unless otherwise noted.</li> </ul> <ul id="footer-places"> <li id="footer-places-about"><a href="/wiki/WHATWG_Wiki:About">About WHATWG Wiki</a></li> </ul> <ul id="footer-icons" class="noprint"> <li id="footer-poweredbyico"><a href="https://www.mediawiki.org/"><img src="/resources/assets/poweredby_mediawiki_88x31.png" alt="Powered by MediaWiki" srcset="/resources/assets/poweredby_mediawiki_132x47.png 1.5x, /resources/assets/poweredby_mediawiki_176x62.png 2x" width="88" height="31" loading="lazy"/></a></li> </ul> </footer> <script>(RLQ=window.RLQ||[]).push(function(){mw.config.set({"wgPageParseReport":{"limitreport":{"cputime":"0.060","walltime":"0.077","ppvisitednodes":{"value":94,"limit":1000000},"postexpandincludesize":{"value":477,"limit":2097152},"templateargumentsize":{"value":156,"limit":2097152},"expansiondepth":{"value":4,"limit":100},"expensivefunctioncount":{"value":0,"limit":100},"unstrip-depth":{"value":0,"limit":20},"unstrip-size":{"value":985,"limit":5000000},"timingprofile":["100.00% 11.612 1 Template:Obsolete","100.00% 11.612 1 -total"]},"cachereport":{"timestamp":"20250204233442","ttl":86400,"transientcontent":false}}});mw.config.set({"wgBackendResponseTime":263});});</script> </body> <!-- Cached 20250205023058 --> </html>