<!-- CINXE.COM

Universal Character Set characters - Wikipedia -->

<!DOCTYPE html> <html class="client-nojs vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-sticky-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vector-feature-custom-font-size-clientpref-1 vector-feature-appearance-pinned-clientpref-1 vector-feature-night-mode-enabled skin-theme-clientpref-day vector-toc-available" lang="en" dir="ltr"> <head> <meta charset="UTF-8"> <title>Universal Character Set characters - Wikipedia</title> <!-- Inline bootstrap script: rewrites the class list of the root element and defines the RLCONF, RLSTATE and RLPAGEMODULES globals. --><script>/* Replace the server-rendered "client-nojs ..." class list on the root element with the "client-js ..." variant below. If an "enwikimwclientpreferences" cookie is present, its value is split on "%2C"; for each entry the trailing "-clientpref-<value>" (and any character that is not a word character or hyphen) is stripped to obtain the feature prefix, and the matching "<prefix>-clientpref-<value>" class in the list is replaced by the cookie entry. */(function(){var className="client-js vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-sticky-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vector-feature-custom-font-size-clientpref-1 vector-feature-appearance-pinned-clientpref-1 vector-feature-night-mode-enabled skin-theme-clientpref-day vector-toc-available";var cookie=document.cookie.match(/(?:^|; )enwikimwclientpreferences=([^;]+)/);if(cookie){cookie[1].split('%2C').forEach(function(pref){className=className.replace(new RegExp('(^| )'+pref.replace(/-clientpref-\w+$|[^\w-]+/g,'')+'-clientpref-\\w+( |$)'),'$1'+pref+'$2');});}document.documentElement.className=className;}());/* RLCONF: global object literal of per-page configuration values (page name, revision ids, categories, feature flags, ...). NOTE(review): presumably read by the startup script requested from /w/load.php further down; the consumer is not visible here. */RLCONF={"wgBreakFrames":false,"wgSeparatorTransformTable":["",""],"wgDigitTransformTable":["",""],"wgDefaultDateFormat":"dmy", 
"wgMonthNames":["","January","February","March","April","May","June","July","August","September","October","November","December"],"wgRequestId":"071691b4-3e30-40a1-a8cd-07f1771d7b4e","wgCanonicalNamespace":"","wgCanonicalSpecialPageName":false,"wgNamespaceNumber":0,"wgPageName":"Universal_Character_Set_characters","wgTitle":"Universal Character Set characters","wgCurRevisionId":1255067307,"wgRevisionId":1255067307,"wgArticleId":10633237,"wgIsArticle":true,"wgIsRedirect":false,"wgAction":"view","wgUserName":null,"wgUserGroups":["*"],"wgCategories":["Articles with short description","Short description is different from Wikidata","Commons category link is on Wikidata","IEC standards","Unicode"],"wgPageViewLanguage":"en","wgPageContentLanguage":"en","wgPageContentModel":"wikitext","wgRelevantPageName":"Universal_Character_Set_characters","wgRelevantArticleId":10633237,"wgIsProbablyEditable":true,"wgRelevantPageIsProbablyEditable":true,"wgRestrictionEdit":[],"wgRestrictionMove":[], "wgRedirectedFrom":"􏿿","wgNoticeProject":"wikipedia","wgCiteReferencePreviewsActive":false,"wgFlaggedRevsParams":{"tags":{"status":{"levels":1}}},"wgMediaViewerOnClick":true,"wgMediaViewerEnabledByDefault":true,"wgPopupsFlags":0,"wgVisualEditor":{"pageLanguageCode":"en","pageLanguageDir":"ltr","pageVariantFallbacks":"en"},"wgMFDisplayWikibaseDescriptions":{"search":true,"watchlist":true,"tagline":false,"nearby":true},"wgWMESchemaEditAttemptStepOversample":false,"wgWMEPageLength":60000,"wgInternalRedirectTargetUrl":"/wiki/Universal_Character_Set_characters#Noncharacters","wgRelatedArticlesCompat":[],"wgEditSubmitButtonLabelPublish":true,"wgULSPosition":"interlanguage","wgULSisCompactLinksEnabled":false,"wgVector2022LanguageInHeader":true,"wgULSisLanguageSelectorEmpty":false,"wgWikibaseItemId":"Q897819","wgCheckUserClientHintsHeadersJsApi":["brands","architecture","bitness","fullVersionList","mobile","model","platform","platformVersion"],"GEHomepageSuggestedEditsEnableTopics":true, 
"wgGETopicsMatchModeEnabled":false,"wgGEStructuredTaskRejectionReasonTextInputEnabled":false,"wgGELevelingUpEnabledForUser":false};/* RLSTATE: global map from module name to a state string ("ready" or "loading" in this page). */RLSTATE={"ext.globalCssJs.user.styles":"ready","site.styles":"ready","user.styles":"ready","ext.globalCssJs.user":"ready","user":"ready","user.options":"loading","ext.cite.styles":"ready","skins.vector.search.codex.styles":"ready","skins.vector.styles":"ready","skins.vector.icons":"ready","jquery.makeCollapsible.styles":"ready","ext.wikimediamessages.styles":"ready","ext.visualEditor.desktopArticleTarget.noscript":"ready","ext.uls.interlanguage":"ready","wikibase.client.init":"ready","ext.wikimediaBadges":"ready"};/* RLPAGEMODULES: global array of module names for this page. NOTE(review): presumably the modules the loader should fetch; confirm against the startup script. */RLPAGEMODULES=["mediawiki.action.view.redirect","ext.cite.ux-enhancements","mediawiki.page.media","site","mediawiki.page.ready","jquery.makeCollapsible","mediawiki.toc","skins.vector.js","ext.centralNotice.geoIP","ext.centralNotice.startUp","ext.gadget.ReferenceTooltips","ext.gadget.switcher","ext.urlShortener.toolbar", "ext.centralauth.centralautologin","mmv.bootstrap","ext.popups","ext.visualEditor.desktopArticleTarget.init","ext.visualEditor.targetLoader","ext.echo.centralauth","ext.eventLogging","ext.wikimediaEvents","ext.navigationTiming","ext.uls.interface","ext.cx.eventlogging.campaigns","ext.cx.uls.quick.actions","wikibase.client.vector-2022","ext.checkUser.clientHints","ext.growthExperiments.SuggestedEditSession"];</script> <!-- Second inline script: appends a callback to the RLQ queue. --><script>/* Create window.RLQ if it does not exist yet and push a callback onto it. When invoked, the callback calls mw.loader.impl with a factory for "user.options@12s5i" whose module body sets the patrol, watch and csrf tokens to the string "+\\". */(RLQ=window.RLQ||[]).push(function(){mw.loader.impl(function(){return["user.options@12s5i",function($,jQuery,require,module){mw.user.tokens.set({"patrolToken":"+\\","watchToken":"+\\","csrfToken":"+\\"}); }];});});</script> <link rel="stylesheet" href="/w/load.php?lang=en&amp;modules=ext.cite.styles%7Cext.uls.interlanguage%7Cext.visualEditor.desktopArticleTarget.noscript%7Cext.wikimediaBadges%7Cext.wikimediamessages.styles%7Cjquery.makeCollapsible.styles%7Cskins.vector.icons%2Cstyles%7Cskins.vector.search.codex.styles%7Cwikibase.client.init&amp;only=styles&amp;skin=vector-2022"> <script 
async="" src="/w/load.php?lang=en&amp;modules=startup&amp;only=scripts&amp;raw=1&amp;skin=vector-2022"></script> <meta name="ResourceLoaderDynamicStyles" content=""> <link rel="stylesheet" href="/w/load.php?lang=en&amp;modules=site.styles&amp;only=styles&amp;skin=vector-2022"> <meta name="generator" content="MediaWiki 1.44.0-wmf.6"> <meta name="referrer" content="origin"> <meta name="referrer" content="origin-when-cross-origin"> <meta name="robots" content="max-image-preview:standard"> <meta name="format-detection" content="telephone=no"> <meta property="og:image" content="https://upload.wikimedia.org/wikipedia/commons/thumb/0/09/New_Unicode_logo.svg/1200px-New_Unicode_logo.svg.png"> <meta property="og:image:width" content="1200"> <meta property="og:image:height" content="1439"> <meta property="og:image" content="https://upload.wikimedia.org/wikipedia/commons/thumb/0/09/New_Unicode_logo.svg/800px-New_Unicode_logo.svg.png"> <meta property="og:image:width" content="800"> <meta property="og:image:height" content="959"> <meta property="og:image" content="https://upload.wikimedia.org/wikipedia/commons/thumb/0/09/New_Unicode_logo.svg/640px-New_Unicode_logo.svg.png"> <meta property="og:image:width" content="640"> <meta property="og:image:height" content="768"> <meta name="viewport" content="width=1120"> <meta property="og:title" content="Universal Character Set characters - Wikipedia"> <meta property="og:type" content="website"> <link rel="preconnect" href="//upload.wikimedia.org"> <link rel="alternate" media="only screen and (max-width: 640px)" href="//en.m.wikipedia.org/wiki/Universal_Character_Set_characters#Noncharacters"> <link rel="alternate" type="application/x-wiki" title="Edit this page" href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit"> <link rel="apple-touch-icon" href="/static/apple-touch/wikipedia.png"> <link rel="icon" href="/static/favicon/wikipedia.ico"> <link rel="search" type="application/opensearchdescription+xml" 
href="/w/rest.php/v1/search" title="Wikipedia (en)"> <link rel="EditURI" type="application/rsd+xml" href="//en.wikipedia.org/w/api.php?action=rsd"> <link rel="canonical" href="https://en.wikipedia.org/wiki/Universal_Character_Set_characters#Noncharacters"> <link rel="license" href="https://creativecommons.org/licenses/by-sa/4.0/deed.en"> <link rel="alternate" type="application/atom+xml" title="Wikipedia Atom feed" href="/w/index.php?title=Special:RecentChanges&amp;feed=atom"> <!-- DNS prefetch hints: each href must start with "//" (or a full scheme). A bare hostname is resolved as a relative path on the current host, so the hint would never reach the intended origin. --><link rel="dns-prefetch" href="//meta.wikimedia.org"> <link rel="dns-prefetch" href="//login.wikimedia.org"> </head> <body class="skin--responsive skin-vector skin-vector-search-vue mediawiki ltr sitedir-ltr mw-hide-empty-elt ns-0 ns-subject mw-editable page-Universal_Character_Set_characters rootpage-Universal_Character_Set_characters skin-vector-2022 action-view"><a class="mw-jump-link" href="#bodyContent">Jump to content</a> <div class="vector-header-container"> <header class="vector-header mw-header"> <div class="vector-header-start"> <nav class="vector-main-menu-landmark" aria-label="Site"> <div id="vector-main-menu-dropdown" class="vector-dropdown vector-main-menu-dropdown vector-button-flush-left vector-button-flush-right" > <input type="checkbox" id="vector-main-menu-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-main-menu-dropdown" class="vector-dropdown-checkbox " aria-label="Main menu" > <label id="vector-main-menu-dropdown-label" for="vector-main-menu-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-menu mw-ui-icon-wikimedia-menu"></span> <span class="vector-dropdown-label-text">Main menu</span> </label> <div class="vector-dropdown-content"> <div id="vector-main-menu-unpinned-container" class="vector-unpinned-container"> <div id="vector-main-menu" class="vector-main-menu 
vector-pinnable-element"> <div class="vector-pinnable-header vector-main-menu-pinnable-header vector-pinnable-header-unpinned" data-feature-name="main-menu-pinned" data-pinnable-element-id="vector-main-menu" data-pinned-container-id="vector-main-menu-pinned-container" data-unpinned-container-id="vector-main-menu-unpinned-container" > <div class="vector-pinnable-header-label">Main menu</div> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-main-menu.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-main-menu.unpin">hide</button> </div> <div id="p-navigation" class="vector-menu mw-portlet mw-portlet-navigation" > <div class="vector-menu-heading"> Navigation </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="n-mainpage-description" class="mw-list-item"><a href="/wiki/Main_Page" title="Visit the main page [z]" accesskey="z"><span>Main page</span></a></li><li id="n-contents" class="mw-list-item"><a href="/wiki/Wikipedia:Contents" title="Guides to browsing Wikipedia"><span>Contents</span></a></li><li id="n-currentevents" class="mw-list-item"><a href="/wiki/Portal:Current_events" title="Articles related to current events"><span>Current events</span></a></li><li id="n-randompage" class="mw-list-item"><a href="/wiki/Special:Random" title="Visit a randomly selected article [x]" accesskey="x"><span>Random article</span></a></li><li id="n-aboutsite" class="mw-list-item"><a href="/wiki/Wikipedia:About" title="Learn about Wikipedia and how it works"><span>About Wikipedia</span></a></li><li id="n-contactpage" class="mw-list-item"><a href="//en.wikipedia.org/wiki/Wikipedia:Contact_us" title="How to contact Wikipedia"><span>Contact us</span></a></li> </ul> </div> </div> <div id="p-interaction" class="vector-menu mw-portlet mw-portlet-interaction" > <div 
class="vector-menu-heading"> Contribute </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="n-help" class="mw-list-item"><a href="/wiki/Help:Contents" title="Guidance on how to use and edit Wikipedia"><span>Help</span></a></li><li id="n-introduction" class="mw-list-item"><a href="/wiki/Help:Introduction" title="Learn how to edit Wikipedia"><span>Learn to edit</span></a></li><li id="n-portal" class="mw-list-item"><a href="/wiki/Wikipedia:Community_portal" title="The hub for editors"><span>Community portal</span></a></li><li id="n-recentchanges" class="mw-list-item"><a href="/wiki/Special:RecentChanges" title="A list of recent changes to Wikipedia [r]" accesskey="r"><span>Recent changes</span></a></li><li id="n-upload" class="mw-list-item"><a href="/wiki/Wikipedia:File_upload_wizard" title="Add images or other media for use on Wikipedia"><span>Upload file</span></a></li> </ul> </div> </div> </div> </div> </div> </div> </nav> <a href="/wiki/Main_Page" class="mw-logo"> <img class="mw-logo-icon" src="/static/images/icons/wikipedia.png" alt="" aria-hidden="true" height="50" width="50"> <span class="mw-logo-container skin-invert"> <img class="mw-logo-wordmark" alt="Wikipedia" src="/static/images/mobile/copyright/wikipedia-wordmark-en.svg" style="width: 7.5em; height: 1.125em;"> <img class="mw-logo-tagline" alt="The Free Encyclopedia" src="/static/images/mobile/copyright/wikipedia-tagline-en.svg" width="117" height="13" style="width: 7.3125em; height: 0.8125em;"> </span> </a> </div> <div class="vector-header-end"> <div id="p-search" role="search" class="vector-search-box-vue vector-search-box-collapses vector-search-box-show-thumbnail vector-search-box-auto-expand-width vector-search-box"> <a href="/wiki/Special:Search" class="cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only search-toggle" title="Search Wikipedia [f]" accesskey="f"><span class="vector-icon mw-ui-icon-search 
mw-ui-icon-wikimedia-search"></span> <span>Search</span> </a> <div class="vector-typeahead-search-container"> <div class="cdx-typeahead-search cdx-typeahead-search--show-thumbnail cdx-typeahead-search--auto-expand-width"> <form action="/w/index.php" id="searchform" class="cdx-search-input cdx-search-input--has-end-button"> <div id="simpleSearch" class="cdx-search-input__input-wrapper" data-search-loc="header-moved"> <div class="cdx-text-input cdx-text-input--has-start-icon"> <input class="cdx-text-input__input" type="search" name="search" placeholder="Search Wikipedia" aria-label="Search Wikipedia" autocapitalize="sentences" title="Search Wikipedia [f]" accesskey="f" id="searchInput" > <span class="cdx-text-input__icon cdx-text-input__start-icon"></span> </div> <input type="hidden" name="title" value="Special:Search"> </div> <button class="cdx-button cdx-search-input__end-button">Search</button> </form> </div> </div> </div> <nav class="vector-user-links vector-user-links-wide" aria-label="Personal tools"> <div class="vector-user-links-main"> <div id="p-vector-user-menu-preferences" class="vector-menu mw-portlet emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> <div id="p-vector-user-menu-userpage" class="vector-menu mw-portlet emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> <nav class="vector-appearance-landmark" aria-label="Appearance"> <div id="vector-appearance-dropdown" class="vector-dropdown " title="Change the appearance of the page&#039;s font size, width, and color" > <input type="checkbox" id="vector-appearance-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-appearance-dropdown" class="vector-dropdown-checkbox " aria-label="Appearance" > <label id="vector-appearance-dropdown-label" for="vector-appearance-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button 
cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-appearance mw-ui-icon-wikimedia-appearance"></span> <span class="vector-dropdown-label-text">Appearance</span> </label> <div class="vector-dropdown-content"> <div id="vector-appearance-unpinned-container" class="vector-unpinned-container"> </div> </div> </div> </nav> <div id="p-vector-user-menu-notifications" class="vector-menu mw-portlet emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> <div id="p-vector-user-menu-overflow" class="vector-menu mw-portlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="pt-sitesupport-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="https://donate.wikimedia.org/?wmf_source=donate&amp;wmf_medium=sidebar&amp;wmf_campaign=en.wikipedia.org&amp;uselang=en" class=""><span>Donate</span></a> </li> <li id="pt-createaccount-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="/w/index.php?title=Special:CreateAccount&amp;returnto=Universal+Character+Set+characters" title="You are encouraged to create an account and log in; however, it is not mandatory" class=""><span>Create account</span></a> </li> <li id="pt-login-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="/w/index.php?title=Special:UserLogin&amp;returnto=Universal+Character+Set+characters" title="You&#039;re encouraged to log in; however, it&#039;s not mandatory. 
[o]" accesskey="o" class=""><span>Log in</span></a> </li> </ul> </div> </div> </div> <div id="vector-user-links-dropdown" class="vector-dropdown vector-user-menu vector-button-flush-right vector-user-menu-logged-out" title="Log in and more options" > <input type="checkbox" id="vector-user-links-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-user-links-dropdown" class="vector-dropdown-checkbox " aria-label="Personal tools" > <label id="vector-user-links-dropdown-label" for="vector-user-links-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-ellipsis mw-ui-icon-wikimedia-ellipsis"></span> <span class="vector-dropdown-label-text">Personal tools</span> </label> <div class="vector-dropdown-content"> <div id="p-personal" class="vector-menu mw-portlet mw-portlet-personal user-links-collapsible-item" title="User menu" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="pt-sitesupport" class="user-links-collapsible-item mw-list-item"><a href="https://donate.wikimedia.org/?wmf_source=donate&amp;wmf_medium=sidebar&amp;wmf_campaign=en.wikipedia.org&amp;uselang=en"><span>Donate</span></a></li><li id="pt-createaccount" class="user-links-collapsible-item mw-list-item"><a href="/w/index.php?title=Special:CreateAccount&amp;returnto=Universal+Character+Set+characters" title="You are encouraged to create an account and log in; however, it is not mandatory"><span class="vector-icon mw-ui-icon-userAdd mw-ui-icon-wikimedia-userAdd"></span> <span>Create account</span></a></li><li id="pt-login" class="user-links-collapsible-item mw-list-item"><a href="/w/index.php?title=Special:UserLogin&amp;returnto=Universal+Character+Set+characters" title="You&#039;re encouraged to log in; however, it&#039;s not mandatory. 
[o]" accesskey="o"><span class="vector-icon mw-ui-icon-logIn mw-ui-icon-wikimedia-logIn"></span> <span>Log in</span></a></li> </ul> </div> </div> <div id="p-user-menu-anon-editor" class="vector-menu mw-portlet mw-portlet-user-menu-anon-editor" > <div class="vector-menu-heading"> Pages for logged out editors <a href="/wiki/Help:Introduction" aria-label="Learn more about editing"><span>learn more</span></a> </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="pt-anoncontribs" class="mw-list-item"><a href="/wiki/Special:MyContributions" title="A list of edits made from this IP address [y]" accesskey="y"><span>Contributions</span></a></li><li id="pt-anontalk" class="mw-list-item"><a href="/wiki/Special:MyTalk" title="Discussion about edits from this IP address [n]" accesskey="n"><span>Talk</span></a></li> </ul> </div> </div> </div> </div> </nav> </div> </header> </div> <div class="mw-page-container"> <div class="mw-page-container-inner"> <div class="vector-sitenotice-container"> <div id="siteNotice"><!-- CentralNotice --></div> </div> <div class="vector-column-start"> <div class="vector-main-menu-container"> <div id="mw-navigation"> <nav id="mw-panel" class="vector-main-menu-landmark" aria-label="Site"> <div id="vector-main-menu-pinned-container" class="vector-pinned-container"> </div> </nav> </div> </div> <div class="vector-sticky-pinned-container"> <nav id="mw-panel-toc" aria-label="Contents" data-event-name="ui.sidebar-toc" class="mw-table-of-contents-container vector-toc-landmark"> <div id="vector-toc-pinned-container" class="vector-pinned-container"> <div id="vector-toc" class="vector-toc vector-pinnable-element"> <div class="vector-pinnable-header vector-toc-pinnable-header vector-pinnable-header-pinned" data-feature-name="toc-pinned" data-pinnable-element-id="vector-toc" > <h2 class="vector-pinnable-header-label">Contents</h2> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" 
data-event-name="pinnable-header.vector-toc.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-toc.unpin">hide</button> </div> <ul class="vector-toc-contents" id="mw-panel-toc-list"> <li id="toc-mw-content-text" class="vector-toc-list-item vector-toc-level-1"> <a href="#" class="vector-toc-link"> <div class="vector-toc-text">(Top)</div> </a> </li> <li id="toc-Character_reference_overview" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Character_reference_overview"> <div class="vector-toc-text"> <span class="vector-toc-numb">1</span> <span>Character reference overview</span> </div> </a> <ul id="toc-Character_reference_overview-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Planes" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Planes"> <div class="vector-toc-text"> <span class="vector-toc-numb">2</span> <span>Planes</span> </div> </a> <ul id="toc-Planes-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Blocks" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Blocks"> <div class="vector-toc-text"> <span class="vector-toc-numb">3</span> <span>Blocks</span> </div> </a> <ul id="toc-Blocks-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Categories" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Categories"> <div class="vector-toc-text"> <span class="vector-toc-numb">4</span> <span>Categories</span> </div> </a> <ul id="toc-Categories-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Special-purpose_characters" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Special-purpose_characters"> <div class="vector-toc-text"> <span class="vector-toc-numb">5</span> <span>Special-purpose characters</span> </div> </a> <button 
aria-controls="toc-Special-purpose_characters-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle"> <span class="vector-icon mw-ui-icon-wikimedia-expand"></span> <span>Toggle Special-purpose characters subsection</span> </button> <ul id="toc-Special-purpose_characters-sublist" class="vector-toc-list"> <li id="toc-Byte_order_mark" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Byte_order_mark"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.1</span> <span>Byte order mark</span> </div> </a> <ul id="toc-Byte_order_mark-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Mathematical_invisibles" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Mathematical_invisibles"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.2</span> <span>Mathematical invisibles</span> </div> </a> <ul id="toc-Mathematical_invisibles-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Fraction_slash" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Fraction_slash"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.3</span> <span>Fraction slash</span> </div> </a> <ul id="toc-Fraction_slash-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Bidirectional_neutral_formatting" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Bidirectional_neutral_formatting"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.4</span> <span>Bidirectional neutral formatting</span> </div> </a> <ul id="toc-Bidirectional_neutral_formatting-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Bidirectional_general_formatting" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Bidirectional_general_formatting"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.5</span> <span>Bidirectional general formatting</span> </div> </a> <ul 
id="toc-Bidirectional_general_formatting-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Interlinear_annotation_characters" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Interlinear_annotation_characters"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.6</span> <span>Interlinear annotation characters</span> </div> </a> <ul id="toc-Interlinear_annotation_characters-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Script-specific" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Script-specific"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.7</span> <span>Script-specific</span> </div> </a> <ul id="toc-Script-specific-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Others" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Others"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.8</span> <span>Others</span> </div> </a> <ul id="toc-Others-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Characters_vs._code_points" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Characters_vs._code_points"> <div class="vector-toc-text"> <span class="vector-toc-numb">6</span> <span>Characters vs. 
code points</span> </div> </a> <ul id="toc-Characters_vs._code_points-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Whitespace,_joiners,_and_separators" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Whitespace,_joiners,_and_separators"> <div class="vector-toc-text"> <span class="vector-toc-numb">7</span> <span>Whitespace, joiners, and separators</span> </div> </a> <button aria-controls="toc-Whitespace,_joiners,_and_separators-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle"> <span class="vector-icon mw-ui-icon-wikimedia-expand"></span> <span>Toggle Whitespace, joiners, and separators subsection</span> </button> <ul id="toc-Whitespace,_joiners,_and_separators-sublist" class="vector-toc-list"> <li id="toc-Grapheme_joiners_and_non-joiners" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Grapheme_joiners_and_non-joiners"> <div class="vector-toc-text"> <span class="vector-toc-numb">7.1</span> <span>Grapheme joiners and non-joiners</span> </div> </a> <ul id="toc-Grapheme_joiners_and_non-joiners-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Word_joiners_and_separators" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Word_joiners_and_separators"> <div class="vector-toc-text"> <span class="vector-toc-numb">7.2</span> <span>Word joiners and separators</span> </div> </a> <ul id="toc-Word_joiners_and_separators-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Other_separators" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Other_separators"> <div class="vector-toc-text"> <span class="vector-toc-numb">7.3</span> <span>Other separators</span> </div> </a> <ul id="toc-Other_separators-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Spaces" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Spaces"> <div 
class="vector-toc-text"> <span class="vector-toc-numb">7.4</span> <span>Spaces</span> </div> </a> <ul id="toc-Spaces-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Line-break_control_characters" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Line-break_control_characters"> <div class="vector-toc-text"> <span class="vector-toc-numb">7.5</span> <span>Line-break control characters</span> </div> </a> <ul id="toc-Line-break_control_characters-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Types_of_code_point" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Types_of_code_point"> <div class="vector-toc-text"> <span class="vector-toc-numb">8</span> <span>Types of code point</span> </div> </a> <button aria-controls="toc-Types_of_code_point-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle"> <span class="vector-icon mw-ui-icon-wikimedia-expand"></span> <span>Toggle Types of code point subsection</span> </button> <ul id="toc-Types_of_code_point-sublist" class="vector-toc-list"> <li id="toc-Assigned_characters" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Assigned_characters"> <div class="vector-toc-text"> <span class="vector-toc-numb">8.1</span> <span>Assigned characters</span> </div> </a> <ul id="toc-Assigned_characters-sublist" class="vector-toc-list"> <li id="toc-Private-use_characters" class="vector-toc-list-item vector-toc-level-3"> <a class="vector-toc-link" href="#Private-use_characters"> <div class="vector-toc-text"> <span class="vector-toc-numb">8.1.1</span> <span>Private-use characters</span> </div> </a> <ul id="toc-Private-use_characters-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Surrogates" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Surrogates"> <div class="vector-toc-text"> <span class="vector-toc-numb">8.2</span> 
<span>Surrogates</span> </div> </a> <ul id="toc-Surrogates-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Noncharacters" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Noncharacters"> <div class="vector-toc-text"> <span class="vector-toc-numb">8.3</span> <span>Noncharacters</span> </div> </a> <ul id="toc-Noncharacters-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Reserved_code_points" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Reserved_code_points"> <div class="vector-toc-text"> <span class="vector-toc-numb">8.4</span> <span>Reserved code points</span> </div> </a> <ul id="toc-Reserved_code_points-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Characters,_grapheme_clusters_and_glyphs" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Characters,_grapheme_clusters_and_glyphs"> <div class="vector-toc-text"> <span class="vector-toc-numb">9</span> <span>Characters, grapheme clusters and glyphs</span> </div> </a> <button aria-controls="toc-Characters,_grapheme_clusters_and_glyphs-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle"> <span class="vector-icon mw-ui-icon-wikimedia-expand"></span> <span>Toggle Characters, grapheme clusters and glyphs subsection</span> </button> <ul id="toc-Characters,_grapheme_clusters_and_glyphs-sublist" class="vector-toc-list"> <li id="toc-Compatibility_characters" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Compatibility_characters"> <div class="vector-toc-text"> <span class="vector-toc-numb">9.1</span> <span>Compatibility characters</span> </div> </a> <ul id="toc-Compatibility_characters-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Character_properties" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#Character_properties"> <div 
class="vector-toc-text"> <span class="vector-toc-numb">10</span> <span>Character properties</span> </div> </a> <ul id="toc-Character_properties-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-See_also" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#See_also"> <div class="vector-toc-text"> <span class="vector-toc-numb">11</span> <span>See also</span> </div> </a> <ul id="toc-See_also-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-References" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#References"> <div class="vector-toc-text"> <span class="vector-toc-numb">12</span> <span>References</span> </div> </a> <ul id="toc-References-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-External_links" class="vector-toc-list-item vector-toc-level-1"> <a class="vector-toc-link" href="#External_links"> <div class="vector-toc-text"> <span class="vector-toc-numb">13</span> <span>External links</span> </div> </a> <ul id="toc-External_links-sublist" class="vector-toc-list"> </ul> </li> </ul> </div> </div> </nav> </div> </div> <div class="mw-content-container"> <main id="content" class="mw-body"> <header class="mw-body-header vector-page-titlebar"> <nav aria-label="Contents" class="vector-toc-landmark"> <div id="vector-page-titlebar-toc" class="vector-dropdown vector-page-titlebar-toc vector-button-flush-left" > <input type="checkbox" id="vector-page-titlebar-toc-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-page-titlebar-toc" class="vector-dropdown-checkbox " aria-label="Toggle the table of contents" > <label id="vector-page-titlebar-toc-label" for="vector-page-titlebar-toc-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-listBullet mw-ui-icon-wikimedia-listBullet"></span> <span 
class="vector-dropdown-label-text">Toggle the table of contents</span> </label> <div class="vector-dropdown-content"> <div id="vector-page-titlebar-toc-unpinned-container" class="vector-unpinned-container"> </div> </div> </div> </nav> <h1 id="firstHeading" class="firstHeading mw-first-heading"><span class="mw-page-title-main">Universal Character Set characters</span></h1> <div id="p-lang-btn" class="vector-dropdown mw-portlet mw-portlet-lang" > <input type="checkbox" id="p-lang-btn-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-p-lang-btn" class="vector-dropdown-checkbox mw-interlanguage-selector" aria-label="Go to an article in another language. Available in 5 languages" > <label id="p-lang-btn-label" for="p-lang-btn-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--action-progressive mw-portlet-lang-heading-5" aria-hidden="true" ><span class="vector-icon mw-ui-icon-language-progressive mw-ui-icon-wikimedia-language-progressive"></span> <span class="vector-dropdown-label-text">5 languages</span> </label> <div class="vector-dropdown-content"> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li class="interlanguage-link interwiki-eo mw-list-item"><a href="https://eo.wikipedia.org/wiki/Unikoda_alfabeto" title="Unikoda alfabeto – Esperanto" lang="eo" hreflang="eo" data-title="Unikoda alfabeto" data-language-autonym="Esperanto" data-language-local-name="Esperanto" class="interlanguage-link-target"><span>Esperanto</span></a></li><li class="interlanguage-link interwiki-eu mw-list-item"><a href="https://eu.wikipedia.org/wiki/Zerrenda:Unicode_karaktereak" title="Zerrenda:Unicode karaktereak – Basque" lang="eu" hreflang="eu" data-title="Zerrenda:Unicode karaktereak" data-language-autonym="Euskara" data-language-local-name="Basque" class="interlanguage-link-target"><span>Euskara</span></a></li><li class="interlanguage-link 
interwiki-ilo mw-list-item"><a href="https://ilo.wikipedia.org/wiki/Dagiti_karakter_ti_Universal_Character_Set" title="Dagiti karakter ti Universal Character Set – Iloko" lang="ilo" hreflang="ilo" data-title="Dagiti karakter ti Universal Character Set" data-language-autonym="Ilokano" data-language-local-name="Iloko" class="interlanguage-link-target"><span>Ilokano</span></a></li><li class="interlanguage-link interwiki-nl mw-list-item"><a href="https://nl.wikipedia.org/wiki/Lijst_van_Unicode-subbereiken" title="Lijst van Unicode-subbereiken – Dutch" lang="nl" hreflang="nl" data-title="Lijst van Unicode-subbereiken" data-language-autonym="Nederlands" data-language-local-name="Dutch" class="interlanguage-link-target"><span>Nederlands</span></a></li><li class="interlanguage-link interwiki-ja mw-list-item"><a href="https://ja.wikipedia.org/wiki/Unicode%E6%96%87%E5%AD%97%E3%81%AE%E3%83%9E%E3%83%83%E3%83%94%E3%83%B3%E3%82%B0" title="Unicode文字のマッピング – Japanese" lang="ja" hreflang="ja" data-title="Unicode文字のマッピング" data-language-autonym="日本語" data-language-local-name="Japanese" class="interlanguage-link-target"><span>日本語</span></a></li> </ul> <div class="after-portlet after-portlet-lang"><span class="wb-langlinks-edit wb-langlinks-link"><a href="https://www.wikidata.org/wiki/Special:EntityPage/Q897819#sitelinks-wikipedia" title="Edit interlanguage links" class="wbc-editpage">Edit links</a></span></div> </div> </div> </div> </header> <div class="vector-page-toolbar"> <div class="vector-page-toolbar-container"> <div id="left-navigation"> <nav aria-label="Namespaces"> <div id="p-associated-pages" class="vector-menu vector-menu-tabs mw-portlet mw-portlet-associated-pages" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="ca-nstab-main" class="selected vector-tab-noicon mw-list-item"><a href="/wiki/Universal_Character_Set_characters" title="View the content page [c]" accesskey="c"><span>Article</span></a></li><li id="ca-talk" 
class="vector-tab-noicon mw-list-item"><a href="/wiki/Talk:Universal_Character_Set_characters" rel="discussion" title="Discuss improvements to the content page [t]" accesskey="t"><span>Talk</span></a></li> </ul> </div> </div> <div id="vector-variants-dropdown" class="vector-dropdown emptyPortlet" > <input type="checkbox" id="vector-variants-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-variants-dropdown" class="vector-dropdown-checkbox " aria-label="Change language variant" > <label id="vector-variants-dropdown-label" for="vector-variants-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet" aria-hidden="true" ><span class="vector-dropdown-label-text">English</span> </label> <div class="vector-dropdown-content"> <div id="p-variants" class="vector-menu mw-portlet mw-portlet-variants emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> </div> </div> </nav> </div> <div id="right-navigation" class="vector-collapsible"> <nav aria-label="Views"> <div id="p-views" class="vector-menu vector-menu-tabs mw-portlet mw-portlet-views" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="ca-view" class="selected vector-tab-noicon mw-list-item"><a href="/wiki/Universal_Character_Set_characters"><span>Read</span></a></li><li id="ca-edit" class="vector-tab-noicon mw-list-item"><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit" title="Edit this page [e]" accesskey="e"><span>Edit</span></a></li><li id="ca-history" class="vector-tab-noicon mw-list-item"><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=history" title="Past revisions of this page [h]" accesskey="h"><span>View history</span></a></li> </ul> </div> </div> </nav> <nav class="vector-page-tools-landmark" aria-label="Page tools"> <div 
id="vector-page-tools-dropdown" class="vector-dropdown vector-page-tools-dropdown" > <input type="checkbox" id="vector-page-tools-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-page-tools-dropdown" class="vector-dropdown-checkbox " aria-label="Tools" > <label id="vector-page-tools-dropdown-label" for="vector-page-tools-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet" aria-hidden="true" ><span class="vector-dropdown-label-text">Tools</span> </label> <div class="vector-dropdown-content"> <div id="vector-page-tools-unpinned-container" class="vector-unpinned-container"> <div id="vector-page-tools" class="vector-page-tools vector-pinnable-element"> <div class="vector-pinnable-header vector-page-tools-pinnable-header vector-pinnable-header-unpinned" data-feature-name="page-tools-pinned" data-pinnable-element-id="vector-page-tools" data-pinned-container-id="vector-page-tools-pinned-container" data-unpinned-container-id="vector-page-tools-unpinned-container" > <div class="vector-pinnable-header-label">Tools</div> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-page-tools.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-page-tools.unpin">hide</button> </div> <div id="p-cactions" class="vector-menu mw-portlet mw-portlet-cactions emptyPortlet vector-has-collapsible-items" title="More options" > <div class="vector-menu-heading"> Actions </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="ca-more-view" class="selected vector-more-collapsible-item mw-list-item"><a href="/wiki/Universal_Character_Set_characters"><span>Read</span></a></li><li id="ca-more-edit" class="vector-more-collapsible-item mw-list-item"><a 
href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit" title="Edit this page [e]" accesskey="e"><span>Edit</span></a></li><li id="ca-more-history" class="vector-more-collapsible-item mw-list-item"><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=history"><span>View history</span></a></li> </ul> </div> </div> <div id="p-tb" class="vector-menu mw-portlet mw-portlet-tb" > <div class="vector-menu-heading"> General </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="t-whatlinkshere" class="mw-list-item"><a href="/wiki/Special:WhatLinksHere/Universal_Character_Set_characters" title="List of all English Wikipedia pages containing links to this page [j]" accesskey="j"><span>What links here</span></a></li><li id="t-recentchangeslinked" class="mw-list-item"><a href="/wiki/Special:RecentChangesLinked/Universal_Character_Set_characters" rel="nofollow" title="Recent changes in pages linked from this page [k]" accesskey="k"><span>Related changes</span></a></li><li id="t-upload" class="mw-list-item"><a href="/wiki/Wikipedia:File_Upload_Wizard" title="Upload files [u]" accesskey="u"><span>Upload file</span></a></li><li id="t-specialpages" class="mw-list-item"><a href="/wiki/Special:SpecialPages" title="A list of all special pages [q]" accesskey="q"><span>Special pages</span></a></li><li id="t-permalink" class="mw-list-item"><a href="/w/index.php?title=Universal_Character_Set_characters&amp;oldid=1255067307" title="Permanent link to this revision of this page"><span>Permanent link</span></a></li><li id="t-info" class="mw-list-item"><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=info" title="More information about this page"><span>Page information</span></a></li><li id="t-cite" class="mw-list-item"><a href="/w/index.php?title=Special:CiteThisPage&amp;page=Universal_Character_Set_characters&amp;id=1255067307&amp;wpFormIdentifier=titleform" title="Information on how to cite 
this page"><span>Cite this page</span></a></li><li id="t-urlshortener" class="mw-list-item"><a href="/w/index.php?title=Special:UrlShortener&amp;url=https%3A%2F%2Fen.wikipedia.org%2Fwiki%2FUniversal_Character_Set_characters%23Noncharacters"><span>Get shortened URL</span></a></li><li id="t-urlshortener-qrcode" class="mw-list-item"><a href="/w/index.php?title=Special:QrCode&amp;url=https%3A%2F%2Fen.wikipedia.org%2Fwiki%2FUniversal_Character_Set_characters%23Noncharacters"><span>Download QR code</span></a></li> </ul> </div> </div> <div id="p-coll-print_export" class="vector-menu mw-portlet mw-portlet-coll-print_export" > <div class="vector-menu-heading"> Print/export </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="coll-download-as-rl" class="mw-list-item"><a href="/w/index.php?title=Special:DownloadAsPdf&amp;page=Universal_Character_Set_characters&amp;action=show-download-screen" title="Download this page as a PDF file"><span>Download as PDF</span></a></li><li id="t-print" class="mw-list-item"><a href="/w/index.php?title=Universal_Character_Set_characters&amp;printable=yes" title="Printable version of this page [p]" accesskey="p"><span>Printable version</span></a></li> </ul> </div> </div> <div id="p-wikibase-otherprojects" class="vector-menu mw-portlet mw-portlet-wikibase-otherprojects" > <div class="vector-menu-heading"> In other projects </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li class="wb-otherproject-link wb-otherproject-commons mw-list-item"><a href="https://commons.wikimedia.org/wiki/Category:Unicode" hreflang="en"><span>Wikimedia Commons</span></a></li><li id="t-wikibase" class="wb-otherproject-link wb-otherproject-wikibase-dataitem mw-list-item"><a href="https://www.wikidata.org/wiki/Special:EntityPage/Q897819" title="Structured data on this page hosted by Wikidata [g]" accesskey="g"><span>Wikidata item</span></a></li> </ul> </div> </div> </div> </div> </div> 
</div> </nav> </div> </div> </div> <div class="vector-column-end"> <div class="vector-sticky-pinned-container"> <nav class="vector-page-tools-landmark" aria-label="Page tools"> <div id="vector-page-tools-pinned-container" class="vector-pinned-container"> </div> </nav> <nav class="vector-appearance-landmark" aria-label="Appearance"> <div id="vector-appearance-pinned-container" class="vector-pinned-container"> <div id="vector-appearance" class="vector-appearance vector-pinnable-element"> <div class="vector-pinnable-header vector-appearance-pinnable-header vector-pinnable-header-pinned" data-feature-name="appearance-pinned" data-pinnable-element-id="vector-appearance" data-pinned-container-id="vector-appearance-pinned-container" data-unpinned-container-id="vector-appearance-unpinned-container" > <div class="vector-pinnable-header-label">Appearance</div> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-appearance.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-appearance.unpin">hide</button> </div> </div> </div> </nav> </div> </div> <div id="bodyContent" class="vector-body" aria-labelledby="firstHeading" data-mw-ve-target-container> <div class="vector-body-before-content"> <div class="mw-indicators"> </div> <div id="siteSub" class="noprint">From Wikipedia, the free encyclopedia</div> </div> <div id="contentSub"><div id="mw-content-subtitle"><span class="mw-redirectedfrom">(Redirected from <a href="/w/index.php?title=%F4%8F%BF%BF&amp;redirect=no" class="mw-redirect" title="􏿿">􏿿</a>)</span></div></div> <div id="mw-content-text" class="mw-body-content"><div class="mw-content-ltr mw-parser-output" lang="en" dir="ltr"><style data-mw-deduplicate="TemplateStyles:r1236090951">.mw-parser-output .hatnote{font-style:italic}.mw-parser-output 
div.hatnote{padding-left:1.6em;margin-bottom:0.5em}.mw-parser-output .hatnote i{font-style:normal}.mw-parser-output .hatnote+link+.hatnote{margin-top:-0.5em}@media print{body.ns-0 .mw-parser-output .hatnote{display:none!important}}</style><div role="note" class="hatnote navigation-not-searchable">"Unicode characters" redirects here. For a complete list of UCS characters, see <a href="/wiki/List_of_Unicode_characters" title="List of Unicode characters">List of Unicode characters</a>.</div> <div class="shortdescription nomobile noexcerpt noprint searchaux" style="display:none">Complete list of the characters available on most computers</div> <style data-mw-deduplicate="TemplateStyles:r1235681985">.mw-parser-output .side-box{margin:4px 0;box-sizing:border-box;border:1px solid #aaa;font-size:88%;line-height:1.25em;background-color:var(--background-color-interactive-subtle,#f8f9fa);display:flow-root}.mw-parser-output .side-box-abovebelow,.mw-parser-output .side-box-text{padding:0.25em 0.9em}.mw-parser-output .side-box-image{padding:2px 0 2px 0.9em;text-align:center}.mw-parser-output .side-box-imageright{padding:2px 0.9em 2px 0;text-align:center}@media(min-width:500px){.mw-parser-output .side-box-flex{display:flex;align-items:center}.mw-parser-output .side-box-text{flex:1;min-width:0}}@media(min-width:720px){.mw-parser-output .side-box{width:238px}.mw-parser-output .side-box-right{clear:right;float:right;margin-left:1em}.mw-parser-output .side-box-left{margin-right:1em}}</style><style data-mw-deduplicate="TemplateStyles:r1092331828">@media(min-width:720px){.mw-parser-output .contains-special-characters{width:22em}}</style><div class="side-box metadata side-box-right contains-special-characters noprint selfref"><style data-mw-deduplicate="TemplateStyles:r1126788409">.mw-parser-output .plainlist ol,.mw-parser-output .plainlist ul{line-height:inherit;list-style:none;margin:0;padding:0}.mw-parser-output .plainlist ol li,.mw-parser-output .plainlist ul 
li{margin-bottom:0}</style> <div class="side-box-flex"> <div class="side-box-text plainlist"><b>This article contains <a href="/wiki/Help:Special_characters" title="Help:Special characters">special characters</a>.</b> Without proper <a href="/wiki/Help:Special_characters" title="Help:Special characters">rendering support</a>, you may see <a href="/wiki/Specials_(Unicode_block)#Replacement_character" title="Specials (Unicode block)">question marks, boxes, or other symbols</a>.</div></div> </div> <figure class="mw-halign-right" typeof="mw:File"><a href="/wiki/File:New_Unicode_logo.svg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/0/09/New_Unicode_logo.svg/150px-New_Unicode_logo.svg.png" decoding="async" width="150" height="180" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/0/09/New_Unicode_logo.svg/225px-New_Unicode_logo.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/0/09/New_Unicode_logo.svg/300px-New_Unicode_logo.svg.png 2x" data-file-width="512" data-file-height="614" /></a><figcaption></figcaption></figure> <figure typeof="mw:File/Thumb"><a href="/wiki/File:Writing_systems_worldwide.svg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/6/63/Writing_systems_worldwide.svg/500px-Writing_systems_worldwide.svg.png" decoding="async" width="500" height="254" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/6/63/Writing_systems_worldwide.svg/750px-Writing_systems_worldwide.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/6/63/Writing_systems_worldwide.svg/1000px-Writing_systems_worldwide.svg.png 2x" data-file-width="2754" data-file-height="1398" /></a><figcaption><div class="navbox-styles"><style data-mw-deduplicate="TemplateStyles:r1129693374">.mw-parser-output .hlist dl,.mw-parser-output .hlist ol,.mw-parser-output .hlist ul{margin:0;padding:0}.mw-parser-output .hlist dd,.mw-parser-output .hlist 
dt,.mw-parser-output .hlist li{margin:0;display:inline}.mw-parser-output .hlist.inline,.mw-parser-output .hlist.inline dl,.mw-parser-output .hlist.inline ol,.mw-parser-output .hlist.inline ul,.mw-parser-output .hlist dl dl,.mw-parser-output .hlist dl ol,.mw-parser-output .hlist dl ul,.mw-parser-output .hlist ol dl,.mw-parser-output .hlist ol ol,.mw-parser-output .hlist ol ul,.mw-parser-output .hlist ul dl,.mw-parser-output .hlist ul ol,.mw-parser-output .hlist ul ul{display:inline}.mw-parser-output .hlist .mw-empty-li{display:none}.mw-parser-output .hlist dt::after{content:": "}.mw-parser-output .hlist dd::after,.mw-parser-output .hlist li::after{content:" · ";font-weight:bold}.mw-parser-output .hlist dd:last-child::after,.mw-parser-output .hlist dt:last-child::after,.mw-parser-output .hlist li:last-child::after{content:none}.mw-parser-output .hlist dd dd:first-child::before,.mw-parser-output .hlist dd dt:first-child::before,.mw-parser-output .hlist dd li:first-child::before,.mw-parser-output .hlist dt dd:first-child::before,.mw-parser-output .hlist dt dt:first-child::before,.mw-parser-output .hlist dt li:first-child::before,.mw-parser-output .hlist li dd:first-child::before,.mw-parser-output .hlist li dt:first-child::before,.mw-parser-output .hlist li li:first-child::before{content:" (";font-weight:normal}.mw-parser-output .hlist dd dd:last-child::after,.mw-parser-output .hlist dd dt:last-child::after,.mw-parser-output .hlist dd li:last-child::after,.mw-parser-output .hlist dt dd:last-child::after,.mw-parser-output .hlist dt dt:last-child::after,.mw-parser-output .hlist dt li:last-child::after,.mw-parser-output .hlist li dd:last-child::after,.mw-parser-output .hlist li dt:last-child::after,.mw-parser-output .hlist li li:last-child::after{content:")";font-weight:normal}.mw-parser-output .hlist ol{counter-reset:listitem}.mw-parser-output .hlist ol>li{counter-increment:listitem}.mw-parser-output .hlist ol>li::before{content:" "counter(listitem)"\a0 
"}.mw-parser-output .hlist dd ol>li:first-child::before,.mw-parser-output .hlist dt ol>li:first-child::before,.mw-parser-output .hlist li ol>li:first-child::before{content:" ("counter(listitem)"\a0 "}</style><style data-mw-deduplicate="TemplateStyles:r1236075235">.mw-parser-output .navbox{box-sizing:border-box;border:1px solid #a2a9b1;width:100%;clear:both;font-size:88%;text-align:center;padding:1px;margin:1em auto 0}.mw-parser-output .navbox .navbox{margin-top:0}.mw-parser-output .navbox+.navbox,.mw-parser-output .navbox+.navbox-styles+.navbox{margin-top:-1px}.mw-parser-output .navbox-inner,.mw-parser-output .navbox-subgroup{width:100%}.mw-parser-output .navbox-group,.mw-parser-output .navbox-title,.mw-parser-output .navbox-abovebelow{padding:0.25em 1em;line-height:1.5em;text-align:center}.mw-parser-output .navbox-group{white-space:nowrap;text-align:right}.mw-parser-output .navbox,.mw-parser-output .navbox-subgroup{background-color:#fdfdfd}.mw-parser-output .navbox-list{line-height:1.5em;border-color:#fdfdfd}.mw-parser-output .navbox-list-with-group{text-align:left;border-left-width:2px;border-left-style:solid}.mw-parser-output tr+tr>.navbox-abovebelow,.mw-parser-output tr+tr>.navbox-group,.mw-parser-output tr+tr>.navbox-image,.mw-parser-output tr+tr>.navbox-list{border-top:2px solid #fdfdfd}.mw-parser-output .navbox-title{background-color:#ccf}.mw-parser-output .navbox-abovebelow,.mw-parser-output .navbox-group,.mw-parser-output .navbox-subgroup .navbox-title{background-color:#ddf}.mw-parser-output .navbox-subgroup .navbox-group,.mw-parser-output .navbox-subgroup .navbox-abovebelow{background-color:#e6e6ff}.mw-parser-output .navbox-even{background-color:#f7f7f7}.mw-parser-output .navbox-odd{background-color:transparent}.mw-parser-output .navbox .hlist td dl,.mw-parser-output .navbox .hlist td ol,.mw-parser-output .navbox .hlist td ul,.mw-parser-output .navbox td.hlist dl,.mw-parser-output .navbox td.hlist ol,.mw-parser-output .navbox td.hlist ul{padding:0.125em 
0}.mw-parser-output .navbox .navbar{display:block;font-size:100%}.mw-parser-output .navbox-title .navbar{float:left;text-align:left;margin-right:0.5em}body.skin--responsive .mw-parser-output .navbox-image img{max-width:none!important}@media print{body.ns-0 .mw-parser-output .navbox{display:none!important}}</style><style data-mw-deduplicate="TemplateStyles:r981673959">.mw-parser-output .legend{page-break-inside:avoid;break-inside:avoid-column}.mw-parser-output .legend-color{display:inline-block;min-width:1.25em;height:1.25em;line-height:1.25;margin:1px 0;text-align:center;border:1px solid black;background-color:transparent;color:black}.mw-parser-output .legend-text{}</style><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link 
rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r981673959"></div><div role="navigation" aria-labelledby="Index_of_predominant_national_and_selected_regional_or_minority_scripts"><table class="nowraplinks navbox-subgroup" style="border-spacing:0;font-size:90%;"><tbody><tr><td class="navbox-abovebelow" colspan="2" style="background:transparent;font-size:110%;padding:0;font-weight:bold;"><div id="Index_of_predominant_national_and_selected_regional_or_minority_scripts">Index of predominant national and selected regional or minority scripts</div></td></tr><tr><td colspan="2" class="navbox-list navbox-odd" style="width:100%;padding:0;background:transparent;color:inherit;"><div style="padding:0px"><table class="navbox-columns-table" style="border-spacing: 0px; text-align:left;width:100%;"><tbody><tr><td class="navbox-abovebelow" style="font-weight:bold;padding:0.15em 0.15em 0.25em;font-weight:normal;"><a href="/wiki/Alphabet" title="Alphabet">Alphabetic</a></td><td class="navbox-abovebelow" style="border-left:2px solid #fdfdfd;font-weight:bold;padding:0.15em 0.15em 0.25em;font-weight:normal;"><div style="display: inline-block; line-height: 1.2em; padding: .1em 0;"><a href="/wiki/Logogram" title="Logogram">[L]ogographic</a><br />and <a href="/wiki/Syllabary" title="Syllabary">[S]yllabic</a></div></td><td class="navbox-abovebelow" style="border-left:2px solid #fdfdfd;font-weight:bold;padding:0.15em 0.15em 0.25em;font-weight:normal;"><a href="/wiki/Abjad" title="Abjad">Abjad</a></td><td class="navbox-abovebelow" style="border-left:2px solid #fdfdfd;font-weight:bold;padding:0.15em 0.15em 0.25em;font-weight:normal;"><a href="/wiki/Abugida" title="Abugida">Abugida</a></td></tr><tr style="vertical-align:top"><td class="navbox-list" style="padding:0px;white-space:nowrap;width:10em;"><div> <div 
class="legend"><span class="legend-color mw-no-invert" style="background-color:#A9A9C0; color:black;">&#160;</span>&#160;<a href="/wiki/Latin_script_in_Unicode" title="Latin script in Unicode">Latin</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#008899; color:black;">&#160;</span>&#160;<a href="/wiki/Cyrillic_script_in_Unicode" title="Cyrillic script in Unicode">Cyrillic</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#2175D8; color:black;">&#160;</span>&#160;<a href="/wiki/Greek_and_Coptic" title="Greek and Coptic">Greek</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#003A66; color:white;">&#160;</span>&#160;<a href="/wiki/Armenian_(Unicode_block)" title="Armenian (Unicode block)">Armenian</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#0000FF; color:white;">&#160;</span>&#160;<a href="/wiki/Georgian_(Unicode_block)" title="Georgian (Unicode block)">Georgian</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#00FFFF; color:black;">&#160;</span>&#160;<a href="/wiki/Mongolian_(Unicode_block)" title="Mongolian (Unicode block)">Mongolian</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#0090DA; color:black;">&#160;</span>&#160;<a href="/wiki/Tifinagh_(Unicode_block)" title="Tifinagh (Unicode block)">Neo-Tifinagh</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#97CBFF; color:black;">&#160;</span>&#160;<a href="/wiki/Osage_(Unicode_block)" title="Osage (Unicode block)">Osage</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#FF69B4; color:black;">&#160;</span>&#160;<a href="/wiki/Korean_language_and_computers#Hangul_in_Unicode" title="Korean language and computers">Hangul</a><sup>a</sup></div> </div></td><td 
class="navbox-list" style="border-left:2px solid #fdfdfd;padding:0px;white-space:nowrap;width:10em;"><div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#EE1C25; color:black;">&#160;</span>&#160;<a href="/wiki/CJK_Unified_Ideographs" title="CJK Unified Ideographs">Hanzi</a> <span style="font-size:85%;">[L]</span></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#C71585; color:white;">&#160;</span>&#160;<a href="/wiki/Kana#In_Unicode" title="Kana">Kana</a> <span style="font-size:85%;">[S]</span>&#160;/&#32;<a href="/wiki/CJK_Unified_Ideographs" title="CJK Unified Ideographs">Kanji</a> <span style="font-size:85%;">[L]</span><span class="nowrap">&#160;&#160;</span></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#FF69B4; color:black;">&#160;</span>&#160;<a href="/wiki/CJK_Unified_Ideographs" title="CJK Unified Ideographs">Hanja</a><sup>b</sup> <span style="font-size:85%;">[L]</span></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#8B008B; color:white;">&#160;</span>&#160;<a href="/wiki/Cherokee_(Unicode_block)" title="Cherokee (Unicode block)">Cherokee</a> <span style="font-size:85%;">[S]</span></div> </div></td><td class="navbox-list" style="border-left:2px solid #fdfdfd;padding:0px;white-space:nowrap;width:10em;"><div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#006624; color:white;">&#160;</span>&#160;<a href="/wiki/Arabic_(Unicode_block)" title="Arabic (Unicode block)">Arabic</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#38B800; color:black;">&#160;</span>&#160;<a href="/wiki/Hebrew_(Unicode_block)" title="Hebrew (Unicode block)">Hebrew</a></div> </div></td><td class="navbox-list" style="border-left:2px solid #fdfdfd;padding:0px;white-space:nowrap;width:10em;"><div> <div class="legend"><span class="legend-color 
mw-no-invert" style="background-color:#F4C430; color:black;">&#160;</span>&#160;<a href="/wiki/Brahmic_scripts#Unicode_of_Brahmic_scripts" title="Brahmic scripts">North Indic</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#FF671F; color:black;">&#160;</span>&#160;<a href="/wiki/Brahmic_scripts#Unicode_of_Brahmic_scripts" title="Brahmic scripts">South Indic</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#A0522D ; color:white;">&#160;</span>&#160;<a href="/wiki/Ethiopic_(Unicode_block)" title="Ethiopic (Unicode block)">Ethiopic</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#B8860B; color:black;">&#160;</span>&#160;<a href="/wiki/Thaana_(Unicode_block)" title="Thaana (Unicode block)">Thaana</a></div> <div class="legend"><span class="legend-color mw-no-invert" style="background-color:#F0E68C; color:black;">&#160;</span>&#160;<a href="/wiki/Unified_Canadian_Aboriginal_Syllabics_(Unicode_block)" class="mw-redirect" title="Unified Canadian Aboriginal Syllabics (Unicode block)">Canadian syllabics</a></div> </div></td></tr></tbody></table></div></td></tr><tr><td class="navbox-abovebelow" colspan="2"><div><span class="nowrap"><sup>a</sup> <a href="/wiki/Featural_alphabet" class="mw-redirect" title="Featural alphabet">Featural-alphabetic</a>.<span class="nowrap">&#160;&#160;&#160;</span><sup>b</sup> Limited.</span></div></td></tr></tbody></table></div></figcaption></figure> <p>The <a href="/wiki/Unicode_Consortium" title="Unicode Consortium">Unicode Consortium</a> and the <a href="/wiki/ISO/IEC_JTC_1/SC_2" title="ISO/IEC JTC 1/SC 2">ISO/IEC JTC 1/SC 2</a>/<a href="/wiki/Working_group" title="Working group">WG</a> 2 jointly collaborate on the list of the <b>characters in the Universal Coded Character Set</b>. 
The Universal Coded Character Set, most commonly called the <a href="/wiki/Universal_Character_Set" class="mw-redirect" title="Universal Character Set">Universal Character Set</a> (<abbr title="abbreviated">abbr.</abbr> UCS, official designation: <a href="/wiki/International_Organization_for_Standardization" title="International Organization for Standardization">ISO</a>/<a href="/wiki/International_Electrotechnical_Commission" title="International Electrotechnical Commission">IEC</a> 10646), is an international standard to map <a href="/wiki/Character_(computing)" title="Character (computing)">characters</a>, discrete symbols used in <a href="/wiki/Orthography" title="Orthography">natural language</a>, <a href="/wiki/Mathematical_notation" title="Mathematical notation">mathematics</a>, <a href="/wiki/Musical_notation" title="Musical notation">music</a>, and other domains, to unique <a href="/wiki/Machine-readable_data" class="mw-redirect" title="Machine-readable data">machine-readable data</a> values. By creating this mapping, the UCS enables computer <a href="/wiki/Software_company" title="Software company">software vendors</a> to <a href="/wiki/Interoperate" class="mw-redirect" title="Interoperate">interoperate</a>, and transmit—<a href="https://en.wiktionary.org/wiki/interchange" class="extiw" title="wikt:interchange">interchange</a>—<a href="/wiki/Character_encoding#Unicode_encoding_model" title="Character encoding">UCS-encoded</a> text <a href="/wiki/String_(computer_science)" title="String (computer science)">strings</a> from one to another. Because it is a <i>universal</i> map, it can be used to represent multiple languages at the same time. 
This avoids the confusion of using multiple legacy <a href="/wiki/Character_encodings" class="mw-redirect" title="Character encodings">character encodings</a>, which can result in the same sequence of codes having multiple interpretations depending on the character encoding in use, resulting in <i><a href="/wiki/Mojibake" title="Mojibake">mojibake</a></i> if the wrong one is chosen. </p><p>UCS has a potential capacity of over 1 million characters. Each UCS character is abstractly represented by a <a href="/wiki/Code_point" title="Code point">code point</a>, an integer between 0 and 1,114,111 (1,114,112 = 2<sup>20</sup> + 2<sup>16</sup> <i>or</i> 17 × 2<sup>16</sup> = <style data-mw-deduplicate="TemplateStyles:r886049734">.mw-parser-output .monospaced{font-family:monospace,monospace}</style><span class="monospaced"><a href="/wiki/Hexadecimal" title="Hexadecimal">0x</a>110000</span> <a href="/wiki/Code_points" class="mw-redirect" title="Code points">code points</a>), used to represent each character within the internal logic of <a href="/wiki/Text_processing" title="Text processing">text processing</a> software. As of <a href="/wiki/Unicode" title="Unicode">Unicode</a> 16.0, released in September 2024, 299,056 (27%) of these code points are allocated, 155,063 (14%) have been assigned characters, 137,468 (12%) are reserved for <a href="#Private-Use_Characters">private use</a>, 2,048 are used to enable the mechanism of <a href="#Surrogates">surrogates</a>, and 66 are designated as <a href="#Noncharacters">noncharacters</a>, leaving the remaining 815,056 (73%) unallocated. 
The number of encoded characters is made up as follows: </p> <ul><li>149,641 graphical characters (some of which do not have a visible <a href="/wiki/Glyph" title="Glyph">glyph</a>, but are still counted as graphical)</li> <li>237 <a href="#Special-purpose_characters">special-purpose characters</a> for <a href="/wiki/Control_character" title="Control character">control</a> and <a href="/wiki/Format_character" class="mw-redirect" title="Format character">formatting</a>.</li></ul> <p><a href="/wiki/International_Organization_for_Standardization" title="International Organization for Standardization">ISO</a> maintains the basic mapping of characters from <a href="/wiki/Character_name" class="mw-redirect" title="Character name">character name</a> to code point. Often, the terms <i>character</i> and <i>code point</i> will be used interchangeably. However, when a distinction is made, a <i>code point</i> refers to the <a href="/wiki/Integer" title="Integer">integer</a> of the character: what one might think of as its address. Meanwhile, a <i>character</i> in ISO/IEC 10646 includes the combination of the code point and its name. Unicode adds many other useful <a href="/wiki/Unicode_character_property" title="Unicode character property">properties</a> to the character set, such as <a href="/wiki/Unicode_block" title="Unicode block">block</a>, category, <a href="/wiki/Script_(Unicode)" title="Script (Unicode)">script</a>, and <a href="/wiki/Bidirectional_text" title="Bidirectional text">directionality</a>. 
</p><p>In addition to the UCS, the supplementary <a href="/wiki/Unicode_Standard" class="mw-redirect" title="Unicode Standard">Unicode Standard</a> (not a joint project with ISO, but rather a publication of the Unicode Consortium) provides other implementation details such as: </p> <ol><li>mappings between UCS and <a href="/wiki/Category:Character_sets" title="Category:Character sets">other character sets</a></li> <li>different <a href="/wiki/Collations" class="mw-redirect" title="Collations">collations</a> of characters and character strings for different languages</li> <li>an algorithm for <a href="/wiki/Page_layout" title="Page layout">laying out</a> bidirectional text ("the <a href="/wiki/Bidirectional_text#Bidirectional_script_support" title="Bidirectional text">BiDi</a> algorithm"), where text on the same line may shift between <a href="/wiki/Left_to_right" class="mw-redirect" title="Left to right">left-to-right</a> ("LTR") and <a href="/wiki/Right-to-left_script" title="Right-to-left script">right-to-left</a> ("RTL")</li> <li>a <a href="/wiki/Case_fold" class="mw-redirect" title="Case fold">case-folding</a> algorithm</li></ol> <p>Computer software <a href="/wiki/End_users" class="mw-redirect" title="End users">end users</a> enter these characters into programs through various <a href="/wiki/Input_methods" class="mw-redirect" title="Input methods">input methods</a>, for example, physical <a href="/wiki/Computer_keyboard" title="Computer keyboard">keyboards</a> or <a href="/wiki/Virtual_keyboard" title="Virtual keyboard">virtual character palettes</a>. 
</p><p>The UCS can be divided in various ways, such as by <a href="/wiki/Plane_(Unicode)" title="Plane (Unicode)">plane</a>, block, character category, or <a href="/wiki/Unicode_character_property" title="Unicode character property">character property</a>.<sup id="cite_ref-1" class="reference"><a href="#cite_note-1"><span class="cite-bracket">&#91;</span>1<span class="cite-bracket">&#93;</span></a></sup> </p> <meta property="mw:PageProp/toc" /> <div class="mw-heading mw-heading2"><h2 id="Character_reference_overview">Character reference overview</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=1" title="Edit section: Character reference overview"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">See also: <a href="/wiki/List_of_XML_and_HTML_character_entity_references" title="List of XML and HTML character entity references">List of XML and HTML character entity references</a> and <a href="/wiki/Unicode_input" title="Unicode input">Unicode input</a></div> <p>An <a href="/wiki/HTML" title="HTML">HTML</a> or <a href="/wiki/XML" title="XML">XML</a> numeric character reference refers to a character by its <a href="/wiki/Universal_Character_Set" class="mw-redirect" title="Universal Character Set">Universal Character Set</a>/Unicode code point, and uses the format </p> <dl><dd><code>&amp;#</code><i>nnnn</i><code>;</code></dd></dl> <p>or </p> <dl><dd><code>&amp;#x</code><i>hhhh</i><code>;</code></dd></dl> <p>where <i>nnnn</i> is the code point in <a href="/wiki/Decimal" title="Decimal">decimal</a> form, and <i>hhhh</i> is the code point in <a href="/wiki/Hexadecimal" title="Hexadecimal">hexadecimal</a> form. The <i>x</i> must be lowercase in XML documents. 
The <i>nnnn</i> or <i>hhhh</i> may be any number of digits and may include leading zeros. The <i>hhhh</i> may mix uppercase and lowercase, though uppercase is the usual style. </p><p>In contrast, a <i>character entity reference</i> refers to a character by the name of an <i><a href="/wiki/SGML_entity" title="SGML entity">entity</a></i> which has the desired character as its <i>replacement text</i>. The entity must either be predefined (built into the markup language) or explicitly declared in a <a href="/wiki/Document_Type_Definition" class="mw-redirect" title="Document Type Definition">Document Type Definition</a> (DTD). The format is the same as for any entity reference: </p> <dl><dd><code>&amp;</code><i>name</i><code>;</code></dd></dl> <p>where <i>name</i> is the case-sensitive name of the entity. The semicolon is required. </p> <div class="mw-heading mw-heading2"><h2 id="Planes">Planes</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=2" title="Edit section: Planes"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Plane_(Unicode)" title="Plane (Unicode)">Plane (Unicode)</a></div> <p>Unicode and ISO divide the set of code points into 17 planes, each capable of containing 65536 distinct characters, or 1,114,112 in total. As of 2024 (Unicode 16.0), ISO and the Unicode Consortium have only allocated characters and blocks in seven of the 17 planes. The others remain empty and reserved for future use. </p><p>Most characters are currently assigned to the first plane: the <i>Basic Multilingual Plane</i>. 
This is to help ease the transition for legacy software since the Basic Multilingual Plane is addressable with just two <a href="/wiki/Octet_(computing)" title="Octet (computing)">octets</a>. The characters outside the first plane usually have very specialized or rare use. </p><p>Each plane corresponds with the value of the one or two <a href="/wiki/Hexadecimal_digit" class="mw-redirect" title="Hexadecimal digit">hexadecimal digits</a> (0–9, A–F) preceding the four final ones: hence U+24321 is in Plane 2, U+4321 is in Plane 0 (implicitly read U+04321), and U+10A200 would be in Plane 16 (hex 10 = decimal 16). Within one plane, the range of code points is hexadecimal 0000–FFFF, yielding a maximum of 65536 code points. Planes restrict code points to a subset of that range. </p> <div class="mw-heading mw-heading2"><h2 id="Blocks">Blocks</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=3" title="Edit section: Blocks"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Unicode_block" title="Unicode block">Unicode block</a></div> <p>Unicode adds a block property to UCS that further divides each plane into separate blocks. Each block is a grouping of characters by their use such as "mathematical operators" or "Hebrew script characters". When assigning characters to previously unassigned code points, the Consortium typically allocates entire blocks of similar characters: for example all the characters belonging to the same script or all similarly purposed symbols get assigned to a single block. Blocks may also maintain unassigned or reserved code points when the Consortium expects a block to require additional assignments. 
</p><p>The first 256 code points in the UCS correspond with those of <a href="/wiki/ISO_8859-1" class="mw-redirect" title="ISO 8859-1">ISO 8859-1</a>, the most popular 8-bit <a href="/wiki/Character_encoding" title="Character encoding">character encoding</a> in the <a href="/wiki/Western_world" title="Western world">Western world</a>. As a result, the first 128 characters are also identical to <a href="/wiki/ASCII" title="ASCII">ASCII</a>. Though Unicode refers to these as a Latin script block, these two blocks contain many characters that are commonly useful outside of the Latin script. In general, not all characters in a given block need be of the same script, and a given script can occur in several different blocks. </p> <div class="mw-heading mw-heading2"><h2 id="Categories">Categories</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=4" title="Edit section: Categories"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Unicode assigns to every UCS character a <i>general category</i> and subcategory. The general categories are: letter, mark, number, punctuation, symbol, or control (in other words a formatting or non-graphical character). </p><p>Types include: </p> <ul><li><b>Modern, Historic, and Ancient Scripts</b>. As of 2024 (Unicode 16.0), the UCS identifies 168 scripts that are, or have been, used throughout the world. Many more are in various approval stages for future inclusion in the UCS.<sup id="cite_ref-2" class="reference"><a href="#cite_note-2"><span class="cite-bracket">&#91;</span>2<span class="cite-bracket">&#93;</span></a></sup></li> <li><b>International Phonetic Alphabet</b>. 
The UCS devotes several blocks (over 300 characters) to characters for the <a href="/wiki/International_Phonetic_Alphabet" title="International Phonetic Alphabet">International Phonetic Alphabet</a>.</li> <li><b>Combining Diacritical Marks</b>. An important advance conceived by Unicode in designing the UCS and related algorithms for handling text was the introduction of combining diacritic marks. By providing accents that can combine with any letter character, Unicode and the UCS significantly reduce the number of characters needed. While the UCS also includes precomposed characters, these were included primarily to facilitate support within UCS for non-Unicode text processing systems.</li> <li><b>Punctuation</b>. Along with unifying diacritical marks, the UCS also sought to unify punctuation across scripts. However, many scripts also contain their own punctuation when that punctuation has no similar semantics in other scripts.</li> <li><b>Symbols</b>. Many mathematical, technical, geometrical and other symbols are included within the UCS. This provides distinct symbols with their own code point or character rather than relying on switching fonts to provide symbolic glyphs. <ul><li><b>Currency</b>.</li> <li><b>Letterlike</b>. These symbols appear like combinations of many common Latin script letters such as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">℅</span>. 
Unicode designates many of the letterlike symbols as compatibility characters usually because they can be represented in plain text by substituting glyphs for a composing sequence of characters: for example substituting the glyph <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">℅</span> for the composed sequence of characters <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">c/o</span>.</li> <li><b>Number Forms</b>. Number forms primarily consist of precomposed fractions and Roman numerals. Like other areas of composing sequences of characters, the Unicode approach prefers the flexibility of composing fractions by combining characters together. In this case to create fractions, one combines numbers with the fraction slash character (U+2044). As an example of the flexibility this approach provides, there are nineteen precomposed fraction characters included within the UCS. However, there is an infinity of possible fractions. By using composing characters the infinity of fractions is handled by 11 characters (0–9 and the fraction slash). No character set could include code points for every precomposed fraction. Ideally a text system should present the same glyphs for a fraction whether it is one of the precomposed fractions (such as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">⅓</span>) or a composing sequence of characters (such as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">1⁄3</span>). 
However, web browsers are not typically that sophisticated with Unicode and text handling. Doing so ensures that precomposed fractions and combining sequence fractions will appear compatible next to each other.</li> <li><b>Arrows</b>.</li> <li><b>Mathematical</b>.</li> <li><b>Geometric Shapes</b>.</li> <li><b>Legacy Computing</b>.</li> <li><b>Control Pictures</b>. Graphical representations of many control characters.</li> <li><b>Box Drawing</b>.</li> <li><b>Block Elements</b>.</li> <li><b>Braille Patterns</b>.</li> <li><b>Optical Character Recognition</b>.</li> <li><b>Technical</b>.</li> <li><b>Dingbats</b>.</li> <li><b>Miscellaneous Symbols</b>.</li> <li><b>Emoticons</b>.</li> <li><b>Symbols and Pictographs</b>.</li> <li><b>Alchemical Symbols</b>.</li> <li><b>Game Pieces</b> (chess, checkers, go, dice, dominoes, mahjong, playing cards, and many others).</li> <li><b>Chess Symbols</b>.</li> <li><b><a href="/wiki/Tai_Xuan_Jing" class="mw-redirect" title="Tai Xuan Jing">Tai Xuan Jing</a></b>.</li> <li><b>Yijing Hexagram Symbols</b>.</li></ul></li> <li><b>CJK</b>. Devoted to ideographs and other characters to support languages in China, Japan, Korea (CJK), Taiwan, Vietnam, and Thailand. <ul><li><b>Radicals and Strokes</b>.</li> <li><b>Ideographs</b>. By far the largest portion of the UCS is devoted to ideographs used in languages of Eastern Asia. While the glyph representations of these ideographs have diverged in the languages that use them, the UCS unifies these <a href="/wiki/Han_characters" class="mw-redirect" title="Han characters">Han characters</a> in what Unicode refers to as Unihan (for Unified Han). With Unihan, the text layout software must work together with the available fonts and these Unicode characters to produce the appropriate glyph for the appropriate language. 
Despite unifying these characters, the UCS still includes over 97,000 Unihan ideographs.</li></ul></li> <li><b>Musical Notation</b>.</li> <li><b>Duployan shorthands</b>.</li> <li><b>Sutton SignWriting</b>.</li> <li><b>Compatibility Characters</b>. Several blocks in the UCS are devoted almost entirely to compatibility characters. Compatibility characters are those included for support of legacy text handling systems that do not make a distinction between character and glyph the way Unicode does. For example, many Arabic letters are represented by a different glyph when the letter appears at the end of a word than when the letter appears at the beginning of a word. Unicode's approach prefers to have these letters mapped to the same character for ease of internal machine text processing and storage. To complement this approach, the text software must select different glyph variants for display of the character based on its context. Over 4000 characters are included for such compatibility reasons.</li> <li><b>Control Characters</b>.</li> <li><b>Surrogates</b>. The UCS includes 2048 code points in the Basic Multilingual Plane (BMP) for surrogate code point pairs. Together these surrogates allow any code point in the sixteen other planes to be addressed by using two surrogate code points. This provides a simple built-in method for encoding the 20.1-bit UCS within a 16-bit encoding such as UTF-16. In this way UTF-16 can represent any character within the BMP with a single 16-bit word. Characters outside the BMP are then encoded using two 16-bit words (4 octets or bytes total) using the surrogate pairs.</li> <li><b>Private Use</b>. The consortium provides several private use blocks and planes that can be assigned characters within various communities, as well as operating system and font vendors.</li> <li><b>Noncharacters</b>. The consortium guarantees certain code points will never be assigned a character and calls these noncharacter code points. 
These include the range U+FDD0..U+FDEF, and the last two code points of each plane (ending in the hexadecimal digits FFFE and FFFF).<sup id="cite_ref-3" class="reference"><a href="#cite_note-3"><span class="cite-bracket">&#91;</span>3<span class="cite-bracket">&#93;</span></a></sup></li></ul> <div class="mw-heading mw-heading2"><h2 id="Special-purpose_characters">Special-purpose characters</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=5" title="Edit section: Special-purpose characters"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">See also: <a href="/wiki/Unicode_control_characters" title="Unicode control characters">Unicode control characters</a></div> <p>Unicode codifies over a hundred thousand characters. Most of those represent graphemes for processing as linear text. Some, however, either do not represent graphemes, or, as graphemes, require exceptional treatment.<sup id="cite_ref-4" class="reference"><a href="#cite_note-4"><span class="cite-bracket">&#91;</span>4<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-5" class="reference"><a href="#cite_note-5"><span class="cite-bracket">&#91;</span>5<span class="cite-bracket">&#93;</span></a></sup> Unlike the ASCII control characters and other characters included for legacy round-trip capabilities, these other special-purpose characters endow plain text with important semantics. </p><p>Some special characters can alter the layout of text, such as the <a href="#Grapheme_joiners_and_non-joiners">zero-width joiner and zero-width non-joiner</a>, while others do not affect text layout at all, but instead affect the way text strings are collated, matched or otherwise processed. 
Other special-purpose characters, such as the <a href="#Mathematical_invisibles">mathematical invisibles</a>, generally have no effect on text rendering, though sophisticated text layout software may choose to subtly adjust spacing around them. </p><p>Unicode does not specify the division of labor between font and text layout software (or "engine") when rendering Unicode text. Because the more complex font formats, such as <a href="/wiki/OpenType" title="OpenType">OpenType</a> or <a href="/wiki/Apple_Advanced_Typography" title="Apple Advanced Typography">Apple Advanced Typography</a>, provide for contextual substitution and positioning of glyphs, a simple text layout engine might rely entirely on the font for all decisions of glyph choice and placement. In the same situation a more complex engine may combine information from the font with its own rules to achieve its own idea of best rendering. To implement all recommendations of the Unicode specification, a text engine must be prepared to work with fonts of any level of sophistication, since contextual substitution and positioning rules do not exist in some font formats and are optional in the rest. The <a href="#Fraction_slash">fraction slash</a> is an example: complex fonts may or may not supply positioning rules in the presence of the fraction slash character to create a fraction, while fonts in simple formats cannot. </p> <div class="mw-heading mw-heading3"><h3 id="Byte_order_mark">Byte order mark</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=6" title="Edit section: Byte order mark"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>When appearing at the head of a text file or stream, the <a href="/wiki/Byte_order_mark" title="Byte order mark">byte order mark</a> (BOM) U+FEFF hints at the encoding form and its byte order. 
</p><p>If the stream's first byte is 0xFE and the second 0xFF, then the stream's text is not likely to be encoded in <a href="/wiki/UTF-8" title="UTF-8">UTF-8</a>, since those bytes are invalid in UTF-8. It is also not likely to be <a href="/wiki/UTF-16" title="UTF-16">UTF-16</a> in <a href="/wiki/Little-endian" class="mw-redirect" title="Little-endian">little-endian</a> byte order because 0xFE, 0xFF read as a 16-bit little-endian word would be U+FFFE, which is meaningless. The sequence also has no meaning in any arrangement of <a href="/wiki/UTF-32" title="UTF-32">UTF-32</a> encoding, so, in summary, it serves as a fairly reliable indication that the text stream is encoded as UTF-16 in <a href="/wiki/Big-endian" class="mw-redirect" title="Big-endian">big-endian</a> byte order. Conversely, if the first two bytes are 0xFF, 0xFE, then the text stream may be assumed to be encoded as UTF-16LE because, read as a 16-bit little-endian value, the bytes yield the expected 0xFEFF byte order mark. This assumption becomes questionable, however, if the next two bytes are both 0x00; either the text begins with a null character (U+0000), or the correct encoding is actually UTF-32LE, in which the full 4-byte sequence FF FE 00 00 is one character, the BOM. </p><p>The UTF-8 sequence corresponding to U+FEFF is 0xEF, 0xBB, 0xBF. This sequence has no meaning in other Unicode encoding forms, so it may serve to indicate that the stream is encoded as UTF-8. </p><p>The Unicode specification does not require the use of byte order marks in text streams. It further states that they should not be used in situations where some other method of signaling the encoding form is already in use. 
</p> <div class="mw-heading mw-heading3"><h3 id="Mathematical_invisibles">Mathematical invisibles</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=7" title="Edit section: Mathematical invisibles"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Primarily for mathematics, the Invisible Separator (U+2063) provides a separator between characters where punctuation or space may be omitted such as in a two-dimensional index like i⁣j. Invisible Times (U+2062) and Function Application (U+2061) are useful in mathematics text where the multiplication of terms or the application of a function is implied without any glyph indicating the operation. Unicode 5.1 introduces the Mathematical Invisible Plus character as well (U+2064) which may indicate that an integral number followed by a fraction should denote their sum, but not their product. </p> <div class="mw-heading mw-heading3"><h3 id="Fraction_slash">Fraction slash</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=8" title="Edit section: Fraction slash"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Unicode_subscripts_and_superscripts#Fraction_slash" title="Unicode subscripts and superscripts">Unicode subscripts and superscripts §&#160;Fraction slash</a></div> <figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:AppleChancery1%C2%BCFractionExample.png" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/e/ef/AppleChancery1%C2%BCFractionExample.png" decoding="async" width="194" height="86" 
class="mw-file-element" data-file-width="194" data-file-height="86" /></a><figcaption>Example of <a href="#Fraction_slash">fraction slash</a> use. This <a href="/wiki/Typeface" title="Typeface">typeface</a> (<a href="/wiki/Chancery_hand" title="Chancery hand">Apple Chancery</a>) shows the synthesized common fraction on the left and the precomposed fraction glyph on the right as a rendering of the plain text string "1 1⁄4 1¼". Depending on the text environment, the single string "1 1⁄4" might yield either result, the one on the right through substitution of the fraction sequence with the single precomposed fraction glyph.</figcaption></figure> <figure class="mw-halign-right" typeof="mw:File/Thumb"><a href="/wiki/File:AppleChancery4and221-225thsExample.svg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/a/ac/AppleChancery4and221-225thsExample.svg/220px-AppleChancery4and221-225thsExample.svg.png" decoding="async" width="220" height="66" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/a/ac/AppleChancery4and221-225thsExample.svg/330px-AppleChancery4and221-225thsExample.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/a/ac/AppleChancery4and221-225thsExample.svg/440px-AppleChancery4and221-225thsExample.svg.png 2x" data-file-width="200" data-file-height="60" /></a><figcaption>A more elaborate example of fraction slash usage: plain text "4 221⁄225" rendered in <a href="/wiki/Chancery_hand" title="Chancery hand">Apple Chancery</a>. 
This font supplies the text layout software with instructions to synthesize the fraction according to the <a href="/wiki/Unicode" title="Unicode">Unicode</a> rule described in this section.</figcaption></figure> <p>The fraction slash character (U+2044) has special behavior in the Unicode Standard:<sup id="cite_ref-6" class="reference"><a href="#cite_note-6"><span class="cite-bracket">&#91;</span>6<span class="cite-bracket">&#93;</span></a></sup> (section 6.2, Other Punctuation) </p> <blockquote><p>The standard form of a fraction built using the fraction slash is defined as follows: any sequence of one or more decimal digits (General Category = Nd), followed by the fraction slash, followed by any sequence of one or more decimal digits. Such a fraction should be displayed as a unit, such as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">¾</span>. If the displaying software is incapable of mapping the fraction to a unit, then it can also be displayed as a simple linear sequence as a fallback (for example, 3/4). If the fraction is to be separated from a previous number, then a space can be used, choosing the appropriate width (normal, thin, zero width, and so on). For example, 1 + <small>ZERO WIDTH SPACE</small> + 3 + <small>FRACTION SLASH</small> + 4 is displayed as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">1¾</span>.</p></blockquote> <p>By following this Unicode recommendation, text processing systems yield sophisticated symbols from plain text alone. Here the presence of the fraction slash character instructs the layout engine to synthesize a fraction from all consecutive digits preceding and following the slash. 
In practice, results vary because of the complicated interplay between fonts and layout engines. Simple text layout engines tend not to synthesize fractions at all, and instead draw the glyphs as a linear sequence as described in the Unicode fallback scheme. </p><p>More sophisticated layout engines face two practical choices: they can follow Unicode's recommendation, or they can rely on the font's own instructions for synthesizing fractions. By ignoring the font's instructions, the layout engine can guarantee Unicode's recommended behavior. By following the font's instructions, the layout engine can achieve better <a href="/wiki/Typography" title="Typography">typography</a> because placement and shaping of the digits will be tuned to that particular font at that particular size. </p><p>The problem with following the font's instructions is that the simpler font formats have no way to specify fraction synthesis behavior. Meanwhile, the more complex formats do not require the font to specify fraction synthesis behavior and therefore many do not. Most fonts of complex formats can instruct the layout engine to replace a plain text sequence such as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">1⁄2</span> with the precomposed <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">½</span> glyph. 
But because many of them will not issue instructions to synthesize fractions, a plain text string such as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">221⁄225</span> may well render as <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">22½25</span> (with the <span class="nounderlines" style="border: 1px solid var(--border-color-muted,#ddd); color: var(--color-base); background-color: var( --background-color-neutral-subtle, #fdfdfd); padding: 1px 1px;">½</span> being the substituted precomposed fraction, rather than synthesized). In the face of problems like this, those who wish to rely on the recommended Unicode behavior should choose fonts known to synthesize fractions or text layout software known to produce Unicode's recommended behavior regardless of font. </p> <div class="mw-heading mw-heading3"><h3 id="Bidirectional_neutral_formatting">Bidirectional neutral formatting</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=9" title="Edit section: Bidirectional neutral formatting"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Writing direction is the direction glyphs are placed on the page in relation to forward progression of characters in the Unicode string. English and other languages of Latin script have left-to-right writing direction. Several major writing scripts, such as <a href="/wiki/Arabic_alphabet" title="Arabic alphabet">Arabic</a> and <a href="/wiki/Hebrew_alphabet" title="Hebrew alphabet">Hebrew</a>, have right-to-left writing direction. 
The Unicode specification assigns a <i>directional type</i> to each character to inform text processors how sequences of characters should be ordered on the page. </p><p>While lexical characters (that is, letters) are normally specific to a single writing script, some symbols and punctuation marks are used across many writing scripts. Unicode could have created duplicate symbols in the repertoire that differ only by directional type, but chose instead to unify them and assign them a neutral directional type. They acquire direction at render time from adjacent characters. Some of these characters also have a <i>bidi-mirrored</i> property indicating the glyph should be rendered in mirror-image when used in right-to-left text. </p><p>The render-time directional type of a neutral character can remain ambiguous when the mark is placed on the boundary between directional changes. To address this, Unicode includes characters that have strong directionality, have no glyph associated with them, and are ignorable by systems that do not process bidirectional text: </p> <ul><li>Arabic letter mark (U+061C)</li> <li>Left-to-right mark (U+200E)</li> <li>Right-to-left mark (U+200F)</li></ul> <p>Surrounding a bidirectionally neutral character by the left-to-right mark will force the character to behave as a left-to-right character while surrounding it by the right-to-left mark will force it to behave as a right-to-left character. The behavior of these characters is detailed in Unicode's Bidirectional Algorithm. 
</p> <div class="mw-heading mw-heading3"><h3 id="Bidirectional_general_formatting">Bidirectional general formatting</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=10" title="Edit section: Bidirectional general formatting"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Further information: <a href="/wiki/Bidirectional_text" title="Bidirectional text">Bidirectional text</a></div> <p>While Unicode is designed to handle multiple languages, multiple writing systems and even text that flows either left-to-right or right-to-left with minimal author intervention, there are special circumstances where the mix of bidirectional text can become intricate—requiring more author control. For these circumstances, Unicode includes nine other characters to control the complex embedding of left-to-right text within right-to-left text and vice versa: </p> <ul><li>Left-to-right embedding (U+202A)</li> <li>Right-to-left embedding (U+202B)</li> <li>Pop directional formatting (U+202C)</li> <li>Left-to-right override (U+202D)</li> <li>Right-to-left override (U+202E)</li> <li>Left-to-right isolate (U+2066)</li> <li>Right-to-left isolate (U+2067)</li> <li>First strong isolate (U+2068)</li> <li>Pop directional isolate (U+2069)</li></ul> <div class="mw-heading mw-heading3"><h3 id="Interlinear_annotation_characters">Interlinear annotation characters</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=11" title="Edit section: Interlinear annotation characters"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <ul><li>Interlinear Annotation Anchor (U+FFF9)</li> 
<li>Interlinear Annotation Separator (U+FFFA)</li> <li>Interlinear Annotation Terminator (U+FFFB)</li></ul> <div class="mw-heading mw-heading3"><h3 id="Script-specific">Script-specific</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=12" title="Edit section: Script-specific"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <ul><li>Prefixed format control <ul><li>Arabic Number Sign (U+0600)</li> <li>Arabic Sign Sanah (U+0601)</li> <li>Arabic Footnote Marker (U+0602)</li> <li>Arabic Sign Safha (U+0603)</li> <li>Arabic Sign Samvat (U+0604)</li> <li>Arabic Number Mark Above (U+0605)</li> <li>Arabic End of Ayah (U+06DD)</li> <li><a href="/wiki/Syriac_Abbreviation_Mark" title="Syriac Abbreviation Mark">Syriac Abbreviation Mark</a> (U+070F)</li> <li>Arabic Pound Mark Above (U+0890)</li> <li>Arabic Piastre Mark Above (U+0891)</li> <li>Kaithi Number Sign (U+110BD)</li> <li>Kaithi Number Sign Above (U+110CD)</li></ul></li> <li>Egyptian Hieroglyphs <ul><li>Egyptian Hieroglyph Vertical Joiner (U+13430)</li> <li>Egyptian Hieroglyph Horizontal Joiner (U+13431)</li> <li>Egyptian Hieroglyph Insert At Top Start (U+13432)</li> <li>Egyptian Hieroglyph Insert At Bottom Start (U+13433)</li> <li>Egyptian Hieroglyph Insert At Top End (U+13434)</li> <li>Egyptian Hieroglyph Insert At Bottom End (U+13435)</li> <li>Egyptian Hieroglyph Overlay Middle (U+13436)</li> <li>Egyptian Hieroglyph Begin Segment (U+13437)</li> <li>Egyptian Hieroglyph End Segment (U+13438)</li> <li>Egyptian Hieroglyph Insert At Middle (U+13439)</li> <li>Egyptian Hieroglyph Insert At Top (U+1343A)</li> <li>Egyptian Hieroglyph Insert At Bottom (U+1343B)</li> <li>Egyptian Hieroglyph Begin Enclosure (U+1343C)</li> <li>Egyptian Hieroglyph End Enclosure (U+1343D)</li> <li>Egyptian Hieroglyph Begin Walled Enclosure (U+1343E)</li> <li>Egyptian Hieroglyph End Walled Enclosure 
(U+1343F)</li></ul></li> <li>Brahmi <ul><li>Brahmi Number Joiner (U+1107F)</li></ul></li> <li>Brahmi-derived script dead-character formation (<a href="/wiki/Virama" title="Virama">Virama</a> and similar diacritics) <ul><li>Devanagari Sign Virama (U+094D)</li> <li>Bengali Sign Virama (U+09CD)</li> <li>Gurmukhi Sign Virama (U+0A4D)</li> <li>Gujarati Sign Virama (U+0ACD)</li> <li>Oriya Sign Virama (U+0B4D)</li> <li>Tamil Sign Virama (U+0BCD)</li> <li>Telugu Sign Virama (U+0C4D)</li> <li>Kannada Sign Virama (U+0CCD)</li> <li>Malayalam Sign Vertical Bar Virama (U+0D3B)</li> <li>Malayalam Sign Circular Virama (U+0D3C)</li> <li>Malayalam Sign Virama (U+0D4D)</li> <li>Sinhala Sign Al-Lakuna (U+0DCA)</li> <li>Thai Character Phinthu (U+0E3A)</li> <li>Thai Character Yamakkan (U+0E4E)</li> <li>Lao Sign Pali Virama (U+0EBA)</li> <li>Myanmar Sign Virama (U+1039)</li> <li>Tagalog Sign Virama (U+1714)</li> <li>Tagalog Sign Pamudpod (U+1715)</li> <li>Hanunoo Sign Pamudpod (U+1734)</li> <li>Khmer Sign Viriam (U+17D1)</li> <li>Khmer Sign Coeng (U+17D2)</li> <li>Tai Tham Sign Sakot (U+1A60)</li> <li>Tai Tham Sign Ra Haam (U+1A7A)</li> <li>Balinese Adeg Adeg (U+1B44)</li> <li>Sundanese Sign Pamaaeh (U+1BAA)</li> <li>Sundanese Sign Virama (U+1BAB)</li> <li>Batak Pangolat (U+1BF2)</li> <li>Batak Panongonan (U+1BF3)</li> <li>Syloti Nagri Sign Hasanta (U+A806)</li> <li>Syloti Nagri Sign Alternate Hasanta (U+A82C)</li> <li>Saurashtra Sign Virama (U+A8C4)</li> <li>Rejang Virama (U+A953)</li> <li>Javanese Pangkon (U+A9C0)</li> <li>Meetei Mayek Virama (U+AAF6)</li> <li>Kharoshthi Virama (U+10A3F)</li> <li>Brahmi Virama (U+11046)</li> <li>Brahmi Sign Old Tamil Virama (U+11070)</li> <li>Kaithi Sign Virama (U+110B9)</li> <li>Chakma Virama (U+11133)</li> <li>Sharada Sign Virama (U+111C0)</li> <li>Khojki Sign Virama (U+11235)</li> <li>Khudawadi Sign Virama (U+112EA)</li> <li>Grantha Sign Virama (U+1134D)</li> <li>Tulu-Tigalari Sign Virama (U+113CE)</li> <li>Tulu-Tigalari Sign Looped Virama 
(U+113CF)</li> <li>Tulu-Tigalari Conjoiner (U+113D0)</li> <li>Newa Sign Virama (U+11442)</li> <li>Tirhuta Sign Virama (U+114C2)</li> <li>Siddham Sign Virama (U+115BF)</li> <li>Modi Sign Virama (U+1163F)</li> <li>Takri Sign Virama (U+116B6)</li> <li>Ahom Sign Killer (U+1172B)</li> <li>Dogra Sign Virama (U+11839)</li> <li>Dives Akuru Sign Halanta (U+1193D)</li> <li>Dives Akuru Virama (U+1193E)</li> <li>Nandinagari Sign Virama (U+119E0)</li> <li>Zanabazar Square Sign Virama (U+11A34)</li> <li>Zanabazar Square Subjoiner (U+11A47)</li> <li>Soyombo Subjoiner (U+11A99)</li> <li>Bhaiksuki Sign Virama (U+11C3F)</li> <li>Masaram Gondi Sign Halanta (U+11D44)</li> <li>Masaram Gondi Virama (U+11D45)</li> <li>Gunjala Gondi Virama (U+11D97)</li> <li>Kawi Sign Killer (U+11F41)</li> <li>Kawi Conjoiner (U+11F42)</li> <li>Gurung Khema Sign Tholhoma (U+1612F)</li> <li>Kirat Rai Sign Virama (U+16D6B)</li> <li>Kirat Rai Sign Saat (U+16D6C)</li></ul></li> <li>Historical Viramas with other functions <ul><li>Tibetan Mark Halanta (U+0F84)</li> <li>Myanmar Sign Asat (U+103A)</li> <li>Limbu Sign Sa-I (U+193B)</li> <li>Meetei Mayek Apun Iyek (U+ABED)</li> <li>Chakma Maayyaa (U+11134)</li></ul></li> <li>Mongolian Variation Selectors <ul><li>Mongolian Free Variation Selector One (U+180B)</li> <li>Mongolian Free Variation Selector Two (U+180C)</li> <li>Mongolian Free Variation Selector Three (U+180D)</li> <li>Mongolian Vowel Separator (U+180E)</li></ul></li> <li>Generic Variation Selectors <ul><li>Variation Selector-1 through -16 (U+FE00&#8211;U+FE0F)</li> <li>Variation Selector-17 through -256 (U+E0100&#8211;U+E01EF)</li></ul></li> <li>Tag characters (U+E0001 and U+E0020&#8211;U+E007F)</li> <li>Tifinagh <ul><li>Tifinagh Consonant Joiner (U+2D7F)</li></ul></li> <li>Ogham <ul><li>Ogham Space Mark (U+1680)</li></ul></li> <li>Ideographic <ul><li>Ideographic variation indicator (U+303E)</li> <li>Ideographic Description (U+2FF0&#8211;U+2FFB)</li></ul></li> <li>Musical Format Control <ul><li>Musical 
Symbol Begin Beam (U+1D173)</li> <li>Musical Symbol End Beam (U+1D174)</li> <li>Musical Symbol Begin Tie (U+1D175)</li> <li>Musical Symbol End Tie (U+1D176)</li> <li>Musical Symbol Begin Slur (U+1D177)</li> <li>Musical Symbol End Slur (U+1D178)</li> <li>Musical Symbol Begin Phrase (U+1D179)</li> <li>Musical Symbol End Phrase (U+1D17A)</li></ul></li> <li>Shorthand Format Control <ul><li>Shorthand Format Letter Overlap (U+1BCA0)</li> <li>Shorthand Format Continuing Overlap (U+1BCA1)</li> <li>Shorthand Format Down Step (U+1BCA2)</li> <li>Shorthand Format Up Step (U+1BCA3)</li></ul></li> <li>Deprecated Alternate Formatting <ul><li>Inhibit Symmetric Swapping (U+206A)</li> <li>Activate Symmetric Swapping (U+206B)</li> <li>Inhibit Arabic Form Shaping (U+206C)</li> <li>Activate Arabic Form Shaping (U+206D)</li> <li>National Digit Shapes (U+206E)</li> <li>Nominal Digit Shapes (U+206F)</li></ul></li></ul> <div class="mw-heading mw-heading3"><h3 id="Others">Others</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=13" title="Edit section: Others"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <ul><li>Object Replacement Character (U+FFFC)</li> <li>Replacement Character (U+FFFD)</li></ul> <div class="mw-heading mw-heading2"><h2 id="Characters_vs._code_points">Characters vs. code points</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=14" title="Edit section: Characters vs. code points"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>The term "character" is not well defined, and what we are referring to most of the time is the <a href="/wiki/Grapheme" title="Grapheme">grapheme</a>. A grapheme is represented visually by its <a href="/wiki/Glyph" title="Glyph">glyph</a>. 
The <a href="/wiki/Typeface" title="Typeface">typeface</a> (often erroneously referred to as <a href="/wiki/Font" title="Font">font</a>) used can depict visual variations of the same character. It is possible that two different graphemes can have the exact same glyph or are visually so close that the average reader cannot tell them apart. </p><p>A grapheme is almost always represented by one code point, for example the LATIN CAPITAL LETTER A is represented by only code point U+0041. </p><p>The grapheme <a href="/wiki/%C3%84" title="Ä">LATIN CAPITAL A WITH DIAERESIS Ä</a> is an example where a character can be represented by more than one code point. It can be U+00C4, or U+0041U+0308. U+0041 is the familiar A and U+0308 is the <a href="/wiki/Diaeresis_(diacritic)" title="Diaeresis (diacritic)">COMBINING DIAERESIS ̈</a>, a <a href="/wiki/Combining_diacritical_mark" class="mw-redirect" title="Combining diacritical mark">combining diacritical mark</a>. </p><p>When a combining mark is adjacent to a non-combining mark code point, text rendering applications should superimpose the combining mark onto the glyph represented by the other code point to form a grapheme according to a set of rules.<sup id="cite_ref-7" class="reference"><a href="#cite_note-7"><span class="cite-bracket">&#91;</span>7<span class="cite-bracket">&#93;</span></a></sup> </p><p>The word BÄM would therefore be three graphemes. It may be made up of three code points or more depending on how the characters are actually composed. 
</p> <div class="mw-heading mw-heading2"><h2 id="Whitespace,_joiners,_and_separators"><span id="Whitespace.2C_joiners.2C_and_separators"></span>Whitespace, joiners, and separators</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=15" title="Edit section: Whitespace, joiners, and separators"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Whitespace_character" title="Whitespace character">Whitespace character</a></div> <p>Unicode provides a list of characters it deems whitespace characters for interoperability support. Software implementations and other standards may use the term to denote a slightly different set of characters. For example, Java does not consider <span class="nowrap"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r886049734"><span class="monospaced">U+00A0</span>&#x20;</span><span class="Unicode" style="background:lightblue;line-height:1em">&#xa0;</span> <span style="font-variant: small-caps; text-transform: lowercase;">NO-BREAK SPACE</span> or <span class="nowrap"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r886049734"><span class="monospaced">U+0085</span>&#x20;</span><span style="font-size:small">&lt;control-0085&gt;</span> <span style="font-variant: small-caps; text-transform: lowercase;"></span> (NEXT LINE) to be whitespace, even though Unicode does. Whitespace characters are characters typically designated for programming environments. Often they have no syntactic meaning in such programming environments and are ignored by the machine interpreters. 
Unicode designates the legacy control characters U+0009 through U+000D and U+0085 as whitespace characters, as well as all characters whose General Category property value is Separator. There are 25 total whitespace characters as of Unicode 16.0. </p> <div class="mw-heading mw-heading3"><h3 id="Grapheme_joiners_and_non-joiners">Grapheme joiners and non-joiners</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=16" title="Edit section: Grapheme joiners and non-joiners"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>The <a href="/wiki/Zero-width_joiner" title="Zero-width joiner">zero-width joiner</a> (U+200D) and <a href="/wiki/Zero-width_non-joiner" title="Zero-width non-joiner">zero-width non-joiner</a> (U+200C) control the joining and ligation of glyphs. The joiner does not cause characters that would not otherwise join or ligate to do so, but when paired with the non-joiner these characters can be used to control the joining and ligating properties of the surrounding two joining or ligating characters. The Combining Grapheme Joiner (U+034F) is used to distinguish two base characters as one common base or digraph, mostly for underlying text processing, collation of strings, case folding and so on. </p> <div class="mw-heading mw-heading3"><h3 id="Word_joiners_and_separators">Word joiners and separators</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=17" title="Edit section: Word joiners and separators"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>The most common word separator is a space (U+0020). However, there are other word joiners and separators that also indicate a break between words and participate in line-breaking algorithms. 
The No-Break Space (U+00A0) also produces a baseline advance without a glyph but inhibits rather than enables a line-break. The Zero Width Space (U+200B) allows a line-break but provides no space: in a sense joining, rather than separating, two words. Finally, the Word Joiner (U+2060) inhibits line breaks and also involves none of the white space produced by a baseline advance. </p> <table class="wikitable"> <tbody><tr> <th></th> <th>Baseline advance</th> <th>No baseline advance </th></tr> <tr> <td><b>Allow line-break</b> <br />(Separators)</td> <td>Space U+0020</td> <td>Zero Width Space U+200B </td></tr> <tr> <td><b>Inhibit line-break</b><br />(Joiners)</td> <td>No-Break Space U+00A0</td> <td>Word Joiner U+2060 </td></tr></tbody></table> <div class="mw-heading mw-heading3"><h3 id="Other_separators">Other separators</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=18" title="Edit section: Other separators"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <ul><li>Line Separator (U+2028)</li> <li>Paragraph Separator (U+2029)</li></ul> <p>These provide Unicode with native paragraph and line separators independent of the legacy encoded ASCII control characters such as carriage return (U+000D), linefeed (U+000A), and Next Line (U+0085). Unicode does not provide for other ASCII formatting control characters which presumably then are not part of the Unicode plain text processing model. These legacy formatting control characters include Tab (U+0009), Line Tabulation or Vertical Tab (U+000B), and Form Feed (U+000C) which is also thought of as a page break. 
</p> <div class="mw-heading mw-heading3"><h3 id="Spaces">Spaces</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=19" title="Edit section: Spaces"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Further information: <a href="/wiki/Space_(punctuation)" title="Space (punctuation)">Space (punctuation)</a></div> <p>The space character (U+0020) typically input by the space bar on a keyboard serves semantically as a word separator in many languages. For legacy reasons, the UCS also includes spaces of varying sizes that are compatibility equivalents for the space character. While these spaces of varying width are important in typography, the Unicode processing model calls for such visual effects to be handled by rich text, markup and other such protocols. They are included in the Unicode repertoire primarily to handle lossless roundtrip transcoding from other character set encodings. These spaces include: </p> <ol><li>En Quad (U+2000)</li> <li>Em Quad (U+2001)</li> <li>En Space (U+2002)</li> <li>Em Space (U+2003)</li> <li>Three-Per-Em Space (U+2004)</li> <li>Four-Per-Em Space (U+2005)</li> <li>Six-Per-Em Space (U+2006)</li> <li>Figure Space (U+2007)</li> <li>Punctuation Space (U+2008)</li> <li>Thin Space (U+2009)</li> <li>Hair Space (U+200A)</li> <li>Medium Mathematical Space (U+205F)</li></ol> <p>Aside from the original ASCII space, the other spaces are all compatibility characters. In this context this means that they effectively add no semantic content to the text, but instead provide styling control. Within Unicode, this non-semantic styling control is often referred to as rich text and is outside the thrust of Unicode's goals. 
Rather than using different spaces in different contexts, this styling should instead be handled through intelligent text layout software. </p><p>Three other writing-system-specific word separators are: </p> <ul><li>Mongolian Vowel Separator (U+180E)</li> <li>Ideographic Space (U+3000): behaves as an ideographic separator and is generally rendered as white space of the same width as an ideograph.</li> <li>Ogham Space Mark (U+1680): this character is sometimes displayed with a glyph and other times as only white space.</li></ul> <div class="mw-heading mw-heading3"><h3 id="Line-break_control_characters">Line-break control characters</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=20" title="Edit section: Line-break control characters"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Several characters are designed to help control line-breaks either by discouraging them (no-break characters) or suggesting line breaks such as the soft hyphen (U+00AD) (sometimes called the "shy hyphen"). Such characters, though designed for styling, are probably indispensable for the intricate types of line-breaking they make possible. </p> <dl><dt>Break inhibiting</dt></dl> <ol><li>Non-breaking hyphen (U+2011)</li> <li>No-break space (U+00A0)</li> <li>Tibetan Mark Delimiter Tsheg Bstar (U+0F0C)</li> <li>Narrow no-break space (U+202F)</li></ol> <p>The break inhibiting characters are meant to be equivalent to a character sequence wrapped in the Word Joiner U+2060. However, the Word Joiner may be appended before or after any character that would allow a line-break to inhibit such line-breaking. 
</p> <dl><dt>Break enabling</dt></dl> <ol><li>Soft hyphen (U+00AD)</li> <li>Tibetan Mark Intersyllabic Tsheg (U+0F0B)</li> <li>Zero-width space (U+200B)</li></ol> <p>Both the break inhibiting and break enabling characters participate with other punctuation and whitespace characters to enable text imaging systems to determine line breaks within the Unicode Line Breaking Algorithm.<sup id="cite_ref-8" class="reference"><a href="#cite_note-8"><span class="cite-bracket">&#91;</span>8<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading2"><h2 id="Types_of_code_point">Types of code point</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=21" title="Edit section: Types of code point"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>All code points given some kind of purpose or use are considered designated code points. Of those, they may be assigned to an abstract character, or otherwise designated for some other purpose. </p> <div class="mw-heading mw-heading3"><h3 id="Assigned_characters">Assigned characters</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=22" title="Edit section: Assigned characters"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>The majority of code points in actual use have been assigned to abstract characters. This includes private-use characters, which though not formally designated by the Unicode standard for a particular purpose, require a sender and recipient to have agreed in advance how they should be interpreted for meaningful <a href="/wiki/Information_interchange" class="mw-redirect" title="Information interchange">information interchange</a> to take place. 
</p> <div class="mw-heading mw-heading4"><h4 id="Private-use_characters">Private-use characters</h4><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=23" title="Edit section: Private-use characters"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Private_Use_Areas" title="Private Use Areas">Private Use Areas</a></div> <p>The UCS includes 137,468 private-use characters, which are code points for private use spread across three different blocks, each called a <i>Private Use Area</i> (PUA). The Unicode standard recognizes code points within PUAs as legitimate Unicode character codes, but does not assign them any (abstract) character. Instead, individuals, organizations, software vendors, operating system vendors, font vendors and communities of end-users are free to use them as they see fit. Within closed systems, characters in the PUA can operate unambiguously, allowing such systems to represent characters or glyphs not defined in Unicode.<sup id="cite_ref-9" class="reference"><a href="#cite_note-9"><span class="cite-bracket">&#91;</span>9<span class="cite-bracket">&#93;</span></a></sup> In public systems their use is more problematic, since there is no registry and no way to prevent several organizations from adopting the same code points for different purposes. One example of such a conflict is <a href="/wiki/Apple_Inc." 
title="Apple Inc.">Apple</a>'s use of <a href="/wiki/Private_use_(unicode)" class="mw-redirect" title="Private use (unicode)">U+F8FF</a> for <a href="/wiki/Fonts_on_the_Mac#The_Apple_logo" class="mw-redirect" title="Fonts on the Mac">the Apple logo</a>, versus the <a href="/wiki/ConScript_Unicode_Registry" title="ConScript Unicode Registry">ConScript Unicode Registry</a>'s use of U+F8FF as <style data-mw-deduplicate="TemplateStyles:r920966791">.mw-parser-output span.smallcaps{font-variant:small-caps}.mw-parser-output span.smallcaps-smaller{font-size:85%}</style><span class="smallcaps">klingon mummification glyph</span> in the <a href="/wiki/Klingon_scripts" title="Klingon scripts">Klingon script</a>.<sup id="cite_ref-10" class="reference"><a href="#cite_note-10"><span class="cite-bracket">&#91;</span>10<span class="cite-bracket">&#93;</span></a></sup> </p><p>The Basic Multilingual Plane (Plane 0) contains 6,400 private-use characters in the eponymously named PUA <i>Private Use Area</i>, which ranges from U+E000 to U+F8FF. The <a href="/wiki/Private_Use_Planes" class="mw-redirect" title="Private Use Planes">Private Use Planes</a>, Plane 15 and Plane 16, each have their own PUAs of 65,534 private-use characters (with the final two code points of each plane being noncharacters). These are <i>Supplementary Private Use Area-A</i>, which ranges from U+F0000 to U+FFFFD, and <i>Supplementary Private Use Area-B</i>, which ranges from U+100000 to U+10FFFD. </p><p>PUAs are a concept inherited from certain Asian encoding systems. These systems had private use areas to encode what the Japanese call <i><a href="/wiki/Gaiji" class="mw-redirect" title="Gaiji">gaiji</a></i> (rare characters not normally found in fonts) in application-specific ways. 
</p> <div class="mw-heading mw-heading3"><h3 id="Surrogates">Surrogates</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=24" title="Edit section: Surrogates"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p><span class="anchor" id="Surrogates"></span><span class="anchor" id="Surrogate"></span> The UCS uses surrogates to address characters outside the initial <a href="/wiki/Plane_(Unicode)#Basic_Multilingual_Plane" title="Plane (Unicode)">Basic Multilingual Plane</a> without resorting to more-than-16-bit-word representations.<sup id="cite_ref-11" class="reference"><a href="#cite_note-11"><span class="cite-bracket">&#91;</span>11<span class="cite-bracket">&#93;</span></a></sup> There are 1024 "high" surrogates (D800–DBFF) and 1024 "low" surrogates (DC00–DFFF). By combining a pair of surrogates, the remaining characters in all the other planes can be addressed (1024 × 1024 = 1048576 code points in the other 16 planes). In <a href="/wiki/UTF-16" title="UTF-16">UTF-16</a>, they must always appear in pairs, as a high surrogate followed by a low surrogate, thus using 32 bits to denote one code point. </p><p>A surrogate pair denotes the code point </p> <dl><dd>10000<sub>16</sub> + (<i>H</i> - D800<sub>16</sub>) × 400<sub>16</sub> + (<i>L</i> - DC00<sub>16</sub>)</dd></dl> <p>where <i>H</i> and <i>L</i> are the numeric values of the high and low surrogates respectively.<sup id="cite_ref-12" class="reference"><a href="#cite_note-12"><span class="cite-bracket">&#91;</span>12<span class="cite-bracket">&#93;</span></a></sup> </p><p>Since high surrogate values in the range DB80–DBFF always produce values in the Private Use planes, the high surrogate range can be further divided into (normal) high surrogates (D800–DB7F) and "high private use surrogates" (DB80–DBFF). 
</p><p>Isolated surrogate code points have no general interpretation; consequently, no character code charts or names lists are provided for this range. In the <a href="/wiki/Python_(programming_language)" title="Python (programming language)">Python programming language</a>, individual surrogate codes are used to embed undecodable bytes in Unicode strings.<sup id="cite_ref-13" class="reference"><a href="#cite_note-13"><span class="cite-bracket">&#91;</span>13<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading3"><h3 id="Noncharacters">Noncharacters<span class="anchor" id="Non-characters"></span></h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=25" title="Edit section: Noncharacters"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>The unhyphenated term "noncharacter" refers to 66 code points (labeled <code>&lt;not a character&gt;</code>) permanently reserved for internal use, and therefore guaranteed to never be assigned to a character.<sup id="cite_ref-14" class="reference"><a href="#cite_note-14"><span class="cite-bracket">&#91;</span>14<span class="cite-bracket">&#93;</span></a></sup> Each of the 17 planes has its two ending code points set aside as noncharacters. So, noncharacters are: U+FFFE and U+FFFF on the BMP, U+1FFFE and U+1FFFF on Plane 1, and so on, up to U+10FFFE and U+10FFFF on Plane 16, for a total of 34 code points. In addition, there is a contiguous range of another 32 noncharacter code points in the BMP: U+FDD0..U+FDEF. Software implementations are free to use these code points for internal use. One particularly useful example of a noncharacter is the code point U+FFFE. This code point has the reverse UTF-16/UCS-2 byte sequence of the <a href="/wiki/Byte_order_mark" title="Byte order mark">byte order mark</a> (U+FEFF). 
If a stream of text contains this noncharacter, this is a good indication the text has been interpreted with the incorrect <a href="/wiki/Endianness" title="Endianness">endianness</a>. </p><p>Versions of the Unicode standard from 3.1.0 to 6.3.0 claimed that noncharacters "should never be interchanged". <a rel="nofollow" class="external text" href="https://www.unicode.org/versions/corrigendum9.html">Corrigendum #9</a> of the standard later stated that this was leading to "inappropriate over-rejection", clarifying that "[Noncharacters] are not illegal in interchange nor do they cause ill-formed Unicode text", and removing the original claim. </p> <div class="mw-heading mw-heading3"><h3 id="Reserved_code_points">Reserved code points</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=26" title="Edit section: Reserved code points"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>All other code points, being those not designated, are referred to as being reserved. These code points may be assigned for a particular use in future versions of the Unicode standard. 
</p> <div class="mw-heading mw-heading2"><h2 id="Characters,_grapheme_clusters_and_glyphs"><span id="Characters.2C_grapheme_clusters_and_glyphs"></span>Characters, grapheme clusters and glyphs</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=27" title="Edit section: Characters, grapheme clusters and glyphs"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Further information: <a href="/wiki/Unicode#Abstract_characters" title="Unicode">Unicode §&#160;Abstract characters</a></div> <p>Whereas many other character sets assign a character for every possible glyph representation of the character, Unicode seeks to treat characters separately from glyphs. This distinction is not always unambiguous; however, a few examples will help illustrate the distinction. Often two characters may be combined typographically to improve the readability of the text. For example, the three letter sequence "ffi" may be treated as a single glyph. Other character sets would often assign a code point to this glyph in addition to the individual letters: "f" and "i". </p><p>In addition, Unicode approaches <a href="/wiki/Diacritic" title="Diacritic">diacritic</a> modified letters as separate characters that, when rendered, become a single glyph. For example, an "o" with <a href="/wiki/Diaeresis_(diacritic)" title="Diaeresis (diacritic)">diaeresis</a>: "<a href="/wiki/%C3%96" title="Ö">ö</a>". Traditionally, other character sets assigned a unique character code point for each diacritic modified letter used in each language. Unicode seeks to create a more flexible approach by allowing combining diacritic characters to combine with any letter. 
This has the potential to significantly reduce the number of active code points needed for the character set. As an example, consider a language that uses the Latin script and combines the diaeresis with the upper- and lower-case letters "a", "o", and "u". With the Unicode approach, only the diaeresis diacritic character needs to be added to the character set to use with the Latin letters: "a", "A", "o", "O", "u", and "U": seven characters in all. A legacy character set needs to add six <b>precomposed</b> letters with a diaeresis in addition to the six code points it uses for the letters without diaeresis: twelve character code points in total. </p> <div class="mw-heading mw-heading3"><h3 id="Compatibility_characters">Compatibility characters</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=28" title="Edit section: Compatibility characters"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>UCS includes thousands of characters that Unicode designates as compatibility characters. These are characters that were included in UCS in order to provide distinct code points for characters that other character sets differentiate, but would not be differentiated in the Unicode approach to characters. </p><p>The chief reason for this differentiation was that Unicode makes a distinction between characters and glyphs. For example, when writing English in a <a href="/wiki/Cursive" title="Cursive">cursive</a> style, the letter "i" may take different forms depending on whether it appears at the beginning of a word, the end of a word, the middle of a word or in isolation. Languages such as <a href="/wiki/Arabic" title="Arabic">Arabic</a> written in an Arabic script are always cursive. Each letter has many different forms. UCS includes 730 Arabic form characters that decompose to just 88 unique Arabic characters. 
However, these additional Arabic characters are included so that text processing software may translate text from other character sets to UCS and back again without any loss of information crucial for non-Unicode software. </p><p>However, for UCS and Unicode in particular, the preferred approach is to always encode or map that letter to the same character no matter where it appears in a word. Then the distinct forms of each letter are determined by the font and text layout software methods. In this way, the internal memory for the characters remains identical regardless of where the character appears in a word. This greatly simplifies searching, sorting and other text processing operations. </p> <div class="mw-heading mw-heading2"><h2 id="Character_properties">Character properties</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=29" title="Edit section: Character properties"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Unicode_character_property" title="Unicode character property">Unicode character property</a></div> <p>Every character in Unicode is defined by a large and growing set of properties. Most of these properties are not part of the Universal Character Set. The properties facilitate text processing including collation or sorting of text, identifying words, sentences and graphemes, rendering or imaging text and so on. Below is a list of some of the core properties. 
There are many others documented in the Unicode Character Database.<sup id="cite_ref-15" class="reference"><a href="#cite_note-15"><span class="cite-bracket">&#91;</span>15<span class="cite-bracket">&#93;</span></a></sup> </p> <table class="wikitable"> <tbody><tr> <th>Property</th> <th>Example</th> <th>Details </th></tr> <tr> <td><b>Name</b></td> <td>LATIN CAPITAL LETTER A</td> <td>This is a permanent name assigned by the joint cooperation of Unicode and the ISO UCS. A few known poorly chosen names exist and are acknowledged (e.g. U+FE18 PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET, which is misspelled – should be BRACKET) but will not be changed, in order to ensure specification stability.<sup id="cite_ref-16" class="reference"><a href="#cite_note-16"><span class="cite-bracket">&#91;</span>16<span class="cite-bracket">&#93;</span></a></sup> </td></tr> <tr> <td><b>Code Point</b></td> <td>U+0041</td> <td>The Unicode code point is a number also permanently assigned along with the "Name" property and included in the companion UCS. The usual custom is to represent the code point as a hexadecimal number with the prefix "U+" in front. 
</td></tr> <tr> <td><b>Representative Glyph</b></td> <td><span typeof="mw:File"><a href="/wiki/File:LetterA.svg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/3/3e/LetterA.svg/24px-LetterA.svg.png" alt="Latin capital letter A" decoding="async" width="24" height="34" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/3/3e/LetterA.svg/36px-LetterA.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/3/3e/LetterA.svg/48px-LetterA.svg.png 2x" data-file-width="82" data-file-height="117" /></a></span><sup id="cite_ref-representative_17-0" class="reference"><a href="#cite_note-representative-17"><span class="cite-bracket">&#91;</span>17<span class="cite-bracket">&#93;</span></a></sup></td> <td>The representative glyphs are provided in code charts.<sup id="cite_ref-18" class="reference"><a href="#cite_note-18"><span class="cite-bracket">&#91;</span>18<span class="cite-bracket">&#93;</span></a></sup> </td></tr> <tr> <td><b>General Category</b></td> <td>Uppercase_Letter</td> <td>The general category<sup id="cite_ref-19" class="reference"><a href="#cite_note-19"><span class="cite-bracket">&#91;</span>19<span class="cite-bracket">&#93;</span></a></sup> is expressed as a two-letter sequence such as "Lu" for uppercase letter or "Nd" for decimal digit number. </td></tr> <tr> <td><b>Combining Class</b></td> <td>Not_Reordered (0)</td> <td>Since diacritics and other combining marks can be expressed with multiple characters in Unicode, the "Combining Class" property allows characters to be differentiated by the type of combining character they represent. The combining class can be expressed as an integer between 0 and 255 or as a named value. The integer values allow the combining marks to be reordered into a canonical order to make string comparison of identical strings possible. 
</td></tr> <tr> <td><b>Bidirectional Category</b></td> <td>Left_To_Right</td> <td>Indicates the type of character for applying the Unicode bidirectional algorithm. </td></tr> <tr> <td><b>Bidirectional Mirrored</b></td> <td>no</td> <td>Indicates the character's glyph must be reversed or mirrored within the bidirectional algorithm. Mirrored glyphs can be provided by font makers, extracted from other characters related through the "Bidirectional Mirroring Glyph" property or synthesized by the text rendering system. </td></tr> <tr> <td><b>Bidirectional Mirroring Glyph</b></td> <td>N/A</td> <td>This property indicates the code point of another character whose glyph can serve as the mirrored glyph for the present character when mirroring within the bidirectional algorithm. </td></tr> <tr> <td><b>Decimal Digit Value</b></td> <td>NaN</td> <td rowspan="3">For numerals, this property indicates the numeric value of the character. Decimal digits have all three values set to the same value; presentational rich text compatibility characters and other Arabic-Indic non-decimal digits typically have only the latter two properties set to the numeric value of the character; while numerals unrelated to Arabic-Indic digits, such as Roman numerals or Hangzhou/Suzhou numerals, typically have only the "Numeric Value" indicated. 
</td></tr> <tr> <td><b>Digit Value</b></td> <td>NaN </td></tr> <tr> <td><b>Numeric Value</b></td> <td>NaN </td></tr> <tr> <td><b>Ideographic</b></td> <td>False</td> <td>Indicates the character is a <a href="/wiki/CJK_ideograph" class="mw-redirect" title="CJK ideograph">CJK ideograph</a>: a <a href="/wiki/Logograph" class="mw-redirect" title="Logograph">logograph</a> in the <a href="/wiki/Han_script" class="mw-redirect" title="Han script">Han script</a>.<sup id="cite_ref-20" class="reference"><a href="#cite_note-20"><span class="cite-bracket">&#91;</span>20<span class="cite-bracket">&#93;</span></a></sup> </td></tr> <tr> <td><b>Default Ignorable</b></td> <td>False</td> <td>Indicates the character is ignorable for implementations and that no glyph, last resort glyph, or replacement character need be displayed. </td></tr> <tr> <td><b>Deprecated</b></td> <td>False</td> <td>Unicode never removes characters from the repertoire, but on occasion Unicode has deprecated a small number of characters. </td></tr></tbody></table> <p>Unicode provides an online database<sup id="cite_ref-21" class="reference"><a href="#cite_note-21"><span class="cite-bracket">&#91;</span>21<span class="cite-bracket">&#93;</span></a></sup> to interactively query the entire Unicode character repertoire by the various properties. 
</p> <div class="mw-heading mw-heading2"><h2 id="See_also">See also</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=30" title="Edit section: See also"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <ul><li><a href="/wiki/ConScript_Unicode_Registry" title="ConScript Unicode Registry">ConScript Unicode Registry</a></li> <li><a href="/wiki/Unicode_compatibility_characters" title="Unicode compatibility characters">Unicode compatibility characters</a></li></ul> <div class="mw-heading mw-heading2"><h2 id="References">References</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=31" title="Edit section: References"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <style data-mw-deduplicate="TemplateStyles:r1239543626">.mw-parser-output .reflist{margin-bottom:0.5em;list-style-type:decimal}@media screen{.mw-parser-output .reflist{font-size:90%}}.mw-parser-output .reflist .references{font-size:100%;margin-bottom:0;list-style-type:inherit}.mw-parser-output .reflist-columns-2{column-width:30em}.mw-parser-output .reflist-columns-3{column-width:25em}.mw-parser-output .reflist-columns{margin-top:0.3em}.mw-parser-output .reflist-columns ol{margin-top:0}.mw-parser-output .reflist-columns li{page-break-inside:avoid;break-inside:avoid-column}.mw-parser-output .reflist-upper-alpha{list-style-type:upper-alpha}.mw-parser-output .reflist-upper-roman{list-style-type:upper-roman}.mw-parser-output .reflist-lower-alpha{list-style-type:lower-alpha}.mw-parser-output .reflist-lower-greek{list-style-type:lower-greek}.mw-parser-output .reflist-lower-roman{list-style-type:lower-roman}</style><div class="reflist"> <div class="mw-references-wrap mw-references-columns"><ol class="references"> <li 
id="cite_note-1"><span class="mw-cite-backlink"><b><a href="#cite_ref-1">^</a></b></span> <span class="reference-text"><style data-mw-deduplicate="TemplateStyles:r1238218222">.mw-parser-output cite.citation{font-style:inherit;word-wrap:break-word}.mw-parser-output .citation q{quotes:"\"""\"""'""'"}.mw-parser-output .citation:target{background-color:rgba(0,127,255,0.133)}.mw-parser-output .id-lock-free.id-lock-free a{background:url("//upload.wikimedia.org/wikipedia/commons/6/65/Lock-green.svg")right 0.1em center/9px no-repeat}.mw-parser-output .id-lock-limited.id-lock-limited a,.mw-parser-output .id-lock-registration.id-lock-registration a{background:url("//upload.wikimedia.org/wikipedia/commons/d/d6/Lock-gray-alt-2.svg")right 0.1em center/9px no-repeat}.mw-parser-output .id-lock-subscription.id-lock-subscription a{background:url("//upload.wikimedia.org/wikipedia/commons/a/aa/Lock-red-alt-2.svg")right 0.1em center/9px no-repeat}.mw-parser-output .cs1-ws-icon a{background:url("//upload.wikimedia.org/wikipedia/commons/4/4c/Wikisource-logo.svg")right 0.1em center/12px no-repeat}body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-free a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-limited a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-registration a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-subscription a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .cs1-ws-icon a{background-size:contain;padding:0 1em 0 0}.mw-parser-output .cs1-code{color:inherit;background:inherit;border:none;padding:inherit}.mw-parser-output .cs1-hidden-error{display:none;color:var(--color-error,#d33)}.mw-parser-output .cs1-visible-error{color:var(--color-error,#d33)}.mw-parser-output .cs1-maint{display:none;color:#085;margin-left:0.3em}.mw-parser-output .cs1-kern-left{padding-left:0.2em}.mw-parser-output .cs1-kern-right{padding-right:0.2em}.mw-parser-output .citation 
.mw-selflink{font-weight:inherit}@media screen{.mw-parser-output .cs1-format{font-size:95%}html.skin-theme-clientpref-night .mw-parser-output .cs1-maint{color:#18911f}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .cs1-maint{color:#18911f}}</style><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/versions/latest/">"The Unicode Standard"</a>. The Unicode Consortium<span class="reference-accessdate">. Retrieved <span class="nowrap">2016-08-09</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=The+Unicode+Standard&amp;rft.pub=The+Unicode+Consortium&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fversions%2Flatest%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-2"><span class="mw-cite-backlink"><b><a href="#cite_ref-2">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://unicode.org/roadmaps/">"Roadmaps to Unicode"</a>. The Unicode Consortium<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2024-09-12</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Roadmaps+to+Unicode&amp;rft.pub=The+Unicode+Consortium&amp;rft_id=https%3A%2F%2Funicode.org%2Froadmaps%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-3"><span class="mw-cite-backlink"><b><a href="#cite_ref-3">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/faq/private_use.html">"FAQ - Private-Use Characters, Noncharacters, and Sentinels"</a>. <i>www.unicode.org</i><span class="reference-accessdate">. Retrieved <span class="nowrap">2023-10-24</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=www.unicode.org&amp;rft.atitle=FAQ+-+Private-Use+Characters%2C+Noncharacters%2C+and+Sentinels&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Ffaq%2Fprivate_use.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-4"><span class="mw-cite-backlink"><b><a href="#cite_ref-4">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/versions/Unicode16.0.0/core-spec/chapter-2/#G27981">"Section 2.13: Special Characters"</a>. <i>The Unicode Standard</i>. The Unicode Consortium. 
September 2024.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Unicode+Standard&amp;rft.atitle=Section+2.13%3A+Special+Characters&amp;rft.date=2024-09&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fversions%2FUnicode16.0.0%2Fcore-spec%2Fchapter-2%2F%23G27981&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-5"><span class="mw-cite-backlink"><b><a href="#cite_ref-5">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/versions/Unicode16.0.0/core-spec/chapter-4/#G124820">"Section 4.12: Characters with Unusual Properties"</a>. <i>The Unicode Standard</i>. The Unicode Consortium. September 2024.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Unicode+Standard&amp;rft.atitle=Section+4.12%3A+Characters+with+Unusual+Properties&amp;rft.date=2024-09&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fversions%2FUnicode16.0.0%2Fcore-spec%2Fchapter-4%2F%23G124820&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-6"><span class="mw-cite-backlink"><b><a href="#cite_ref-6">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/versions/Unicode16.0.0/core-spec/chapter-6/#G2000">"Section 6.2: General Punctuation"</a>. <i>The Unicode Standard</i>. The Unicode Consortium. 
September 2024.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Unicode+Standard&amp;rft.atitle=Section+6.2%3A+General+Punctuation&amp;rft.date=2024-09&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fversions%2FUnicode16.0.0%2Fcore-spec%2Fchapter-6%2F%23G2000&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-7"><span class="mw-cite-backlink"><b><a href="#cite_ref-7">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://www.unicode.org/notes/tn2/tn2-2.html">"UTN #2: A General Method for Rendering Combining Marks"</a>. <i>www.unicode.org</i><span class="reference-accessdate">. Retrieved <span class="nowrap">2020-12-16</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=www.unicode.org&amp;rft.atitle=UTN+%232%3A+A+General+Method+for+Rendering+Combining+Marks&amp;rft_id=http%3A%2F%2Fwww.unicode.org%2Fnotes%2Ftn2%2Ftn2-2.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-8"><span class="mw-cite-backlink"><b><a href="#cite_ref-8">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/reports/tr14/">"UAX #14: Unicode Line Breaking Algorithm"</a>. The Unicode Consortium. 2016-06-01<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2016-08-09</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=UAX+%2314%3A+Unicode+Line+Breaking+Algorithm&amp;rft.pub=The+Unicode+Consortium&amp;rft.date=2016-06-01&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Freports%2Ftr14%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-9"><span class="mw-cite-backlink"><b><a href="#cite_ref-9">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/versions/Unicode15.0.0/ch23.pdf#G19184">"Section 23.5: Private-Use Characters"</a> <span class="cs1-format">(PDF)</span>. <i>The Unicode Standard</i>. The Unicode Consortium. September 2022.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Unicode+Standard&amp;rft.atitle=Section+23.5%3A+Private-Use+Characters&amp;rft.date=2022-09&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fversions%2FUnicode15.0.0%2Fch23.pdf%23G19184&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-10"><span class="mw-cite-backlink"><b><a href="#cite_ref-10">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMichael_Everson2004" class="citation web cs1">Michael Everson (2004-01-15). 
<a rel="nofollow" class="external text" href="http://www.evertype.com/standards/csur/klingon.html">"Klingon: U+F8D0 - U+F8FF"</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Klingon%3A+U%2BF8D0+-+U%2BF8FF&amp;rft.date=2004-01-15&amp;rft.au=Michael+Everson&amp;rft_id=http%3A%2F%2Fwww.evertype.com%2Fstandards%2Fcsur%2Fklingon.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-11"><span class="mw-cite-backlink"><b><a href="#cite_ref-11">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/versions/Unicode15.0.0/ch23.pdf#G24089">"Section 23.6: Surrogates Area"</a> <span class="cs1-format">(PDF)</span>. <i>The Unicode Standard</i>. The Unicode Consortium. September 2022.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Unicode+Standard&amp;rft.atitle=Section+23.6%3A+Surrogates+Area&amp;rft.date=2022-09&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fversions%2FUnicode15.0.0%2Fch23.pdf%23G24089&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-12"><span class="mw-cite-backlink"><b><a href="#cite_ref-12">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFKaplan" class="citation web cs1">Kaplan, Michael. 
<a rel="nofollow" class="external text" href="https://unicode.org/iuc/iuc18/papers/a8.ppt">"Surrogate Support in Microsoft Products"</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Surrogate+Support+in+Microsoft+Products&amp;rft.aulast=Kaplan&amp;rft.aufirst=Michael&amp;rft_id=https%3A%2F%2Funicode.org%2Fiuc%2Fiuc18%2Fpapers%2Fa8.ppt&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-13"><span class="mw-cite-backlink"><b><a href="#cite_ref-13">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFv._Löwis2009" class="citation web cs1">v. Löwis, Martin (2009-04-22). <a rel="nofollow" class="external text" href="https://www.python.org/dev/peps/pep-0383/">"Non-decodable Bytes in System Character Interfaces"</a>. <i>Python Enhancement Proposals</i>. PEP 383<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2016-08-09</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Python+Enhancement+Proposals&amp;rft.atitle=Non-decodable+Bytes+in+System+Character+Interfaces&amp;rft.date=2009-04-22&amp;rft.aulast=v.+L%C3%B6wis&amp;rft.aufirst=Martin&amp;rft_id=https%3A%2F%2Fwww.python.org%2Fdev%2Fpeps%2Fpep-0383%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-14"><span class="mw-cite-backlink"><b><a href="#cite_ref-14">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/versions/Unicode15.0.0/ch23.pdf#G12612">"Section 23.7: Noncharacters"</a> <span class="cs1-format">(PDF)</span>. <i>The Unicode Standard</i>. The Unicode Consortium. September 2022.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Unicode+Standard&amp;rft.atitle=Section+23.7%3A+Noncharacters&amp;rft.date=2022-09&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fversions%2FUnicode15.0.0%2Fch23.pdf%23G12612&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-15"><span class="mw-cite-backlink"><b><a href="#cite_ref-15">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/ucd/">"Unicode Character Database"</a>. The Unicode Consortium<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2016-08-09</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Unicode+Character+Database&amp;rft.pub=The+Unicode+Consortium&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fucd%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-16"><span class="mw-cite-backlink"><b><a href="#cite_ref-16">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFFreytagMcGowanWhistler" class="citation web cs1">Freytag, Asmus; McGowan, Rick; Whistler, Ken. <a rel="nofollow" class="external text" href="https://unicode.org/notes/tn27/">"Unicode Technical Note #27 — Known Anomalies in Unicode Character Names"</a>. Unicode Consortium.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Unicode+Technical+Note+%2327+%E2%80%94+Known+Anomalies+in+Unicode+Character+Names&amp;rft.pub=Unicode+Consortium&amp;rft.aulast=Freytag&amp;rft.aufirst=Asmus&amp;rft.au=McGowan%2C+Rick&amp;rft.au=Whistler%2C+Ken&amp;rft_id=https%3A%2F%2Funicode.org%2Fnotes%2Ftn27%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-representative-17"><span class="mw-cite-backlink"><b><a href="#cite_ref-representative_17-0">^</a></b></span> <span class="reference-text">Not <i>the</i> official Unicode representative glyph, but merely <i>a</i> representative glyph. 
To see the official Unicode representative glyph, see the <a rel="nofollow" class="external text" href="https://www.unicode.org/charts/">code charts</a>.</span> </li> <li id="cite_note-18"><span class="mw-cite-backlink"><b><a href="#cite_ref-18">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/charts/">"Character Code Charts"</a>. The Unicode Consortium<span class="reference-accessdate">. Retrieved <span class="nowrap">2016-08-09</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Character+Code+Charts&amp;rft.pub=The+Unicode+Consortium&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Fcharts%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-19"><span class="mw-cite-backlink"><b><a href="#cite_ref-19">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.unicode.org/reports/tr44/#General_Category_Values">"UAX #44: Unicode Character Database"</a>. <i>General Category Values</i>. The Unicode Consortium. 2014-06-05<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2016-08-09</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=General+Category+Values&amp;rft.atitle=UAX+%2344%3A+Unicode+Character+Database&amp;rft.date=2014-06-05&amp;rft_id=https%3A%2F%2Fwww.unicode.org%2Freports%2Ftr44%2F%23General_Category_Values&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-20"><span class="mw-cite-backlink"><b><a href="#cite_ref-20">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDavisIancuWhistler" class="citation web cs1">Davis, Mark; Iancu, Laurențiu; Whistler, Ken. <a rel="nofollow" class="external text" href="https://unicode.org/reports/tr44/#Ideographic">"Table 9. Property Table § PropList.txt"</a>. <i>Unicode Standard Annex #44 — Unicode Character Database</i>. Unicode Consortium.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Unicode+Standard+Annex+%2344+%E2%80%94+Unicode+Character+Database&amp;rft.atitle=Table+9.+Property+Table+%C2%A7+PropList.txt&amp;rft.aulast=Davis&amp;rft.aufirst=Mark&amp;rft.au=Iancu%2C+Lauren%C8%9Biu&amp;rft.au=Whistler%2C+Ken&amp;rft_id=https%3A%2F%2Funicode.org%2Freports%2Ftr44%2F%23Ideographic&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> <li id="cite_note-21"><span class="mw-cite-backlink"><b><a href="#cite_ref-21">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://unicode.org/cldr/utility/properties.jsp">"Unicode Utilities: Character Property Index"</a>. 
The Unicode Consortium<span class="reference-accessdate">. Retrieved <span class="nowrap">2015-06-09</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Unicode+Utilities%3A+Character+Property+Index&amp;rft.pub=The+Unicode+Consortium&amp;rft_id=https%3A%2F%2Funicode.org%2Fcldr%2Futility%2Fproperties.jsp&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AUniversal+Character+Set+characters" class="Z3988"></span></span> </li> </ol></div></div> <div class="mw-heading mw-heading2"><h2 id="External_links">External links</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Universal_Character_Set_characters&amp;action=edit&amp;section=32" title="Edit section: External links"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1235681985"><style data-mw-deduplicate="TemplateStyles:r1237033735">@media print{body.ns-0 .mw-parser-output .sistersitebox{display:none!important}}@media screen{html.skin-theme-clientpref-night .mw-parser-output .sistersitebox img[src*="Wiktionary-logo-en-v2.svg"]{background-color:white}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .sistersitebox img[src*="Wiktionary-logo-en-v2.svg"]{background-color:white}}</style><div class="side-box side-box-right plainlinks sistersitebox"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1126788409"> <div class="side-box-flex"> <div class="side-box-image"><span class="noviewer" typeof="mw:File"><span><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/30px-Commons-logo.svg.png" decoding="async" width="30" height="40" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/45px-Commons-logo.svg.png 1.5x, 
//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/59px-Commons-logo.svg.png 2x" data-file-width="1024" data-file-height="1376" /></span></span></div> <div class="side-box-text plainlist">Wikimedia Commons has media related to <span style="font-weight: bold; font-style: italic;"><a href="https://commons.wikimedia.org/wiki/Category:Unicode" class="extiw" title="commons:Category:Unicode">Unicode</a></span>.</div></div> </div> <ul><li><a rel="nofollow" class="external text" href="https://www.unicode.org">Unicode Consortium</a></li> <li><a rel="nofollow" class="external text" href="https://web.archive.org/web/20140312143430/http://www.decodeunicode.org/">decodeunicode.org</a> Unicode Wiki with all 98,884 graphic characters of Unicode 5.0 as GIFs, full-text search</li> <li><a rel="nofollow" class="external text" href="https://unicode.org/cldr/utility/properties.jsp">Unicode Characters by Property</a></li></ul> <div class="navbox-styles"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236075235"></div><div role="navigation" class="navbox" aria-labelledby="Unicode" style="padding:3px"><table class="nowraplinks hlist mw-collapsible autocollapse navbox-inner" style="border-spacing:0;background:transparent;color:inherit"><tbody><tr><th scope="col" class="navbox-title" colspan="2"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><style data-mw-deduplicate="TemplateStyles:r1239400231">.mw-parser-output .navbar{display:inline;font-size:88%;font-weight:normal}.mw-parser-output .navbar-collapse{float:left;text-align:left}.mw-parser-output .navbar-boxtext{word-spacing:0}.mw-parser-output .navbar ul{display:inline-block;white-space:nowrap;line-height:inherit}.mw-parser-output .navbar-brackets::before{margin-right:-0.125em;content:"[ "}.mw-parser-output .navbar-brackets::after{margin-left:-0.125em;content:" ]"}.mw-parser-output 
.navbar li{word-spacing:-0.125em}.mw-parser-output .navbar a>span,.mw-parser-output .navbar a>abbr{text-decoration:inherit}.mw-parser-output .navbar-mini abbr{font-variant:small-caps;border-bottom:none;text-decoration:none;cursor:inherit}.mw-parser-output .navbar-ct-full{font-size:114%;margin:0 7em}.mw-parser-output .navbar-ct-mini{font-size:114%;margin:0 4em}html.skin-theme-clientpref-night .mw-parser-output .navbar li a abbr{color:var(--color-base)!important}@media(prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .navbar li a abbr{color:var(--color-base)!important}}@media print{.mw-parser-output .navbar{display:none!important}}</style><div class="navbar plainlinks hlist navbar-mini"><ul><li class="nv-view"><a href="/wiki/Template:Unicode_navigation" title="Template:Unicode navigation"><abbr title="View this template">v</abbr></a></li><li class="nv-talk"><a href="/wiki/Template_talk:Unicode_navigation" title="Template talk:Unicode navigation"><abbr title="Discuss this template">t</abbr></a></li><li class="nv-edit"><a href="/wiki/Special:EditPage/Template:Unicode_navigation" title="Special:EditPage/Template:Unicode navigation"><abbr title="Edit this template">e</abbr></a></li></ul></div><div id="Unicode" style="font-size:114%;margin:0 4em"><a href="/wiki/Unicode" title="Unicode">Unicode</a></div></th></tr><tr><th scope="row" class="navbox-group" style="width:1%">Unicode</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Unicode_Consortium" title="Unicode Consortium">Unicode Consortium</a></li> <li><a href="/wiki/Universal_Coded_Character_Set" title="Universal Coded Character Set">ISO/IEC 10646 (Universal Character Set)</a></li> <li><a href="/wiki/Unicode#Versions" title="Unicode">Versions</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Code_point" title="Code point">Code points</a></th><td 
class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Unicode_block" title="Unicode block">Block</a> <ul><li><a href="/wiki/Category:Unicode_blocks" title="Category:Unicode blocks">List</a></li></ul></li> <li><a class="mw-selflink selflink">Universal Character Set</a></li> <li><a href="/wiki/Category:Unicode_charts" title="Category:Unicode charts">Character charts</a></li> <li><a href="/wiki/Unicode_character_property" title="Unicode character property">Character property</a></li> <li><a href="/wiki/Plane_(Unicode)" title="Plane (Unicode)">Plane</a></li> <li><a href="/wiki/Private_Use_Areas" title="Private Use Areas">Private Use Area</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Characters</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"></div><table class="nowraplinks navbox-subgroup" style="border-spacing:0"><tbody><tr><th scope="row" class="navbox-group" style="width:12em"><a class="mw-selflink-fragment" href="#Special-purpose_characters">Special purpose</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Byte_order_mark" title="Byte order mark">BOM</a></li> <li><a href="/wiki/Combining_grapheme_joiner" title="Combining grapheme joiner">Combining grapheme joiner</a></li> <li><a href="/wiki/Left-to-right_mark" title="Left-to-right mark">Left-to-right mark</a>&#160;/ <a href="/wiki/Right-to-left_mark" title="Right-to-left mark">Right-to-left mark</a></li> <li><a href="/wiki/Soft_hyphen" title="Soft hyphen">Soft hyphen</a></li> <li><a href="/wiki/Variant_form_(Unicode)" title="Variant form (Unicode)">Variant form</a></li> <li><a href="/wiki/Word_joiner" title="Word joiner">Word joiner</a></li> <li><a href="/wiki/Zero-width_joiner" title="Zero-width joiner">Zero-width joiner</a></li> 
<li><a href="/wiki/Zero-width_non-joiner" title="Zero-width non-joiner">Zero-width non-joiner</a></li> <li><a href="/wiki/Zero-width_space" title="Zero-width space">Zero-width space</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:12em">Lists</th><td class="navbox-list-with-group navbox-list navbox-even" style="padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/List_of_Unicode_characters" title="List of Unicode characters">Characters</a></li> <li><a href="/wiki/CJK_Unified_Ideographs" title="CJK Unified Ideographs">CJK Unified Ideographs</a></li> <li><a href="/wiki/Combining_character" title="Combining character">Combining character</a></li> <li><a href="/wiki/Duplicate_characters_in_Unicode" title="Duplicate characters in Unicode">Duplicate characters</a></li> <li><a href="/wiki/Numerals_in_Unicode" title="Numerals in Unicode">Numerals</a></li> <li><a href="/wiki/Script_(Unicode)" title="Script (Unicode)">Scripts</a></li> <li><a href="/wiki/Space_(punctuation)#Spaces_in_Unicode" title="Space (punctuation)">Spaces</a></li> <li><a href="/wiki/Unicode_symbol" title="Unicode symbol">Symbols</a></li> <li><a href="/wiki/Halfwidth_and_fullwidth_forms" title="Halfwidth and fullwidth forms">Halfwidth and fullwidth</a></li> <li><a href="/wiki/Unicode_alias_names_and_abbreviations" title="Unicode alias names and abbreviations">Alias names and abbreviations</a></li> <li><a href="/wiki/Whitespace_character#Unicode" title="Whitespace character">Whitespace characters</a></li></ul> </div></td></tr></tbody></table><div></div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Processing</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"></div><table class="nowraplinks navbox-subgroup" style="border-spacing:0"><tbody><tr><th scope="row" class="navbox-group" style="width:12em">Algorithms</th><td class="navbox-list-with-group navbox-list navbox-odd" 
style="padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Bidirectional_text" title="Bidirectional text">Bidirectional text</a></li> <li><a href="/wiki/Unicode_collation_algorithm" title="Unicode collation algorithm">Collation</a> <ul><li><a href="/wiki/ISO/IEC_14651" title="ISO/IEC 14651">ISO/IEC 14651</a></li></ul></li> <li><a href="/wiki/Unicode_equivalence" title="Unicode equivalence">Equivalence</a></li> <li><a href="/wiki/Variant_form_(Unicode)" title="Variant form (Unicode)">Variation sequences</a></li> <li><a href="/wiki/International_Ideographs_Core" title="International Ideographs Core">International Ideographs Core</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:12em"><a href="/wiki/Comparison_of_Unicode_encodings" title="Comparison of Unicode encodings">Comparison of encodings</a></th><td class="navbox-list-with-group navbox-list navbox-even" style="padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Binary_Ordered_Compression_for_Unicode" title="Binary Ordered Compression for Unicode">BOCU-1</a></li> <li><a href="/wiki/CESU-8" title="CESU-8">CESU-8</a></li> <li><a href="/wiki/Punycode" title="Punycode">Punycode</a></li> <li><a href="/wiki/Standard_Compression_Scheme_for_Unicode" title="Standard Compression Scheme for Unicode">SCSU</a></li> <li><a href="/wiki/UTF-1" title="UTF-1">UTF-1</a></li> <li><a href="/wiki/UTF-7" title="UTF-7">UTF-7</a></li> <li><a href="/wiki/UTF-8" title="UTF-8">UTF-8</a></li> <li><a href="/wiki/UTF-16" title="UTF-16">UTF-16/UCS-2</a></li> <li><a href="/wiki/UTF-32" title="UTF-32">UTF-32/UCS-4</a></li> <li><a href="/wiki/UTF-EBCDIC" title="UTF-EBCDIC">UTF-EBCDIC</a></li></ul> </div></td></tr></tbody></table><div></div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">On pairs of<br />code points</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a 
href="/wiki/Combining_character" title="Combining character">Combining character</a></li> <li><a href="/wiki/Unicode_compatibility_characters" title="Unicode compatibility characters">Compatibility characters</a></li> <li><a href="/wiki/Duplicate_characters_in_Unicode" title="Duplicate characters in Unicode">Duplicate characters</a></li> <li><a href="/wiki/Unicode_equivalence" title="Unicode equivalence">Equivalence</a></li> <li><a href="/wiki/Homoglyph" title="Homoglyph">Homoglyph</a></li> <li><a href="/wiki/Precomposed_character" title="Precomposed character">Precomposed character</a> <ul><li><a href="/wiki/List_of_precomposed_Latin_characters_in_Unicode" title="List of precomposed Latin characters in Unicode">list</a></li></ul></li> <li><a href="/wiki/Z-variant" title="Z-variant">Z-variant</a></li> <li><a href="/wiki/Variant_form_(Unicode)" title="Variant form (Unicode)">Variation sequences</a></li> <li><a href="/wiki/Regional_indicator_symbol" title="Regional indicator symbol">Regional indicator symbol</a></li> <li><a href="/wiki/Emoji#Skin_color" title="Emoji">Emoji skin color</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Usage</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Internationalized_domain_name" title="Internationalized domain name">Domain names (IDN)</a></li> <li><a href="/wiki/Unicode_and_email" title="Unicode and email">Email</a></li> <li><a href="/wiki/Unicode_font" title="Unicode font">Fonts</a></li> <li><a href="/wiki/Unicode_and_HTML" title="Unicode and HTML">HTML</a> <ul><li><a href="/wiki/List_of_XML_and_HTML_character_entity_references" title="List of XML and HTML character entity references">entity references</a></li> <li><a href="/wiki/Numeric_character_reference" title="Numeric character reference">numeric references</a></li></ul></li> <li><a href="/wiki/Unicode_input" title="Unicode 
input">Input</a></li> <li><a href="/wiki/International_Ideographs_Core" title="International Ideographs Core">International Ideographs Core</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Related standards</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Common_Locale_Data_Repository" title="Common Locale Data Repository">Common Locale Data Repository (CLDR)</a></li> <li><a href="/wiki/GB_18030" title="GB 18030">GB 18030</a></li> <li><a href="/wiki/ISO/IEC_8859" title="ISO/IEC 8859">ISO/IEC 8859</a></li> <li><a href="/wiki/DIN_91379" title="DIN 91379">DIN 91379</a></li> <li><a href="/wiki/ISO_15924" title="ISO 15924">ISO 15924</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Related topics</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Unicode_anomaly" class="mw-redirect" title="Unicode anomaly">Anomalies</a></li> <li><a href="/wiki/ConScript_Unicode_Registry" title="ConScript Unicode Registry">ConScript Unicode Registry</a></li> <li><a href="/wiki/Ideographic_Research_Group" title="Ideographic Research Group">Ideographic Research Group</a></li> <li><a href="/wiki/International_Components_for_Unicode" title="International Components for Unicode">International Components for Unicode</a></li> <li><a href="/wiki/Category:People_involved_with_Unicode" title="Category:People involved with Unicode">People involved with Unicode</a></li> <li><a href="/wiki/Han_unification" title="Han unification">Han unification</a></li></ul> </div></td></tr><tr><td colspan="2" class="navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"></div><table class="nowraplinks mw-collapsible mw-collapsed navbox-subgroup" style="border-spacing:0"><tbody><tr><th scope="col" class="navbox-title" 
colspan="2"><div id="Scripts_and_symbols_in_Unicode" style="font-size:114%;margin:0 4em"><a href="/wiki/Script_(Unicode)" title="Script (Unicode)">Scripts</a> and symbols in Unicode</div></th></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Script_(Unicode)#Common_and_inherited_scripts" title="Script (Unicode)">Common and <br />inherited scripts</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Combining_character" title="Combining character">Combining marks</a></li> <li><a href="/wiki/Diacritic" title="Diacritic">Diacritics</a></li> <li><a href="/wiki/Punctuation#Punctuation_marks_in_Unicode" title="Punctuation">Punctuation marks</a></li> <li><a href="/wiki/Space_(punctuation)#Spaces_in_Unicode" title="Space (punctuation)">Spaces</a></li> <li><a href="/wiki/Numerals_in_Unicode" title="Numerals in Unicode">Numbers</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Modern scripts</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Adlam_script" title="Adlam script">Adlam</a></li> <li><a href="/wiki/Arabic_script" title="Arabic script">Arabic</a></li> <li><a href="/wiki/Armenian_alphabet" title="Armenian alphabet">Armenian</a></li> <li><a href="/wiki/Balinese_script" title="Balinese script">Balinese</a></li> <li><a href="/wiki/Bamum_script" title="Bamum script">Bamum</a></li> <li><a href="/wiki/Batak_script" title="Batak script">Batak</a></li> <li><a href="/wiki/Bengali%E2%80%93Assamese_script" title="Bengali–Assamese script">Bengali</a></li> <li><a href="/wiki/Bopomofo" title="Bopomofo">Bopomofo</a></li> <li><a href="/wiki/Braille" title="Braille">Braille</a></li> <li><a href="/wiki/Buhid_script" title="Buhid script">Buhid</a></li> <li><a href="/wiki/Mon%E2%80%93Burmese_script" title="Mon–Burmese 
script">Burmese</a></li> <li><a href="/wiki/Canadian_Aboriginal_syllabics" title="Canadian Aboriginal syllabics">Canadian Aboriginal</a></li> <li><a href="/wiki/Chakma_script" title="Chakma script">Chakma</a></li> <li><a href="/wiki/Cham_script" title="Cham script">Cham</a></li> <li><a href="/wiki/Cherokee_syllabary" title="Cherokee syllabary">Cherokee</a></li> <li><a href="/wiki/CJK_Unified_Ideographs" title="CJK Unified Ideographs">CJK Unified Ideographs (Han)</a></li> <li><a href="/wiki/Cyrillic_script_in_Unicode" title="Cyrillic script in Unicode">Cyrillic</a></li> <li><a href="/wiki/Deseret_alphabet" title="Deseret alphabet">Deseret</a></li> <li><a href="/wiki/Devanagari" title="Devanagari">Devanagari</a></li> <li><a href="/wiki/Garay_alphabet" title="Garay alphabet">Garay</a></li> <li><a href="/wiki/Ge%CA%BDez_script" title="Geʽez script">Geʽez</a></li> <li><a href="/wiki/Georgian_scripts" title="Georgian scripts">Georgian</a></li> <li><a href="/wiki/Greek_script_in_Unicode" title="Greek script in Unicode">Greek</a></li> <li><a href="/wiki/Gujarati_script" title="Gujarati script">Gujarati</a></li> <li><a href="/wiki/Gunjala_Gondi_script" title="Gunjala Gondi script">Gunjala Gondi</a></li> <li><a href="/wiki/Gurmukhi" title="Gurmukhi">Gurmukhi</a></li> <li><a href="/wiki/Gurung_Khema" class="mw-redirect" title="Gurung Khema">Gurung Khema</a></li> <li><a href="/wiki/Hangul" title="Hangul">Hangul</a></li> <li><a href="/wiki/Hanifi_Rohingya_script" title="Hanifi Rohingya script">Hanifi Rohingya</a></li> <li><a href="/wiki/Hanja" title="Hanja">Hanja</a></li> <li><a href="/wiki/Hanunoo_script" title="Hanunoo script">Hanunoo</a></li> <li><a href="/wiki/Hebrew_alphabet" title="Hebrew alphabet">Hebrew</a></li> <li><a href="/wiki/Hiragana" title="Hiragana">Hiragana</a></li> <li><a href="/wiki/Javanese_script" title="Javanese script">Javanese</a></li> <li><a href="/wiki/Kanji" title="Kanji">Kanji</a></li> <li><a href="/wiki/Kannada_script" title="Kannada 
script">Kannada</a></li> <li><a href="/wiki/Katakana" title="Katakana">Katakana</a></li> <li><a href="/wiki/Kayah_Li_alphabet" title="Kayah Li alphabet">Kayah Li</a></li> <li><a href="/wiki/Khmer_script" title="Khmer script">Khmer</a></li> <li><a href="/wiki/Kirat_Rai" title="Kirat Rai">Kirat Rai</a></li> <li><a href="/wiki/Lao_script" title="Lao script">Lao</a></li> <li><a href="/wiki/Latin_script_in_Unicode" title="Latin script in Unicode">Latin</a></li> <li><a href="/wiki/Lepcha_script" title="Lepcha script">Lepcha</a></li> <li><a href="/wiki/Limbu_script" title="Limbu script">Limbu</a></li> <li><a href="/wiki/Fraser_script" title="Fraser script">Lisu (Fraser)</a></li> <li><a href="/wiki/Lontara_script" title="Lontara script">Lontara</a></li> <li><a href="/wiki/Malayalam_script" title="Malayalam script">Malayalam</a></li> <li><a href="/wiki/Gondi_writing#Munshi_Mangal_Singh_Masaram_Script" title="Gondi writing">Masaram Gondi</a></li> <li><a href="/wiki/Mende_Kikakui_script" title="Mende Kikakui script">Mende Kikakui</a></li> <li><a href="/wiki/Medefaidrin" title="Medefaidrin">Medefaidrin</a></li> <li><a href="/wiki/Pollard_script" title="Pollard script">Miao (Pollard)</a></li> <li><a href="/wiki/Mongolian_script" title="Mongolian script">Mongolian</a></li> <li><a href="/wiki/Mru_language#Alphabet" title="Mru language">Mru</a></li> <li><a href="/wiki/N%27Ko_script" title="N&#39;Ko script">N'Ko</a></li> <li><a href="/wiki/Nag_Mundari" class="mw-redirect" title="Nag Mundari">Nag Mundari</a></li> <li><a href="/wiki/New_Tai_Lue_alphabet" title="New Tai Lue alphabet">New Tai Lue</a></li> <li><a href="/wiki/N%C3%BCshu" title="Nüshu">Nüshu</a></li> <li><a href="/wiki/Nyiakeng_Puachue_Hmong" title="Nyiakeng Puachue Hmong">Nyiakeng Puachue Hmong</a></li> <li><a href="/wiki/Odia_script" title="Odia script">Odia</a></li> <li><a href="/wiki/Ol_Chiki_script" title="Ol Chiki script">Ol Chiki</a></li> <li><a href="/wiki/Ol_Onal" title="Ol Onal">Ol Onal</a></li> <li><a 
href="/wiki/Osage_script" title="Osage script">Osage</a></li> <li><a href="/wiki/Osmanya_alphabet" title="Osmanya alphabet">Osmanya</a></li> <li><a href="/wiki/Pahawh_Hmong" title="Pahawh Hmong">Pahawh Hmong</a></li> <li><a href="/wiki/Pau_Cin_Hau_script" title="Pau Cin Hau script">Pau Cin Hau</a></li> <li><a href="/wiki/Pracalit_script" title="Pracalit script">Pracalit (Newa)</a></li> <li><a href="/wiki/Ranjana_script" title="Ranjana script">Ranjana</a></li> <li><a href="/wiki/Rejang_alphabet" title="Rejang alphabet">Rejang</a></li> <li><a href="/wiki/Samaritan_script" title="Samaritan script">Samaritan</a></li> <li><a href="/wiki/Saurashtra_script" title="Saurashtra script">Saurashtra</a></li> <li><a href="/wiki/Shavian_alphabet" title="Shavian alphabet">Shavian</a></li> <li><a href="/wiki/Sinhala_script" title="Sinhala script">Sinhala</a></li> <li><a href="/wiki/Sorang_Sompeng_script" title="Sorang Sompeng script">Sorang Sompeng</a></li> <li><a href="/wiki/Sundanese_script" title="Sundanese script">Sundanese</a></li> <li><a href="/wiki/Sunwar_language" title="Sunwar language">Sunuwar</a></li> <li><a href="/wiki/Syriac_alphabet" title="Syriac alphabet">Syriac</a></li> <li><a href="/wiki/Tagbanwa_script" title="Tagbanwa script">Tagbanwa</a></li> <li><a href="/wiki/Tai_Le_script" title="Tai Le script">Tai Le</a></li> <li><a href="/wiki/Tai_Tham_script" title="Tai Tham script">Tai Tham</a></li> <li><a href="/wiki/Tai_Dam_language#Writing_system" title="Tai Dam language">Tai Viet</a></li> <li><a href="/wiki/Tamil_script" title="Tamil script">Tamil</a></li> <li><a href="/wiki/Tangsa_language" title="Tangsa language">Tangsa</a></li> <li><a href="/wiki/Telugu_script" title="Telugu script">Telugu</a></li> <li><a href="/wiki/Thaana" title="Thaana">Thaana</a></li> <li><a href="/wiki/Thai_script" title="Thai script">Thai</a></li> <li><a href="/wiki/Tibetan_script" title="Tibetan script">Tibetan</a></li> <li><a href="/wiki/Tifinagh" title="Tifinagh">Tifinagh</a></li> <li><a 
href="/wiki/Tirhuta_script" title="Tirhuta script">Tirhuta</a></li> <li><a href="/wiki/Toto_language#Writing_system" title="Toto language">Toto</a></li> <li><a href="/wiki/Vai_syllabary" title="Vai syllabary">Vai</a></li> <li><a href="/wiki/Wancho_script" title="Wancho script">Wancho</a></li> <li><a href="/wiki/Warang_Citi" title="Warang Citi">Warang Citi</a></li> <li><a href="/wiki/Yi_script" title="Yi script">Yi</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Ancient and<br />historic scripts</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Ahom_script" title="Ahom script">Ahom</a></li> <li><a href="/wiki/Anatolian_hieroglyphs" title="Anatolian hieroglyphs">Anatolian hieroglyphs</a></li> <li><a href="/wiki/Ancient_North_Arabian" title="Ancient North Arabian">Ancient North Arabian</a></li> <li><a href="/wiki/Avestan_alphabet" title="Avestan alphabet">Avestan</a></li> <li><a href="/wiki/Bassa_Vah_alphabet" title="Bassa Vah alphabet">Bassa Vah</a></li> <li><a href="/wiki/Bhaiksuki_script" title="Bhaiksuki script">Bhaiksuki</a></li> <li><a href="/wiki/Brahmi_script" title="Brahmi script">Brāhmī</a></li> <li><a href="/wiki/Carian_alphabets" title="Carian alphabets">Carian</a></li> <li><a href="/wiki/Caucasian_Albanian_script" title="Caucasian Albanian script">Caucasian Albanian</a></li> <li><a href="/wiki/Coptic_script" title="Coptic script">Coptic</a></li> <li><a href="/wiki/Cuneiform" title="Cuneiform">Cuneiform</a></li> <li><a href="/wiki/Cypriot_syllabary" title="Cypriot syllabary">Cypriot</a></li> <li><a href="/wiki/Cypro-Minoan_syllabary" title="Cypro-Minoan syllabary">Cypro-Minoan</a></li> <li><a href="/wiki/Dhives_Akuru" title="Dhives Akuru">Dives Akuru</a></li> <li><a href="/wiki/Dogri_script" title="Dogri script">Dogra</a></li> <li><a href="/wiki/Egyptian_hieroglyphs" title="Egyptian hieroglyphs">Egyptian 
hieroglyphs</a></li> <li><a href="/wiki/Elbasan" title="Elbasan">Elbasan</a></li> <li><a href="/wiki/Elymaic" title="Elymaic">Elymaic</a></li> <li><a href="/wiki/Glagolitic_script" title="Glagolitic script">Glagolitic</a></li> <li><a href="/wiki/Gothic_alphabet" title="Gothic alphabet">Gothic</a></li> <li><a href="/wiki/Grantha_script" title="Grantha script">Grantha</a></li> <li><a href="/wiki/Hatran_alphabet" class="mw-redirect" title="Hatran alphabet">Hatran</a></li> <li><a href="/wiki/Aramaic_alphabet" title="Aramaic alphabet">Imperial Aramaic</a></li> <li><a href="/wiki/Pahlavi_scripts#Inscriptional_Pahlavi" title="Pahlavi scripts">Inscriptional Pahlavi</a></li> <li><a href="/wiki/Parthian_language#Written_Parthian" title="Parthian language">Inscriptional Parthian</a></li> <li><a href="/wiki/Kaithi" title="Kaithi">Kaithi</a></li> <li><a href="/wiki/Kawi_script" title="Kawi script">Kawi</a></li> <li><a href="/wiki/Kharosthi" title="Kharosthi">Kharosthi</a></li> <li><a href="/wiki/Khitan_small_script" title="Khitan small script">Khitan small script</a></li> <li><a href="/wiki/Khojki_script" title="Khojki script">Khojki</a></li> <li><a href="/wiki/Khudabadi_script" title="Khudabadi script">Khudawadi</a></li> <li><a href="/wiki/Khwarezmian_language" title="Khwarezmian language">Khwarezmian</a> (Chorasmian)</li> <li><a href="/wiki/Linear_A" title="Linear A">Linear A</a></li> <li><a href="/wiki/Linear_B" title="Linear B">Linear B</a></li> <li><a href="/wiki/Lycian_alphabet" title="Lycian alphabet">Lycian</a></li> <li><a href="/wiki/Lydian_alphabet" title="Lydian alphabet">Lydian</a></li> <li><a href="/wiki/Mahajani" title="Mahajani">Mahajani</a></li> <li><a href="/wiki/Makassarese_language#Writing_systems" title="Makassarese language">Makasar</a></li> <li><a href="/wiki/Mandaic_alphabet" title="Mandaic alphabet">Mandaic</a></li> <li><a href="/wiki/Manichaean_script" title="Manichaean script">Manichaean</a></li> <li><a href="/wiki/Marchen_script" title="Marchen 
script">Marchen</a></li> <li><a href="/wiki/Meitei_script" title="Meitei script">Meetei Mayek</a></li> <li><a href="/wiki/Meroitic_script" title="Meroitic script">Meroitic</a></li> <li><a href="/wiki/Modi_script" title="Modi script">Modi</a></li> <li><a href="/wiki/Multani_script" title="Multani script">Multani</a></li> <li><a href="/wiki/Nabataean_script" title="Nabataean script">Nabataean</a></li> <li><a href="/wiki/Nandinagari" title="Nandinagari">Nandinagari</a></li> <li><a href="/wiki/Ogham" title="Ogham">Ogham</a></li> <li><a href="/wiki/Old_Hungarian_script" title="Old Hungarian script">Old Hungarian</a></li> <li><a href="/wiki/Old_Italic_scripts" title="Old Italic scripts">Old Italic</a></li> <li><a href="/wiki/Old_Permic_script" title="Old Permic script">Old Permic</a></li> <li><a href="/wiki/Old_Persian_cuneiform" title="Old Persian cuneiform">Old Persian cuneiform</a></li> <li><a href="/wiki/Sogdian_alphabet" title="Sogdian alphabet">Old Sogdian</a></li> <li><a href="/wiki/Old_Turkic_script" title="Old Turkic script">Old Turkic</a></li> <li><a href="/wiki/Old_Uyghur" title="Old Uyghur">Old Uyghur</a></li> <li><a href="/wiki/Palmyrene_alphabet" title="Palmyrene alphabet">Palmyrene</a></li> <li><a href="/wiki/%CA%BCPhags-pa_script" title="ʼPhags-pa script">ʼPhags-pa</a></li> <li><a href="/wiki/Phoenician_alphabet" title="Phoenician alphabet">Phoenician</a></li> <li><a href="/wiki/Pahlavi_scripts#Psalter_Pahlavi" title="Pahlavi scripts">Psalter Pahlavi</a></li> <li><a href="/wiki/Rune" title="Rune">Runic</a></li> <li><a href="/wiki/Sharada_script" title="Sharada script">Sharada</a></li> <li><a href="/wiki/Siddha%E1%B9%83_script" title="Siddhaṃ script">Siddham</a></li> <li><a href="/wiki/Sogdian_alphabet" title="Sogdian alphabet">Sogdian</a></li> <li><a href="/wiki/Ancient_South_Arabian_script" title="Ancient South Arabian script">South Arabian</a></li> <li><a href="/wiki/Soyombo_script" title="Soyombo script">Soyombo</a></li> <li><a 
href="/wiki/Sylheti_Nagri" title="Sylheti Nagri">Sylheti Nagri</a></li> <li><a href="/wiki/Baybayin" title="Baybayin">Tagalog (Baybayin)</a></li> <li><a href="/wiki/Takri_script" title="Takri script">Takri</a></li> <li><a href="/wiki/Tangut_script" title="Tangut script">Tangut</a></li> <li><a href="/wiki/Todhri_alphabet" title="Todhri alphabet">Todhri</a></li> <li><a href="/wiki/Tigalari_script" title="Tigalari script">Tulu Tigalari</a></li> <li><a href="/wiki/Ugaritic_alphabet" title="Ugaritic alphabet">Ugaritic</a></li> <li><a href="/wiki/Vithkuqi_alphabet" title="Vithkuqi alphabet">Vithkuqi</a></li> <li><a href="/wiki/Yezidi_(script)" class="mw-redirect" title="Yezidi (script)">Yezidi</a></li> <li><a href="/wiki/Zanabazar_square_script" title="Zanabazar square script">Zanabazar Square</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Notational scripts</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Duployan_shorthand" title="Duployan shorthand">Duployan</a></li> <li><a href="/wiki/SignWriting" title="SignWriting">SignWriting</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Symbols, emojis</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Religious_and_political_symbols_in_Unicode" title="Religious and political symbols in Unicode">Cultural, political, and religious symbols</a></li> <li><a href="/wiki/Currency_symbol" title="Currency symbol">Currency</a></li> <li><a href="/wiki/Control_Pictures" title="Control Pictures">Control Pictures</a></li> <li><a href="/wiki/Mathematical_operators_and_symbols_in_Unicode" title="Mathematical operators and symbols in Unicode">Mathematical operators and symbols</a> <ul><li><a href="/wiki/Glossary_of_mathematical_symbols" title="Glossary of mathematical 
symbols">Glossary</a></li></ul></li> <li><a href="/wiki/Phonetic_symbols_in_Unicode" title="Phonetic symbols in Unicode">Phonetic symbols (including IPA)</a></li> <li><a href="/wiki/Emoji" title="Emoji">Emoji</a></li></ul> </div></td></tr><tr><td class="navbox-abovebelow" colspan="2"><div> <ul><li><span class="noviewer" typeof="mw:File"><span title="Category"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/16px-Symbol_category_class.svg.png" decoding="async" width="16" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/23px-Symbol_category_class.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/31px-Symbol_category_class.svg.png 2x" data-file-width="180" data-file-height="185" /></span></span>&#160;<a href="/wiki/Category:Unicode" title="Category:Unicode">Category: Unicode</a></li> <li><span class="noviewer" typeof="mw:File"><span title="Category"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/16px-Symbol_category_class.svg.png" decoding="async" width="16" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/23px-Symbol_category_class.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/31px-Symbol_category_class.svg.png 2x" data-file-width="180" data-file-height="185" /></span></span>&#160;<a href="/wiki/Category:Unicode_blocks" title="Category:Unicode blocks">Category: Unicode blocks</a></li></ul> </div></td></tr></tbody></table><div></div></td></tr></tbody></table></div> <!-- NewPP limit report Parsed by mw‐web.codfw.main‐6cd96847f8‐tcx5r Cached time: 20241217124915 Cache expiry: 2592000 Reduced expiry: false Complications: [vary‐revision‐sha1, show‐toc] CPU time usage: 0.529 seconds Real time usage: 0.697 seconds Preprocessor visited node count: 4557/1000000 Post‐expand include 
size: 128135/2097152 bytes Template argument size: 4579/2097152 bytes Highest expansion depth: 21/100 Expensive parser function count: 15/500 Unstrip recursion depth: 1/20 Unstrip post‐expand size: 95728/5000000 bytes Lua time usage: 0.280/10.000 seconds Lua memory usage: 7384438/52428800 bytes Number of Wikibase entities loaded: 1/400 --> <!-- Transclusion expansion time report (%,ms,calls,template) 100.00% 561.709 1 -total 28.82% 161.887 1 Template:Reflist 25.61% 143.845 20 Template:Cite_web 19.90% 111.786 1 Template:Navbox_with_columns 9.17% 51.499 1 Template:Short_description 8.88% 49.876 20 Template:Legend 8.57% 48.166 2 Template:Side_box 8.22% 46.153 4 Template:Navbox 6.94% 38.972 2 Template:Unichar 6.49% 36.467 1 Template:Unicode_navigation --> <!-- Saved in parser cache with key enwiki:pcache:10633237:|#|:idhash:canonical and timestamp 20241217124915 and revision id 1255067307. Rendering was triggered because: page-view --> </div><!--esi <esi:include src="/esitest-fa8a495983347898/content" /> --><noscript><img src="https://login.wikimedia.org/wiki/Special:CentralAutoLogin/start?useformat=desktop&amp;type=1x1&amp;usesul3=0" alt="" width="1" height="1" style="border: none; position: absolute;"></noscript> <div class="printfooter" data-nosnippet="">Retrieved from "<a dir="ltr" href="https://en.wikipedia.org/w/index.php?title=Universal_Character_Set_characters&amp;oldid=1255067307#Noncharacters">https://en.wikipedia.org/w/index.php?title=Universal_Character_Set_characters&amp;oldid=1255067307#Noncharacters</a>"</div></div> <div id="catlinks" class="catlinks" data-mw="interface"><div id="mw-normal-catlinks" class="mw-normal-catlinks"><a href="/wiki/Help:Category" title="Help:Category">Categories</a>: <ul><li><a href="/wiki/Category:IEC_standards" title="Category:IEC standards">IEC standards</a></li><li><a href="/wiki/Category:Unicode" title="Category:Unicode">Unicode</a></li></ul></div><div id="mw-hidden-catlinks" class="mw-hidden-catlinks 
mw-hidden-cats-hidden">Hidden categories: <ul><li><a href="/wiki/Category:Articles_with_short_description" title="Category:Articles with short description">Articles with short description</a></li><li><a href="/wiki/Category:Short_description_is_different_from_Wikidata" title="Category:Short description is different from Wikidata">Short description is different from Wikidata</a></li><li><a href="/wiki/Category:Commons_category_link_is_on_Wikidata" title="Category:Commons category link is on Wikidata">Commons category link is on Wikidata</a></li></ul></div></div> </div> </main> </div> <div class="mw-footer-container"> <footer id="footer" class="mw-footer" > <ul id="footer-info"> <li id="footer-info-lastmod"> This page was last edited on 2 November 2024, at 23:45<span class="anonymous-show">&#160;(UTC)</span>.</li> <li id="footer-info-copyright">Text is available under the <a href="/wiki/Wikipedia:Text_of_the_Creative_Commons_Attribution-ShareAlike_4.0_International_License" title="Wikipedia:Text of the Creative Commons Attribution-ShareAlike 4.0 International License">Creative Commons Attribution-ShareAlike 4.0 License</a>; additional terms may apply. By using this site, you agree to the <a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Terms_of_Use" class="extiw" title="foundation:Special:MyLanguage/Policy:Terms of Use">Terms of Use</a> and <a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Privacy_policy" class="extiw" title="foundation:Special:MyLanguage/Policy:Privacy policy">Privacy Policy</a>. 
Wikipedia® is a registered trademark of the <a rel="nofollow" class="external text" href="https://wikimediafoundation.org/">Wikimedia Foundation, Inc.</a>, a non-profit organization.</li> </ul> <ul id="footer-places"> <li id="footer-places-privacy"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Privacy_policy">Privacy policy</a></li> <li id="footer-places-about"><a href="/wiki/Wikipedia:About">About Wikipedia</a></li> <li id="footer-places-disclaimers"><a href="/wiki/Wikipedia:General_disclaimer">Disclaimers</a></li> <li id="footer-places-contact"><a href="//en.wikipedia.org/wiki/Wikipedia:Contact_us">Contact Wikipedia</a></li> <li id="footer-places-wm-codeofconduct"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Universal_Code_of_Conduct">Code of Conduct</a></li> <li id="footer-places-developers"><a href="https://developer.wikimedia.org">Developers</a></li> <li id="footer-places-statslink"><a href="https://stats.wikimedia.org/#/en.wikipedia.org">Statistics</a></li> <li id="footer-places-cookiestatement"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Cookie_statement">Cookie statement</a></li> <li id="footer-places-mobileview"><a href="//en.m.wikipedia.org/w/index.php?title=Universal_Character_Set_characters&amp;mobileaction=toggle_view_mobile#Noncharacters" class="noprint stopMobileRedirectToggle">Mobile view</a></li> </ul> <ul id="footer-icons" class="noprint"> <li id="footer-copyrightico"><a href="https://wikimediafoundation.org/" class="cdx-button cdx-button--fake-button cdx-button--size-large cdx-button--fake-button--enabled"><img src="/static/images/footer/wikimedia-button.svg" width="84" height="29" alt="Wikimedia Foundation" loading="lazy"></a></li> <li id="footer-poweredbyico"><a href="https://www.mediawiki.org/" class="cdx-button cdx-button--fake-button cdx-button--size-large cdx-button--fake-button--enabled"><img src="/w/resources/assets/poweredby_mediawiki.svg" alt="Powered by 
MediaWiki" width="88" height="31" loading="lazy"></a></li> </ul> </footer> </div> </div> </div> <div class="vector-settings" id="p-dock-bottom"> <ul></ul> </div><script>(RLQ=window.RLQ||[]).push(function(){mw.config.set({"wgHostname":"mw-web.codfw.main-55db797859-6955j","wgBackendResponseTime":137,"wgPageParseReport":{"limitreport":{"cputime":"0.529","walltime":"0.697","ppvisitednodes":{"value":4557,"limit":1000000},"postexpandincludesize":{"value":128135,"limit":2097152},"templateargumentsize":{"value":4579,"limit":2097152},"expansiondepth":{"value":21,"limit":100},"expensivefunctioncount":{"value":15,"limit":500},"unstrip-depth":{"value":1,"limit":20},"unstrip-size":{"value":95728,"limit":5000000},"entityaccesscount":{"value":1,"limit":400},"timingprofile":["100.00% 561.709 1 -total"," 28.82% 161.887 1 Template:Reflist"," 25.61% 143.845 20 Template:Cite_web"," 19.90% 111.786 1 Template:Navbox_with_columns"," 9.17% 51.499 1 Template:Short_description"," 8.88% 49.876 20 Template:Legend"," 8.57% 48.166 2 Template:Side_box"," 8.22% 46.153 4 Template:Navbox"," 6.94% 38.972 2 Template:Unichar"," 6.49% 36.467 1 Template:Unicode_navigation"]},"scribunto":{"limitreport-timeusage":{"value":"0.280","limit":"10.000"},"limitreport-memusage":{"value":7384438,"limit":52428800}},"cachereport":{"origin":"mw-web.codfw.main-6cd96847f8-tcx5r","timestamp":"20241217124915","ttl":2592000,"transientcontent":false}}});});</script> <script type="application/ld+json">{"@context":"https:\/\/schema.org","@type":"Article","name":"Universal Character Set characters","url":"https:\/\/en.wikipedia.org\/wiki\/Universal_Character_Set_characters#Noncharacters","sameAs":"http:\/\/www.wikidata.org\/entity\/Q897819","mainEntity":"http:\/\/www.wikidata.org\/entity\/Q897819","author":{"@type":"Organization","name":"Contributors to Wikimedia projects"},"publisher":{"@type":"Organization","name":"Wikimedia Foundation, 
Inc.","logo":{"@type":"ImageObject","url":"https:\/\/www.wikimedia.org\/static\/images\/wmf-hor-googpub.png"}},"datePublished":"2007-04-13T02:51:45Z","dateModified":"2024-11-02T23:45:39Z","image":"https:\/\/upload.wikimedia.org\/wikipedia\/commons\/0\/09\/New_Unicode_logo.svg","headline":"Wikimedia list article"}</script> </body> </html>

Pages: 1 2 3 4 5 6 7 8 9 10