//
// CHARNAMES.CPP
//
// A source file that links Unicode character names to character numbers.
// by James L. Hammons
// (C) 2004 Underground Software
//
// JLH = James L. Hammons <jlhamm@acm.org>
//
// Who When What
// --- ---------- -------------------------------------------------------------
// JLH ??/??/200? Created this file
//

/*
 * macStdNames - table of 258 glyph names stored back to back.
 *
 * Each entry is one length byte followed by exactly that many name bytes;
 * entries have no terminator of their own.  The length byte is written as
 * a separate string literal ("\x0B" "bracketleft") so that the hex escape
 * cannot absorb a following name character that happens to be a hex digit
 * (a-f, A-F).  The compiler appends a single NUL after the last entry; when
 * the table is walked by length that byte reads as a zero-length entry and
 * marks the end.
 *
 * An entry's ordinal position in the table (0..257) is its index.
 * NOTE(review): the names look like the standard Macintosh glyph set of the
 * TrueType 'post' table, using older spellings such as "CR", "mu1", "Ohm"
 * -- confirm against the code that consumes this table.
 *
 * Entry 0 is ".notdef" (7 bytes): it carries its leading dot just like
 * entry 1 (".null").
 */
unsigned char macStdNames[] = {
    "\x07"".notdef"
    "\x05"".null"
    "\x02""CR"
    "\x05""space"
    "\x06""exclam"
    "\x08""quotedbl"
    "\x0A""numbersign"
    "\x06""dollar"
    "\x07""percent"
    "\x09""ampersand"
    "\x0B""quotesingle"
    "\x09""parenleft"
    "\x0A""parenright"
    "\x08""asterisk"
    "\x04""plus"
    "\x05""comma"
    "\x06""hyphen"
    "\x06""period"
    "\x05""slash"
    "\x04""zero"
    "\x03""one"
    "\x03""two"
    "\x05""three"
    "\x04""four"
    "\x04""five"
    "\x03""six"
    "\x05""seven"
    "\x05""eight"
    "\x04""nine"
    "\x05""colon"
    "\x09""semicolon"
    "\x04""less"
    "\x05""equal"
    "\x07""greater"
    "\x08""question"
    "\x02""at"
    "\x01""A"
    "\x01""B"
    "\x01""C"
    "\x01""D"
    "\x01""E"
    "\x01""F"
    "\x01""G"
    "\x01""H"
    "\x01""I"
    "\x01""J"
    "\x01""K"
    "\x01""L"
    "\x01""M"
    "\x01""N"
    "\x01""O"
    "\x01""P"
    "\x01""Q"
    "\x01""R"
    "\x01""S"
    "\x01""T"
    "\x01""U"
    "\x01""V"
    "\x01""W"
    "\x01""X"
    "\x01""Y"
    "\x01""Z"
    "\x0B""bracketleft"
    "\x09""backslash"
    "\x0C""bracketright"
    "\x0B""asciicircum"
    "\x0A""underscore"
    "\x05""grave"
    "\x01""a"
    "\x01""b"
    "\x01""c"
    "\x01""d"
    "\x01""e"
    "\x01""f"
    "\x01""g"
    "\x01""h"
    "\x01""i"
    "\x01""j"
    "\x01""k"
    "\x01""l"
    "\x01""m"
    "\x01""n"
    "\x01""o"
    "\x01""p"
    "\x01""q"
    "\x01""r"
    "\x01""s"
    "\x01""t"
    "\x01""u"
    "\x01""v"
    "\x01""w"
    "\x01""x"
    "\x01""y"
    "\x01""z"
    "\x09""braceleft"
    "\x03""bar"
    "\x0A""braceright"
    "\x0A""asciitilde"
    "\x09""Adieresis"
    "\x05""Aring"
    "\x08""Ccedilla"
    "\x06""Eacute"
    "\x06""Ntilde"
    "\x09""Odieresis"
    "\x09""Udieresis"
    "\x06""aacute"
    "\x06""agrave"
    "\x0B""acircumflex"
    "\x09""adieresis"
    "\x06""atilde"
    "\x05""aring"
    "\x08""ccedilla"
    "\x06""eacute"
    "\x06""egrave"
    "\x0B""ecircumflex"
    "\x09""edieresis"
    "\x06""iacute"
    "\x06""igrave"
    "\x0B""icircumflex"
    "\x09""idieresis"
    "\x06""ntilde"
    "\x06""oacute"
    "\x06""ograve"
    "\x0B""ocircumflex"
    "\x09""odieresis"
    "\x06""otilde"
    "\x06""uacute"
    "\x06""ugrave"
    "\x0B""ucircumflex"
    "\x09""udieresis"
    "\x06""dagger"
    "\x06""degree"
    "\x04""cent"
    "\x08""sterling"
    "\x07""section"
    "\x06""bullet"
    "\x09""paragraph"
    "\x0A""germandbls"
    "\x0A""registered"
    "\x09""copyright"
    "\x09""trademark"
    "\x05""acute"
    "\x08""dieresis"
    "\x08""notequal"
    "\x02""AE"
    "\x06""Oslash"
    "\x08""infinity"
    "\x09""plusminus"
    "\x09""lessequal"
    "\x0C""greaterequal"
    "\x03""yen"
    "\x03""mu1"
    "\x0B""partialdiff"
    "\x09""summation"
    "\x07""product"
    "\x02""pi"
    "\x08""integral"
    "\x0B""ordfeminine"
    "\x0C""ordmasculine"
    "\x03""Ohm"
    "\x02""ae"
    "\x06""oslash"
    "\x0C""questiondown"
    "\x0A""exclamdown"
    "\x0A""logicalnot"
    "\x07""radical"
    "\x06""florin"
    "\x0B""approxequal"
    "\x09""increment"
    "\x0D""guillemotleft"
    "\x0E""guillemotright"
    "\x08""ellipsis"
    "\x07""nbspace"
    "\x06""Agrave"
    "\x06""Atilde"
    "\x06""Otilde"
    "\x02""OE"
    "\x02""oe"
    "\x06""endash"
    "\x06""emdash"
    "\x0C""quotedblleft"
    "\x0D""quotedblright"
    "\x09""quoteleft"
    "\x0A""quoteright"
    "\x06""divide"
    "\x07""lozenge"
    "\x09""ydieresis"
    "\x09""Ydieresis"
    "\x08""fraction"
    "\x08""currency"
    "\x0D""guilsinglleft"
    "\x0E""guilsinglright"
    "\x02""fi"
    "\x02""fl"
    "\x09""daggerdbl"
    "\x0E""periodcentered"
    "\x0E""quotesinglbase"
    "\x0C""quotedblbase"
    "\x0B""perthousand"
    "\x0B""Acircumflex"
    "\x0B""Ecircumflex"
    "\x06""Aacute"
    "\x09""Edieresis"
    "\x06""Egrave"
    "\x06""Iacute"
    "\x0B""Icircumflex"
    "\x09""Idieresis"
    "\x06""Igrave"
    "\x06""Oacute"
    "\x0B""Ocircumflex"
    "\x09""applelogo"
    "\x06""Ograve"
    "\x06""Uacute"
    "\x0B""Ucircumflex"
    "\x06""Ugrave"
    "\x08""dotlessi"
    "\x0A""circumflex"
    "\x05""tilde"
    "\x09""overscore"
    "\x05""breve"
    "\x09""dotaccent"
    "\x04""ring"
    "\x07""cedilla"
    "\x0C""hungarumlaut"
    "\x06""ogonek"
    "\x05""caron"
    "\x06""Lslash"
    "\x06""lslash"
    "\x06""Scaron"
    "\x06""scaron"
    "\x06""Zcaron"
    "\x06""zcaron"
    "\x09""brokenbar"
    "\x03""Eth"
    "\x03""eth"
    "\x06""Yacute"
    "\x06""yacute"
    "\x05""Thorn"
    "\x05""thorn"
    "\x05""minus"
    "\x08""multiply"
    "\x0B""onesuperior"
    "\x0B""twosuperior"
    "\x0D""threesuperior"
    "\x07""onehalf"
    "\x0A""onequarter"
    "\x0D""threequarters"
    "\x05""franc"
    "\x06""Gbreve"
    "\x06""gbreve"
    "\x04""Idot"
    "\x08""Scedilla"
    "\x08""scedilla"
    "\x06""Cacute"
    "\x06""cacute"
    "\x06""Ccaron"
    "\x06""ccaron"
    "\x07""dmacron"
};

/*struct unicodeChar
{
    int cNum;

};*/

/*
 * unicodeChars - packed code point / character name records.
 *
 * Each record is two code-point bytes, high byte first ("\x00\x20" is
 * U+0020), followed by the character's name in lowercase and an explicit
 * NUL terminator.  The code-point bytes are kept in their own string
 * literal so the second hex escape cannot absorb a leading name character
 * that is a hex digit.
 *
 * Only U+0020 through U+0023 are present.  The compiler appends one more
 * NUL after the last record, so the table ends in two NUL bytes.  Every
 * record begins with a zero byte, so the array must be walked record by
 * record and cannot be treated as a single C string.
 */
unsigned char unicodeChars[] = {
    "\x00\x20""space\0"
    "\x00\x21""exclamation mark\0"
    "\x00\x22""quotation mark\0"
    "\x00\x23""number sign\0"
};

/*
-\r
-0023 NUMBER SIGN\r
- = pound sign, hash, crosshatch, octothorpe\r
-0024 DOLLAR SIGN\r
- = milreis, escudo\r
- * glyph may have one or two vertical bars\r
- * other currency symbol characters: 20A0-20AF\r
- x (currency sign - 00A4)\r
-0025 PERCENT SIGN\r
- x (arabic percent sign - 066A)\r
- x (per mille sign - 2030)\r
- x (per ten thousand sign - 2031)\r
-0026 AMPERSAND\r
-0027 APOSTROPHE\r
- = APOSTROPHE-QUOTE\r
- = APL quote\r
- * neutral (vertical) glyph having mixed usage\r
- * preferred character for apostrophe is 2019\r
- * preferred characters in English for paired quotation marks are 2018 & 2019\r
- x (modifier letter prime - 02B9)\r
- x (modifier letter apostrophe - 02BC)\r
- x (modifier letter vertical line - 02C8)\r
- x (combining acute accent - 0301)\r
- x (prime - 2032)\r
-0028 LEFT PARENTHESIS\r
- = OPENING PARENTHESIS\r
-0029 RIGHT PARENTHESIS\r
- = CLOSING PARENTHESIS\r
- * see discussion on semantics of paired bracketing characters\r
-002A ASTERISK\r
- = star (on phone keypads)\r
- x (arabic five pointed star - 066D)\r
- x (asterisk operator - 2217)\r
- x (heavy asterisk - 2731)\r
-002B PLUS SIGN\r
-002C COMMA\r
- = decimal separator\r
- x (arabic comma - 060C)\r
- x (single low-9 quotation mark - 201A)\r
- x (ideographic comma - 3001)\r
-002D HYPHEN-MINUS\r
- = hyphen or minus sign\r
- * used for either hyphen or minus sign\r
- x (hyphen - 2010)\r
- x (non-breaking hyphen - 2011)\r
- x (figure dash - 2012)\r
- x (en dash - 2013)\r
- x (minus sign - 2212)\r
-002E FULL STOP\r
- = PERIOD\r
- = dot, decimal point\r
- * may be rendered as a raised decimal point in old style numbers\r
- x (arabic full stop - 06D4)\r
- x (ideographic full stop - 3002)\r
-002F SOLIDUS\r
- = SLASH\r
- = virgule, shilling (British)\r
- x (latin letter dental click - 01C0)\r
- x (combining long solidus overlay - 0338)\r
- x (fraction slash - 2044)\r
- x (division slash - 2215)\r
-0030 DIGIT ZERO\r
-0031 DIGIT ONE\r
-0032 DIGIT TWO\r
-0033 DIGIT THREE\r
-0034 DIGIT FOUR\r
-0035 DIGIT FIVE\r
-0036 DIGIT SIX\r
-0037 DIGIT SEVEN\r
-0038 DIGIT EIGHT\r
-0039 DIGIT NINE\r
-003A COLON\r
- x (armenian full stop - 0589)\r
- x (hebrew punctuation sof pasuq - 05C3)\r
- x (ratio - 2236)\r
-003B SEMICOLON\r
- x (greek question mark - 037E)\r
- x (arabic semicolon - 061B)\r
-003C LESS-THAN SIGN\r
- x (single left-pointing angle quotation mark - 2039)\r
- x (left-pointing angle bracket - 2329)\r
- x (left angle bracket - 3008)\r
-003D EQUALS SIGN\r
- * other related characters: 2241-2263\r
- x (not equal to - 2260)\r
- x (identical to - 2261)\r
-003E GREATER-THAN SIGN\r
- x (single right-pointing angle quotation mark - 203A)\r
- x (right-pointing angle bracket - 232A)\r
- x (right angle bracket - 3009)\r
-003F QUESTION MARK\r
- x (inverted question mark - 00BF)\r
- x (greek question mark - 037E)\r
- x (arabic question mark - 061F)\r
- x (interrobang - 203D)\r
- x (question exclamation mark - 2048)\r
- x (exclamation question mark - 2049)\r
-0040 COMMERCIAL AT\r
-0041 LATIN CAPITAL LETTER A\r
-0042 LATIN CAPITAL LETTER B\r
- x (script capital b - 212C)\r
-0043 LATIN CAPITAL LETTER C\r
- x (double-struck capital c - 2102)\r
- x (black-letter capital c - 212D)\r
-0044 LATIN CAPITAL LETTER D\r
-0045 LATIN CAPITAL LETTER E\r
- x (euler constant - 2107)\r
- x (script capital e - 2130)\r
-0046 LATIN CAPITAL LETTER F\r
- x (script capital f - 2131)\r
- x (turned capital f - 2132)\r
-0047 LATIN CAPITAL LETTER G\r
-0048 LATIN CAPITAL LETTER H\r
- x (script capital h - 210B)\r
- x (black-letter capital h - 210C)\r
- x (double-struck capital h - 210D)\r
-0049 LATIN CAPITAL LETTER I\r
- * Turkish and Azerbaijani use 0131 for lowercase\r
- x (latin capital letter i with dot above - 0130)\r
- x (cyrillic capital letter byelorussian-ukrainian i - 0406)\r
- x (cyrillic letter palochka - 04C0)\r
- x (script capital i - 2110)\r
- x (black-letter capital i - 2111)\r
- x (roman numeral one - 2160)\r
-004A LATIN CAPITAL LETTER J\r
-004B LATIN CAPITAL LETTER K\r
- x (kelvin sign - 212A)\r
-004C LATIN CAPITAL LETTER L\r
- x (script capital l - 2112)\r
-004D LATIN CAPITAL LETTER M\r
- x (script capital m - 2133)\r
-004E LATIN CAPITAL LETTER N\r
- x (double-struck capital n - 2115)\r
-004F LATIN CAPITAL LETTER O\r
-0050 LATIN CAPITAL LETTER P\r
- x (double-struck capital p - 2119)\r
-0051 LATIN CAPITAL LETTER Q\r
- x (double-struck capital q - 211A)\r
-0052 LATIN CAPITAL LETTER R\r
- x (script capital r - 211B)\r
- x (black-letter capital r - 211C)\r
- x (double-struck capital r - 211D)\r
-0053 LATIN CAPITAL LETTER S\r
-0054 LATIN CAPITAL LETTER T\r
-0055 LATIN CAPITAL LETTER U\r
-0056 LATIN CAPITAL LETTER V\r
-0057 LATIN CAPITAL LETTER W\r
-0058 LATIN CAPITAL LETTER X\r
-0059 LATIN CAPITAL LETTER Y\r
-005A LATIN CAPITAL LETTER Z\r
- x (double-struck capital z - 2124)\r
- x (black-letter capital z - 2128)\r
-005B LEFT SQUARE BRACKET\r
- = OPENING SQUARE BRACKET\r
- * other bracket characters: 3008-301B\r
-005C REVERSE SOLIDUS\r
- = BACKSLASH\r
- x (set minus - 2216)\r
-005D RIGHT SQUARE BRACKET\r
- = CLOSING SQUARE BRACKET\r
-005E CIRCUMFLEX ACCENT\r
- * this is a spacing character\r
- x (modifier letter up arrowhead - 02C4)\r
- x (modifier letter circumflex accent - 02C6)\r
- x (combining circumflex accent - 0302)\r
- x (up arrowhead - 2303)\r
-005F LOW LINE\r
- = SPACING UNDERSCORE\r
- * this is a spacing character\r
- x (modifier letter low macron - 02CD)\r
- x (combining macron below - 0331)\r
- x (combining low line - 0332)\r
- x (double low line - 2017)\r
-0060 GRAVE ACCENT\r
- * this is a spacing character\r
- x (modifier letter grave accent - 02CB)\r
- x (combining grave accent - 0300)\r
- x (reversed prime - 2035)\r
-0061 LATIN SMALL LETTER A\r
-0062 LATIN SMALL LETTER B\r
-0063 LATIN SMALL LETTER C\r
-0064 LATIN SMALL LETTER D\r
-0065 LATIN SMALL LETTER E\r
- x (estimated symbol - 212E)\r
- x (script small e - 212F)\r
-0066 LATIN SMALL LETTER F\r
-0067 LATIN SMALL LETTER G\r
- x (latin small letter script g - 0261)\r
- x (script small g - 210A)\r
-0068 LATIN SMALL LETTER H\r
- x (cyrillic small letter shha - 04BB)\r
- x (planck constant - 210E)\r
-0069 LATIN SMALL LETTER I\r
- * Turkish and Azerbaijani use 0130 for uppercase\r
- x (latin small letter dotless i - 0131)\r
-006A LATIN SMALL LETTER J\r
-006B LATIN SMALL LETTER K\r
-006C LATIN SMALL LETTER L\r
- x (script small l - 2113)\r
-006D LATIN SMALL LETTER M\r
-006E LATIN SMALL LETTER N\r
- x (superscript latin small letter n - 207F)\r
-006F LATIN SMALL LETTER O\r
- x (script small o - 2134)\r
-0070 LATIN SMALL LETTER P\r
-0071 LATIN SMALL LETTER Q\r
-0072 LATIN SMALL LETTER R\r
-0073 LATIN SMALL LETTER S\r
-0074 LATIN SMALL LETTER T\r
-0075 LATIN SMALL LETTER U\r
-0076 LATIN SMALL LETTER V\r
-0077 LATIN SMALL LETTER W\r
-0078 LATIN SMALL LETTER X\r
-0079 LATIN SMALL LETTER Y\r
-007A LATIN SMALL LETTER Z\r
- x (latin small letter z with stroke - 01B6)\r
-007B LEFT CURLY BRACKET\r
- = OPENING CURLY BRACKET\r
- = opening brace\r
-007C VERTICAL LINE\r
- = VERTICAL BAR\r
- * used in pairs to indicate absolute value\r
- x (latin letter dental click - 01C0)\r
- x (hebrew punctuation paseq - 05C0)\r
- x (divides - 2223)\r
- x (light vertical bar - 2758)\r
-007D RIGHT CURLY BRACKET\r
- = CLOSING CURLY BRACKET\r
- = closing brace\r
-007E TILDE\r
- * this is a spacing character\r
- x (small tilde - 02DC)\r
- x (combining tilde - 0303)\r
- x (tilde operator - 223C)\r
- x (fullwidth tilde - FF5E)\r
-007F <control>\r
- = DELETE\r
-@@ 0080 C1 Controls and Latin-1 Supplement (Latin-1 Supplement) 00FF\r
-@ C1 controls\r
-@+ Alias names are those for ISO 6429.\r
-0080 <control>\r
-0081 <control>\r
-0082 <control>\r
- = BREAK PERMITTED HERE\r
-0083 <control>\r
- = NO BREAK HERE\r
-0084 <control>\r
-0085 <control>\r
- = NEXT LINE\r
-0086 <control>\r
- = START OF SELECTED AREA\r
-0087 <control>\r
- = END OF SELECTED AREA\r
-0088 <control>\r
- = CHARACTER TABULATION SET\r
-0089 <control>\r
- = CHARACTER TABULATION WITH JUSTIFICATION\r
-008A <control>\r
- = LINE TABULATION SET\r
-008B <control>\r
- = PARTIAL LINE DOWN\r
-008C <control>\r
- = PARTIAL LINE UP\r
-008D <control>\r
- = REVERSE LINE FEED\r
-008E <control>\r
- = SINGLE SHIFT TWO\r
-008F <control>\r
- = SINGLE SHIFT THREE\r
-0090 <control>\r
- = DEVICE CONTROL STRING\r
-0091 <control>\r
- = PRIVATE USE ONE\r
-0092 <control>\r
- = PRIVATE USE TWO\r
-0093 <control>\r
- = SET TRANSMIT STATE\r
-0094 <control>\r
- = CANCEL CHARACTER\r
-0095 <control>\r
- = MESSAGE WAITING\r
-0096 <control>\r
- = START OF GUARDED AREA\r
-0097 <control>\r
- = END OF GUARDED AREA\r
-0098 <control>\r
- = START OF STRING\r
-0099 <control>\r
-009A <control>\r
- = SINGLE CHARACTER INTRODUCER\r
-009B <control>\r
- = CONTROL SEQUENCE INTRODUCER\r
-009C <control>\r
- = STRING TERMINATOR\r
-009D <control>\r
- = OPERATING SYSTEM COMMAND\r
-009E <control>\r
- = PRIVACY MESSAGE\r
-009F <control>\r
- = APPLICATION PROGRAM COMMAND\r
-@ ISO 8859-1 (aka Latin-1)\r
-00A0 NO-BREAK SPACE\r
- x (space - 0020)\r
- x (figure space - 2007)\r
- x (narrow no-break space - 202F)\r
- x (zero width no-break space - FEFF)\r
- # <noBreak> 0020\r
-00A1 INVERTED EXCLAMATION MARK\r
- * Spanish, Asturian, Galician\r
- x (exclamation mark - 0021)\r
-00A2 CENT SIGN\r
-00A3 POUND SIGN\r
- = pound sterling, Irish punt\r
- x (lira sign - 20A4)\r
-00A4 CURRENCY SIGN\r
- = Filzlaus, Ricardi-Sonne (German names)\r
- * other currency symbol characters: 20A0-20AF\r
- x (dollar sign - 0024)\r
-00A5 YEN SIGN\r
- = yuan sign\r
- * glyph may have one or two crossbars\r
-00A6 BROKEN BAR\r
- = BROKEN VERTICAL BAR\r
- = parted rule (in typography)\r
-00A7 SECTION SIGN\r
- * paragraph sign in some European usage\r
-00A8 DIAERESIS\r
- * this is a spacing character\r
- x (combining diaeresis - 0308)\r
- # 0020 0308\r
-00A9 COPYRIGHT SIGN\r
- x (sound recording copyright - 2117)\r
-00AA FEMININE ORDINAL INDICATOR\r
- * Spanish\r
- # <super> 0061\r
-00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK *\r
- = LEFT POINTING GUILLEMET\r
- = chevrons (in typography)\r
- * usually opening, sometimes closing\r
- x (much less-than - 226A)\r
- x (left double angle bracket - 300A)\r
-00AC NOT SIGN\r
- = angled dash (in typography)\r
- x (reversed not sign - 2310)\r
-00AD SOFT HYPHEN\r
- = discretionary hyphen\r
- x (mongolian todo soft hyphen - 1806)\r
-00AE REGISTERED SIGN\r
- = REGISTERED TRADE MARK SIGN\r
-00AF MACRON\r
- = overline, APL overbar\r
- * this is a spacing character\r
- x (modifier letter macron - 02C9)\r
- x (combining macron - 0304)\r
- x (combining overline - 0305)\r
- # 0020 0304\r
-00B0 DEGREE SIGN\r
- * this is a spacing character\r
- x (ring above - 02DA)\r
- x (combining ring above - 030A)\r
- x (superscript zero - 2070)\r
- x (ring operator - 2218)\r
-00B1 PLUS-MINUS SIGN\r
- x (minus-or-plus sign - 2213)\r
-00B2 SUPERSCRIPT TWO\r
- = squared\r
- * other superscript digit characters: 2070-2079\r
- x (superscript one - 00B9)\r
- # <super> 0032\r
-00B3 SUPERSCRIPT THREE\r
- = cubed\r
- x (superscript one - 00B9)\r
- # <super> 0033\r
-00B4 ACUTE ACCENT\r
- * this is a spacing character\r
- x (modifier letter prime - 02B9)\r
- x (modifier letter acute accent - 02CA)\r
- x (combining acute accent - 0301)\r
- x (prime - 2032)\r
- # 0020 0301\r
-00B5 MICRO SIGN\r
- # 03BC greek small letter mu\r
-00B6 PILCROW SIGN\r
- = PARAGRAPH SIGN\r
- * section sign in some European usage\r
- x (reversed pilcrow sign - 204B)\r
- x (curved stem paragraph sign ornament - 2761)\r
-00B7 MIDDLE DOT\r
- = midpoint (in typography)\r
- = Georgian comma\r
- = Greek middle dot\r
- x (bullet - 2022)\r
- x (one dot leader - 2024)\r
- x (hyphenation point - 2027)\r
- x (bullet operator - 2219)\r
- x (dot operator - 22C5)\r
- x (katakana middle dot - 30FB)\r
-00B8 CEDILLA\r
- * this is a spacing character\r
- * other spacing accent characters: 02D8-02DB\r
- x (combining cedilla - 0327)\r
- # 0020 0327\r
-00B9 SUPERSCRIPT ONE\r
- x (superscript two - 00B2)\r
- x (superscript three - 00B3)\r
- # <super> 0031\r
-00BA MASCULINE ORDINAL INDICATOR\r
- * Spanish\r
- # <super> 006F\r
-00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK *\r
- = RIGHT POINTING GUILLEMET\r
- * usually closing, sometimes opening\r
- x (much greater-than - 226B)\r
- x (right double angle bracket - 300B)\r
-00BC VULGAR FRACTION ONE QUARTER\r
- * bar may be horizontal or slanted\r
- * other fraction characters: 2153-215E\r
- # 0031 2044 0034\r
-00BD VULGAR FRACTION ONE HALF\r
- * bar may be horizontal or slanted\r
- # 0031 2044 0032\r
-00BE VULGAR FRACTION THREE QUARTERS\r
- * bar may be horizontal or slanted\r
- # 0033 2044 0034\r
-00BF INVERTED QUESTION MARK\r
- = turned question mark\r
- * Spanish\r
- x (question mark - 003F)\r
-00C0 LATIN CAPITAL LETTER A WITH GRAVE\r
- : 0041 0300\r
-00C1 LATIN CAPITAL LETTER A WITH ACUTE\r
- : 0041 0301\r
-00C2 LATIN CAPITAL LETTER A WITH CIRCUMFLEX\r
- : 0041 0302\r
-00C3 LATIN CAPITAL LETTER A WITH TILDE\r
- : 0041 0303\r
-00C4 LATIN CAPITAL LETTER A WITH DIAERESIS\r
- : 0041 0308\r
-00C5 LATIN CAPITAL LETTER A WITH RING ABOVE\r
- x (angstrom sign - 212B)\r
- : 0041 030A\r
-00C6 LATIN CAPITAL LETTER AE (ash) *\r
- = LATIN CAPITAL LIGATURE AE\r
-00C7 LATIN CAPITAL LETTER C WITH CEDILLA\r
- : 0043 0327\r
-00C8 LATIN CAPITAL LETTER E WITH GRAVE\r
- : 0045 0300\r
-00C9 LATIN CAPITAL LETTER E WITH ACUTE\r
- : 0045 0301\r
-00CA LATIN CAPITAL LETTER E WITH CIRCUMFLEX\r
- : 0045 0302\r
-00CB LATIN CAPITAL LETTER E WITH DIAERESIS\r
- : 0045 0308\r
-00CC LATIN CAPITAL LETTER I WITH GRAVE\r
- : 0049 0300\r
-00CD LATIN CAPITAL LETTER I WITH ACUTE\r
- : 0049 0301\r
-00CE LATIN CAPITAL LETTER I WITH CIRCUMFLEX\r
- : 0049 0302\r
-00CF LATIN CAPITAL LETTER I WITH DIAERESIS\r
- : 0049 0308\r
-00D0 LATIN CAPITAL LETTER ETH (Icelandic)\r
- x (latin small letter eth - 00F0)\r
- x (latin capital letter d with stroke - 0110)\r
- x (latin capital letter african d - 0189)\r
-00D1 LATIN CAPITAL LETTER N WITH TILDE\r
- : 004E 0303\r
-00D2 LATIN CAPITAL LETTER O WITH GRAVE\r
- : 004F 0300\r
-00D3 LATIN CAPITAL LETTER O WITH ACUTE\r
- : 004F 0301\r
-00D4 LATIN CAPITAL LETTER O WITH CIRCUMFLEX\r
- : 004F 0302\r
-00D5 LATIN CAPITAL LETTER O WITH TILDE\r
- : 004F 0303\r
-00D6 LATIN CAPITAL LETTER O WITH DIAERESIS\r
- : 004F 0308\r
-00D7 MULTIPLICATION SIGN\r
- = z notation Cartesian product\r
-00D8 LATIN CAPITAL LETTER O WITH STROKE\r
- = LATIN CAPITAL LETTER O SLASH\r
- x (empty set - 2205)\r
-00D9 LATIN CAPITAL LETTER U WITH GRAVE\r
- : 0055 0300\r
-00DA LATIN CAPITAL LETTER U WITH ACUTE\r
- : 0055 0301\r
-00DB LATIN CAPITAL LETTER U WITH CIRCUMFLEX\r
- : 0055 0302\r
-00DC LATIN CAPITAL LETTER U WITH DIAERESIS\r
- : 0055 0308\r
-00DD LATIN CAPITAL LETTER Y WITH ACUTE\r
- : 0059 0301\r
-00DE LATIN CAPITAL LETTER THORN (Icelandic)\r
-00DF LATIN SMALL LETTER SHARP S (German)\r
- = Eszett\r
- * German\r
- * uppercase is "SS"\r
- * in origin a ligature of 017F and 0073\r
- x (greek small letter beta - 03B2)\r
-00E0 LATIN SMALL LETTER A WITH GRAVE\r
- : 0061 0300\r
-00E1 LATIN SMALL LETTER A WITH ACUTE\r
- : 0061 0301\r
-00E2 LATIN SMALL LETTER A WITH CIRCUMFLEX\r
- : 0061 0302\r
-00E3 LATIN SMALL LETTER A WITH TILDE\r
- * Portuguese\r
- : 0061 0303\r
-00E4 LATIN SMALL LETTER A WITH DIAERESIS\r
- : 0061 0308\r
-00E5 LATIN SMALL LETTER A WITH RING ABOVE\r
- * Danish, Norwegian, Swedish, Walloon\r
- : 0061 030A\r
-00E6 LATIN SMALL LETTER AE (ash) *\r
- = LATIN SMALL LIGATURE AE\r
- = ash (from Old English æsc)\r
- * Danish, Norwegian, Icelandic, Faroese, Old English, French, IPA\r
- x (latin small ligature oe - 0153)\r
- x (cyrillic small ligature a ie - 04D5)\r
-00E7 LATIN SMALL LETTER C WITH CEDILLA\r
- : 0063 0327\r
-00E8 LATIN SMALL LETTER E WITH GRAVE\r
- : 0065 0300\r
-00E9 LATIN SMALL LETTER E WITH ACUTE\r
- : 0065 0301\r
-00EA LATIN SMALL LETTER E WITH CIRCUMFLEX\r
- : 0065 0302\r
-00EB LATIN SMALL LETTER E WITH DIAERESIS\r
- : 0065 0308\r
-00EC LATIN SMALL LETTER I WITH GRAVE\r
- * Italian, Malagasy\r
- : 0069 0300\r
-00ED LATIN SMALL LETTER I WITH ACUTE\r
- : 0069 0301\r
-00EE LATIN SMALL LETTER I WITH CIRCUMFLEX\r
- : 0069 0302\r
-00EF LATIN SMALL LETTER I WITH DIAERESIS\r
- : 0069 0308\r
-00F0 LATIN SMALL LETTER ETH (Icelandic)\r
- * Icelandic, Faroese, Old English, IPA\r
- x (latin capital letter eth - 00D0)\r
- x (greek small letter delta - 03B4)\r
- x (partial differential - 2202)\r
-00F1 LATIN SMALL LETTER N WITH TILDE\r
- : 006E 0303\r
-00F2 LATIN SMALL LETTER O WITH GRAVE\r
- : 006F 0300\r
-00F3 LATIN SMALL LETTER O WITH ACUTE\r
- : 006F 0301\r
-00F4 LATIN SMALL LETTER O WITH CIRCUMFLEX\r
- : 006F 0302\r
-00F5 LATIN SMALL LETTER O WITH TILDE\r
- * Portuguese, Estonian\r
- : 006F 0303\r
-00F6 LATIN SMALL LETTER O WITH DIAERESIS\r
- : 006F 0308\r
-00F7 DIVISION SIGN\r
-00F8 LATIN SMALL LETTER O WITH STROKE\r
- = LATIN SMALL LETTER O SLASH\r
- * Danish, Norwegian, Faroese, IPA\r
-00F9 LATIN SMALL LETTER U WITH GRAVE\r
- * French, Italian\r
- : 0075 0300\r
-00FA LATIN SMALL LETTER U WITH ACUTE\r
- : 0075 0301\r
-00FB LATIN SMALL LETTER U WITH CIRCUMFLEX\r
- : 0075 0302\r
-00FC LATIN SMALL LETTER U WITH DIAERESIS\r
- : 0075 0308\r
-00FD LATIN SMALL LETTER Y WITH ACUTE\r
- * Czech, Slovak, Icelandic, Faroese, Welsh, Malagasy\r
- : 0079 0301\r
-00FE LATIN SMALL LETTER THORN (Icelandic)\r
- * Icelandic, Old English, phonetics\r
- * Runic letter borrowed into Latin script\r
- x (runic letter thurisaz thurs thorn - 16A6)\r
-00FF LATIN SMALL LETTER Y WITH DIAERESIS\r
- * French\r
- x (latin capital letter y with diaeresis - 0178)\r
- : 0079 0308\r
-@@ 0100 Latin Extended-A 017F\r
-@ European Latin\r
-0100 LATIN CAPITAL LETTER A WITH MACRON\r
- : 0041 0304\r
-0101 LATIN SMALL LETTER A WITH MACRON\r
- * Latvian, Latin, ...\r
- : 0061 0304\r
-0102 LATIN CAPITAL LETTER A WITH BREVE\r
- : 0041 0306\r
-0103 LATIN SMALL LETTER A WITH BREVE\r
- * Romanian, Vietnamese, Latin, ...\r
- : 0061 0306\r
-0104 LATIN CAPITAL LETTER A WITH OGONEK\r
- : 0041 0328\r
-0105 LATIN SMALL LETTER A WITH OGONEK\r
- * Polish, Lithuanian, ...\r
- : 0061 0328\r
-0106 LATIN CAPITAL LETTER C WITH ACUTE\r
- : 0043 0301\r
-0107 LATIN SMALL LETTER C WITH ACUTE\r
- * Polish, Croatian, ...\r
- x (cyrillic small letter tshe - 045B)\r
- : 0063 0301\r
-0108 LATIN CAPITAL LETTER C WITH CIRCUMFLEX\r
- : 0043 0302\r
-0109 LATIN SMALL LETTER C WITH CIRCUMFLEX\r
- * Esperanto\r
- : 0063 0302\r
-010A LATIN CAPITAL LETTER C WITH DOT ABOVE\r
- : 0043 0307\r
-010B LATIN SMALL LETTER C WITH DOT ABOVE\r
- * Maltese, Irish Gaelic (old orthography)\r
- : 0063 0307\r
-010C LATIN CAPITAL LETTER C WITH CARON\r
- : 0043 030C\r
-010D LATIN SMALL LETTER C WITH CARON\r
- * Czech, Slovak, Slovenian, and many other languages\r
- : 0063 030C\r
-010E LATIN CAPITAL LETTER D WITH CARON\r
- * the form using caron/hacek is preferred in all contexts\r
- : 0044 030C\r
-010F LATIN SMALL LETTER D WITH CARON\r
- * Czech, Slovak\r
- * the form using apostrophe is preferred in typesetting\r
- : 0064 030C\r
-0110 LATIN CAPITAL LETTER D WITH STROKE\r
- x (latin capital letter eth - 00D0)\r
- x (latin small letter d with stroke - 0111)\r
- x (latin capital letter african d - 0189)\r
-0111 LATIN SMALL LETTER D WITH STROKE\r
- * Croatian, Vietnamese, Sámi\r
- x (latin capital letter d with stroke - 0110)\r
- x (cyrillic small letter dje - 0452)\r
-0112 LATIN CAPITAL LETTER E WITH MACRON\r
- : 0045 0304\r
-0113 LATIN SMALL LETTER E WITH MACRON\r
- * Latvian, Latin, ...\r
- : 0065 0304\r
-0114 LATIN CAPITAL LETTER E WITH BREVE\r
- : 0045 0306\r
-0115 LATIN SMALL LETTER E WITH BREVE\r
- * Malay, Latin, ...\r
- : 0065 0306\r
-0116 LATIN CAPITAL LETTER E WITH DOT ABOVE\r
- : 0045 0307\r
-0117 LATIN SMALL LETTER E WITH DOT ABOVE\r
- * Lithuanian\r
- : 0065 0307\r
-0118 LATIN CAPITAL LETTER E WITH OGONEK\r
- : 0045 0328\r
-0119 LATIN SMALL LETTER E WITH OGONEK\r
- * Polish, Lithuanian, ...\r
- : 0065 0328\r
-011A LATIN CAPITAL LETTER E WITH CARON\r
- : 0045 030C\r
-011B LATIN SMALL LETTER E WITH CARON\r
- * Czech, ...\r
- : 0065 030C\r
-011C LATIN CAPITAL LETTER G WITH CIRCUMFLEX\r
- : 0047 0302\r
-011D LATIN SMALL LETTER G WITH CIRCUMFLEX\r
- * Esperanto\r
- : 0067 0302\r
-011E LATIN CAPITAL LETTER G WITH BREVE\r
- : 0047 0306\r
-011F LATIN SMALL LETTER G WITH BREVE\r
- * Turkish, Azerbaijani\r
- x (latin small letter g with caron - 01E7)\r
- : 0067 0306\r
-0120 LATIN CAPITAL LETTER G WITH DOT ABOVE\r
- : 0047 0307\r
-0121 LATIN SMALL LETTER G WITH DOT ABOVE\r
- * Maltese, Irish Gaelic (old orthography)\r
- : 0067 0307\r
-0122 LATIN CAPITAL LETTER G WITH CEDILLA\r
- : 0047 0327\r
-0123 LATIN SMALL LETTER G WITH CEDILLA\r
- * Latvian\r
- * there are three major glyph variants\r
- : 0067 0327\r
-0124 LATIN CAPITAL LETTER H WITH CIRCUMFLEX\r
- : 0048 0302\r
-0125 LATIN SMALL LETTER H WITH CIRCUMFLEX\r
- * Esperanto\r
- : 0068 0302\r
-0126 LATIN CAPITAL LETTER H WITH STROKE\r
-0127 LATIN SMALL LETTER H WITH STROKE\r
- * Maltese, IPA, ...\r
- x (cyrillic small letter tshe - 045B)\r
- x (planck constant over two pi - 210F)\r
-0128 LATIN CAPITAL LETTER I WITH TILDE\r
- : 0049 0303\r
-0129 LATIN SMALL LETTER I WITH TILDE\r
- * Greenlandic (old orthography)\r
- : 0069 0303\r
-012A LATIN CAPITAL LETTER I WITH MACRON\r
- : 0049 0304\r
-012B LATIN SMALL LETTER I WITH MACRON\r
- * Latvian, Latin, ...\r
- : 0069 0304\r
-012C LATIN CAPITAL LETTER I WITH BREVE\r
- : 0049 0306\r
-012D LATIN SMALL LETTER I WITH BREVE\r
- * Latin, ...\r
- : 0069 0306\r
-012E LATIN CAPITAL LETTER I WITH OGONEK\r
- : 0049 0328\r
-012F LATIN SMALL LETTER I WITH OGONEK\r
- * Lithuanian, ...\r
- : 0069 0328\r
-0130 LATIN CAPITAL LETTER I WITH DOT ABOVE\r
- = LATIN CAPITAL LETTER I DOT\r
- * Turkish, Azerbaijani\r
- * lowercase is 0069\r
- x (latin capital letter i - 0049)\r
- : 0049 0307\r
-0131 LATIN SMALL LETTER DOTLESS I\r
- * Turkish, Azerbaijani\r
- * uppercase is 0049\r
- x (latin small letter i - 0069)\r
-0132 LATIN CAPITAL LIGATURE IJ\r
- # 0049 004A\r
-0133 LATIN SMALL LIGATURE IJ\r
- * Dutch\r
- # 0069 006A\r
-0134 LATIN CAPITAL LETTER J WITH CIRCUMFLEX\r
- : 004A 0302\r
-0135 LATIN SMALL LETTER J WITH CIRCUMFLEX\r
- * Esperanto\r
- : 006A 0302\r
-0136 LATIN CAPITAL LETTER K WITH CEDILLA\r
- : 004B 0327\r
-0137 LATIN SMALL LETTER K WITH CEDILLA\r
- * Latvian\r
- : 006B 0327\r
-0138 LATIN SMALL LETTER KRA (Greenlandic)\r
- * Greenlandic (old orthography)\r
-0139 LATIN CAPITAL LETTER L WITH ACUTE\r
- : 004C 0301\r
-013A LATIN SMALL LETTER L WITH ACUTE\r
- * Slovak\r
- : 006C 0301\r
-013B LATIN CAPITAL LETTER L WITH CEDILLA\r
- : 004C 0327\r
-013C LATIN SMALL LETTER L WITH CEDILLA\r
- * Latvian\r
- : 006C 0327\r
-013D LATIN CAPITAL LETTER L WITH CARON\r
- : 004C 030C\r
-013E LATIN SMALL LETTER L WITH CARON\r
- * Slovak\r
- * the form using apostrophe is preferred in typesetting\r
- : 006C 030C\r
-013F LATIN CAPITAL LETTER L WITH MIDDLE DOT\r
- * some fonts show the middle dot inside the L, but the preferred form has the dot following the L\r
- # 004C 00B7\r
-0140 LATIN SMALL LETTER L WITH MIDDLE DOT\r
- * Catalan\r
- # 006C 00B7\r
-0141 LATIN CAPITAL LETTER L WITH STROKE\r
-0142 LATIN SMALL LETTER L WITH STROKE\r
- * Polish, ...\r
- x (latin small letter l with bar - 019A)\r
-0143 LATIN CAPITAL LETTER N WITH ACUTE\r
- : 004E 0301\r
-0144 LATIN SMALL LETTER N WITH ACUTE\r
- * Polish, ...\r
- : 006E 0301\r
-0145 LATIN CAPITAL LETTER N WITH CEDILLA\r
- : 004E 0327\r
-0146 LATIN SMALL LETTER N WITH CEDILLA\r
- * Latvian\r
- : 006E 0327\r
-0147 LATIN CAPITAL LETTER N WITH CARON\r
- : 004E 030C\r
-0148 LATIN SMALL LETTER N WITH CARON\r
- * Czech, Slovak\r
- : 006E 030C\r
-0149 LATIN SMALL LETTER N PRECEDED BY APOSTROPHE\r
- = LATIN SMALL LETTER APOSTROPHE N\r
- * Afrikaans\r
- * this is not actually a single letter\r
- # 02BC 006E\r
-014A LATIN CAPITAL LETTER ENG (Sami)\r
- * glyph may also have appearance of large form of the small letter\r
-014B LATIN SMALL LETTER ENG (Sami)\r
- * Sámi, Mende, IPA, ...\r
-014C LATIN CAPITAL LETTER O WITH MACRON\r
- : 004F 0304\r
-014D LATIN SMALL LETTER O WITH MACRON\r
- * Latvian, Latin, ...\r
- : 006F 0304\r
-014E LATIN CAPITAL LETTER O WITH BREVE\r
- : 004F 0306\r
-014F LATIN SMALL LETTER O WITH BREVE\r
- * Latin\r
- : 006F 0306\r
-0150 LATIN CAPITAL LETTER O WITH DOUBLE ACUTE\r
- : 004F 030B\r
-0151 LATIN SMALL LETTER O WITH DOUBLE ACUTE\r
- * Hungarian\r
- : 006F 030B\r
-0152 LATIN CAPITAL LIGATURE OE\r
-0153 LATIN SMALL LIGATURE OE\r
- = LATIN SMALL LETTER O E\r
- = ethel (from Old English eðel)\r
- * French, IPA, Old Icelandic, Old English, ...\r
- x (latin small letter ae - 00E6)\r
- x (latin letter small capital oe - 0276)\r
-0154 LATIN CAPITAL LETTER R WITH ACUTE\r
- : 0052 0301\r
-0155 LATIN SMALL LETTER R WITH ACUTE\r
- * Slovak, ...\r
- : 0072 0301\r
-0156 LATIN CAPITAL LETTER R WITH CEDILLA\r
- : 0052 0327\r
-0157 LATIN SMALL LETTER R WITH CEDILLA\r
- * Latvian\r
- : 0072 0327\r
-0158 LATIN CAPITAL LETTER R WITH CARON\r
- : 0052 030C\r
-0159 LATIN SMALL LETTER R WITH CARON\r
- * Czech, ...\r
- : 0072 030C\r
-015A LATIN CAPITAL LETTER S WITH ACUTE\r
- : 0053 0301\r
-015B LATIN SMALL LETTER S WITH ACUTE\r
- * Polish, Indic transliteration, ...\r
- : 0073 0301\r
-015C LATIN CAPITAL LETTER S WITH CIRCUMFLEX\r
- : 0053 0302\r
-015D LATIN SMALL LETTER S WITH CIRCUMFLEX\r
- * Esperanto\r
- : 0073 0302\r
-015E LATIN CAPITAL LETTER S WITH CEDILLA *\r
- : 0053 0327\r
-015F LATIN SMALL LETTER S WITH CEDILLA *\r
- * Turkish, Azerbaijani, Romanian, ...\r
- * this character is used in both Turkish and Romanian data\r
- * a glyph variant with comma below is preferred for Romanian\r
- x (latin small letter s with comma below - 0219)\r
- : 0073 0327\r
-0160 LATIN CAPITAL LETTER S WITH CARON\r
- : 0053 030C\r
-0161 LATIN SMALL LETTER S WITH CARON\r
- * Czech, Estonian, Finnish, Slovak, and many other languages\r
- : 0073 030C\r
-0162 LATIN CAPITAL LETTER T WITH CEDILLA *\r
- : 0054 0327\r
-0163 LATIN SMALL LETTER T WITH CEDILLA *\r
- * Romanian, Semitic transliteration, ...\r
- * this character is used in Romanian data\r
- * a glyph variant with comma below is preferred for Romanian\r
- x (latin small letter t with comma below - 021B)\r
- : 0074 0327\r
-0164 LATIN CAPITAL LETTER T WITH CARON\r
- * the form using caron/hacek is preferred in all contexts\r
- : 0054 030C\r
-0165 LATIN SMALL LETTER T WITH CARON\r
- * Czech, Slovak\r
- * the form using apostrophe is preferred in typesetting\r
- : 0074 030C\r
-0166 LATIN CAPITAL LETTER T WITH STROKE\r
-0167 LATIN SMALL LETTER T WITH STROKE\r
- * Sámi\r
-0168 LATIN CAPITAL LETTER U WITH TILDE\r
- : 0055 0303\r
-0169 LATIN SMALL LETTER U WITH TILDE\r
- * Greenlandic (old orthography)\r
- : 0075 0303\r
-016A LATIN CAPITAL LETTER U WITH MACRON\r
- : 0055 0304\r
-016B LATIN SMALL LETTER U WITH MACRON\r
- * Latvian, Lithuanian, Latin, ...\r
- : 0075 0304\r
-016C LATIN CAPITAL LETTER U WITH BREVE\r
- : 0055 0306\r
-016D LATIN SMALL LETTER U WITH BREVE\r
- * Latin, Esperanto, ...\r
- : 0075 0306\r
-016E LATIN CAPITAL LETTER U WITH RING ABOVE\r
- : 0055 030A\r
-016F LATIN SMALL LETTER U WITH RING ABOVE\r
- * Czech, ...\r
- : 0075 030A\r
-0170 LATIN CAPITAL LETTER U WITH DOUBLE ACUTE\r
- : 0055 030B\r
-0171 LATIN SMALL LETTER U WITH DOUBLE ACUTE\r
- * Hungarian\r
- : 0075 030B\r
-0172 LATIN CAPITAL LETTER U WITH OGONEK\r
- : 0055 0328\r
-0173 LATIN SMALL LETTER U WITH OGONEK\r
- * Lithuanian\r
- : 0075 0328\r
-0174 LATIN CAPITAL LETTER W WITH CIRCUMFLEX\r
- : 0057 0302\r
-0175 LATIN SMALL LETTER W WITH CIRCUMFLEX\r
- * Welsh\r
- : 0077 0302\r
-0176 LATIN CAPITAL LETTER Y WITH CIRCUMFLEX\r
- : 0059 0302\r
-0177 LATIN SMALL LETTER Y WITH CIRCUMFLEX\r
- * Welsh\r
- : 0079 0302\r
-0178 LATIN CAPITAL LETTER Y WITH DIAERESIS\r
- * French, Igbo\r
- x (latin small letter y with diaeresis - 00FF)\r
- : 0059 0308\r
-0179 LATIN CAPITAL LETTER Z WITH ACUTE\r
- : 005A 0301\r
-017A LATIN SMALL LETTER Z WITH ACUTE\r
- * Polish, ...\r
- : 007A 0301\r
-017B LATIN CAPITAL LETTER Z WITH DOT ABOVE\r
- : 005A 0307\r
-017C LATIN SMALL LETTER Z WITH DOT ABOVE\r
- * Polish, ...\r
- : 007A 0307\r
-017D LATIN CAPITAL LETTER Z WITH CARON\r
- : 005A 030C\r
-017E LATIN SMALL LETTER Z WITH CARON\r
- * Czech, Estonian, Finnish, Slovak, Slovenian, and many other languages\r
- : 007A 030C\r
-017F LATIN SMALL LETTER LONG S\r
- * in common use in Roman types until the 18th century\r
- * in current use in Fraktur and Gaelic types\r
- # 0073 latin small letter s\r
-@@ 0180 Latin Extended-B 024F\r
-@ Latin extended-B\r
-0180 LATIN SMALL LETTER B WITH STROKE\r
- * Americanist and Indo-Europeanist usage for phonetic beta\r
- * Old Saxon\r
- x (greek small letter beta - 03B2)\r
- x (blank symbol - 2422)\r
-0181 LATIN CAPITAL LETTER B WITH HOOK\r
- * Zulu, Pan-Nigerian alphabet\r
- x (latin small letter b with hook - 0253)\r
-0182 LATIN CAPITAL LETTER B WITH TOPBAR\r
-0183 LATIN SMALL LETTER B WITH TOPBAR\r
- * Zhuang\r
- * former Soviet minority language scripts\r
- x (cyrillic capital letter be - 0411)\r
-0184 LATIN CAPITAL LETTER TONE SIX\r
-0185 LATIN SMALL LETTER TONE SIX\r
- * Zhuang\r
- * Zhuang tone three is Cyrillic ze\r
- * Zhuang tone four is Cyrillic che\r
- x (latin small letter tone two - 01A8)\r
- x (latin small letter tone five - 01BD)\r
- x (cyrillic small letter ze - 0437)\r
- x (cyrillic small letter che - 0447)\r
- x (cyrillic small letter soft sign - 044C)\r
-0186 LATIN CAPITAL LETTER OPEN O\r
- * typographically a turned C\r
- x (latin small letter open o - 0254)\r
-0187 LATIN CAPITAL LETTER C WITH HOOK\r
-0188 LATIN SMALL LETTER C WITH HOOK\r
- * African\r
-0189 LATIN CAPITAL LETTER AFRICAN D *\r
- * Ewe\r
- x (latin capital letter eth - 00D0)\r
- x (latin capital letter d with stroke - 0110)\r
- x (latin small letter d with tail - 0256)\r
-018A LATIN CAPITAL LETTER D WITH HOOK\r
- * Pan-Nigerian alphabet\r
- x (latin small letter d with hook - 0257)\r
-018B LATIN CAPITAL LETTER D WITH TOPBAR\r
-018C LATIN SMALL LETTER D WITH TOPBAR\r
- * former-Soviet minority language scripts\r
-018D LATIN SMALL LETTER TURNED DELTA\r
- * archaic phonetic for labialized dental fricative\r
- * recommended spellings 007A 02B7 or 007A 032B\r
-018E LATIN CAPITAL LETTER REVERSED E\r
- = LATIN CAPITAL LETTER TURNED E\r
- * Pan-Nigerian alphabet\r
- * lowercase is 01DD\r
-018F LATIN CAPITAL LETTER SCHWA\r
- * Azerbaijani, ...\r
- x (latin small letter schwa - 0259)\r
- x (cyrillic capital letter schwa - 04D8)\r
-0190 LATIN CAPITAL LETTER OPEN E\r
- = LATIN CAPITAL LETTER EPSILON\r
- * African\r
- x (latin small letter open e - 025B)\r
- x (euler constant - 2107)\r
-0191 LATIN CAPITAL LETTER F WITH HOOK\r
- * African\r
-0192 LATIN SMALL LETTER F WITH HOOK\r
- = LATIN SMALL LETTER SCRIPT F\r
- = Florin currency symbol (Netherlands)\r
- = function symbol\r
- = abbreviation convention for folder\r
-0193 LATIN CAPITAL LETTER G WITH HOOK\r
- * African\r
- x (latin small letter g with hook - 0260)\r
-0194 LATIN CAPITAL LETTER GAMMA\r
- * African\r
- x (latin small letter gamma - 0263)\r
-0195 LATIN SMALL LETTER HV (hwair)\r
- * Gothic transliteration\r
- * uppercase is 01F6\r
-0196 LATIN CAPITAL LETTER IOTA\r
- * African\r
- x (latin small letter iota - 0269)\r
-0197 LATIN CAPITAL LETTER I WITH STROKE\r
- = barred i, i bar\r
- * African\r
- * ISO 6438 gives lowercase as 026A, not 0268\r
- x (latin letter small capital i - 026A)\r
-0198 LATIN CAPITAL LETTER K WITH HOOK\r
-0199 LATIN SMALL LETTER K WITH HOOK\r
- * Hausa, Pan-Nigerian alphabet\r
-019A LATIN SMALL LETTER L WITH BAR\r
- = barred l\r
- * Americanist phonetic usage for 026C\r
- x (latin small letter l with stroke - 0142)\r
-019B LATIN SMALL LETTER LAMBDA WITH STROKE\r
- = barred lambda, lambda bar\r
- * Americanist phonetic usage\r
-019C LATIN CAPITAL LETTER TURNED M\r
- * Zhuang\r
- x (latin small letter turned m - 026F)\r
-019D LATIN CAPITAL LETTER N WITH LEFT HOOK\r
- * African\r
- x (latin small letter n with left hook - 0272)\r
-019E LATIN SMALL LETTER N WITH LONG RIGHT LEG\r
- * archaic phonetic for Japanese syllabic "n"\r
- * recommended spelling 006E 0329\r
-019F LATIN CAPITAL LETTER O WITH MIDDLE TILDE *\r
- = barred o, o bar\r
- * lowercase is 0275\r
- * African\r
- x (cyrillic capital letter barred o - 04E8)\r
-01A0 LATIN CAPITAL LETTER O WITH HORN\r
- : 004F 031B\r
-01A1 LATIN SMALL LETTER O WITH HORN\r
- * Vietnamese\r
- : 006F 031B\r
-01A2 LATIN CAPITAL LETTER OI (gha)\r
-01A3 LATIN SMALL LETTER OI (gha)\r
- = gha\r
- * Pan-Turkic Latin alphabets\r
-01A4 LATIN CAPITAL LETTER P WITH HOOK\r
-01A5 LATIN SMALL LETTER P WITH HOOK\r
- * African\r
-01A6 LATIN LETTER YR *\r
- * old Norse\r
- * from German Standard DIN 31624 and ISO 5246-2\r
- * lowercase is 0280\r
-01A7 LATIN CAPITAL LETTER TONE TWO\r
-01A8 LATIN SMALL LETTER TONE TWO\r
- * Zhuang\r
- * typographically a reversed S\r
- x (latin small letter tone six - 0185)\r
-01A9 LATIN CAPITAL LETTER ESH\r
- * African\r
- x (latin small letter esh - 0283)\r
- x (greek capital letter sigma - 03A3)\r
-01AA LATIN LETTER REVERSED ESH LOOP\r
- * archaic phonetic for labialized palatoalveolar or palatal fricative\r
- * Twi\r
- * recommended spellings 0283 02B7, 00E7 02B7, 0068 0265, etc.\r
-01AB LATIN SMALL LETTER T WITH PALATAL HOOK\r
- * archaic phonetic for palatalized alveolar or dental stop\r
- * recommended spelling 0074 02B2\r
-01AC LATIN CAPITAL LETTER T WITH HOOK\r
-01AD LATIN SMALL LETTER T WITH HOOK\r
- * African\r
-01AE LATIN CAPITAL LETTER T WITH RETROFLEX HOOK\r
- * African\r
- x (latin small letter t with retroflex hook - 0288)\r
-01AF LATIN CAPITAL LETTER U WITH HORN\r
- : 0055 031B\r
-01B0 LATIN SMALL LETTER U WITH HORN\r
- * Vietnamese\r
- : 0075 031B\r
-01B1 LATIN CAPITAL LETTER UPSILON\r
- * African\r
- * typographically based on turned capital Greek omega\r
- x (latin small letter upsilon - 028A)\r
- x (inverted ohm sign - 2127)\r
-01B2 LATIN CAPITAL LETTER V WITH HOOK\r
- = LATIN CAPITAL LETTER SCRIPT V\r
- * African\r
- x (latin small letter v with hook - 028B)\r
-01B3 LATIN CAPITAL LETTER Y WITH HOOK\r
-01B4 LATIN SMALL LETTER Y WITH HOOK\r
- * Bini, Esoko, and other Edo languages in West Africa\r
-01B5 LATIN CAPITAL LETTER Z WITH STROKE\r
-01B6 LATIN SMALL LETTER Z WITH STROKE\r
- = barred z, z bar\r
- * Pan-Turkic Latin orthography\r
- * handwritten variant of Latin "z"\r
- x (latin small letter z - 007A)\r
-01B7 LATIN CAPITAL LETTER EZH\r
- * African, Skolt Sámi\r
- * lowercase is 0292\r
- x (latin capital letter yogh - 021C)\r
- x (cyrillic capital letter abkhasian dze - 04E0)\r
-01B8 LATIN CAPITAL LETTER EZH REVERSED\r
-01B9 LATIN SMALL LETTER EZH REVERSED\r
- * archaic phonetic for voiced pharyngeal fricative\r
- * sometimes typographically rendered with a turned digit 3\r
- * recommended spelling 0295\r
- x (latin letter pharyngeal voiced fricative - 0295)\r
- x (arabic letter ain - 0639)\r
-01BA LATIN SMALL LETTER EZH WITH TAIL\r
- * archaic phonetic for labialized voiced palatoalveolar or palatal fricative\r
- * Twi\r
- * recommended spellings 0292 02B7 or 006A 02B7\r
-01BB LATIN LETTER TWO WITH STROKE\r
- * archaic phonetic for [dz] affricate\r
- * recommended spellings 0292 or 0064 007A\r
-01BC LATIN CAPITAL LETTER TONE FIVE\r
-01BD LATIN SMALL LETTER TONE FIVE\r
- * Zhuang\r
- x (latin small letter tone six - 0185)\r
-01BE LATIN LETTER INVERTED GLOTTAL STOP WITH STROKE\r
- * archaic phonetic for [ts] affricate\r
- * recommended spelling 0074 0073\r
- * letter form is actually derived from ligation of ts, rather than inverted glottal stop\r
-01BF LATIN LETTER WYNN\r
- = wen\r
- * Runic letter borrowed into Latin script\r
- * replaced by "w" in modern transcriptions of Old English\r
- * uppercase is 01F7\r
- x (runic letter wunjo wynn w - 16B9)\r
-01C0 LATIN LETTER DENTAL CLICK\r
- = pipe\r
- * Khoisan tradition\r
- * "c" in Zulu orthography\r
- x (solidus - 002F)\r
- x (vertical line - 007C)\r
- x (latin small letter turned t - 0287)\r
- x (divides - 2223)\r
-01C1 LATIN LETTER LATERAL CLICK\r
- = double pipe\r
- * Khoisan tradition\r
- * "x" in Zulu orthography\r
- x (latin letter inverted glottal stop - 0296)\r
- x (parallel to - 2225)\r
-01C2 LATIN LETTER ALVEOLAR CLICK\r
- = double-barred pipe\r
- * Khoisan tradition\r
- x (not equal to - 2260)\r
-01C3 LATIN LETTER RETROFLEX CLICK\r
- = LATIN LETTER EXCLAMATION MARK\r
- * Khoisan tradition\r
- * "q" in Zulu orthography\r
- x (exclamation mark - 0021)\r
- x (latin letter stretched c - 0297)\r
-@ Croatian digraphs matching Serbian Cyrillic letters\r
-01C4 LATIN CAPITAL LETTER DZ WITH CARON\r
- # 0044 017D\r
-01C5 LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON\r
- # 0044 017E\r
-01C6 LATIN SMALL LETTER DZ WITH CARON\r
- x (cyrillic small letter dzhe - 045F)\r
- # 0064 017E\r
-01C7 LATIN CAPITAL LETTER LJ\r
- # 004C 004A\r
-01C8 LATIN CAPITAL LETTER L WITH SMALL LETTER J\r
- # 004C 006A\r
-01C9 LATIN SMALL LETTER LJ\r
- x (cyrillic small letter lje - 0459)\r
- # 006C 006A\r
-01CA LATIN CAPITAL LETTER NJ\r
- # 004E 004A\r
-01CB LATIN CAPITAL LETTER N WITH SMALL LETTER J\r
- # 004E 006A\r
-01CC LATIN SMALL LETTER NJ\r
- x (cyrillic small letter nje - 045A)\r
- # 006E 006A\r
-@ Pinyin diacritic-vowel combinations\r
-01CD LATIN CAPITAL LETTER A WITH CARON\r
- : 0041 030C\r
-01CE LATIN SMALL LETTER A WITH CARON\r
- * Pinyin third tone\r
- : 0061 030C\r
-01CF LATIN CAPITAL LETTER I WITH CARON\r
- : 0049 030C\r
-01D0 LATIN SMALL LETTER I WITH CARON\r
- * Pinyin third tone\r
- : 0069 030C\r
-01D1 LATIN CAPITAL LETTER O WITH CARON\r
- : 004F 030C\r
-01D2 LATIN SMALL LETTER O WITH CARON\r
- * Pinyin third tone\r
- : 006F 030C\r
-01D3 LATIN CAPITAL LETTER U WITH CARON\r
- : 0055 030C\r
-01D4 LATIN SMALL LETTER U WITH CARON\r
- * Pinyin third tone\r
- : 0075 030C\r
-01D5 LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON\r
- : 00DC 0304\r
-01D6 LATIN SMALL LETTER U WITH DIAERESIS AND MACRON\r
- * Pinyin first tone\r
- : 00FC 0304\r
-01D7 LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE\r
- : 00DC 0301\r
-01D8 LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE\r
- * Pinyin second tone\r
- : 00FC 0301\r
-01D9 LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON\r
- : 00DC 030C\r
-01DA LATIN SMALL LETTER U WITH DIAERESIS AND CARON\r
- * Pinyin third tone\r
- : 00FC 030C\r
-01DB LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE\r
- : 00DC 0300\r
-01DC LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE\r
- * Pinyin fourth tone\r
- : 00FC 0300\r
-@ Additions\r
-01DD LATIN SMALL LETTER TURNED E\r
- * Pan-Nigerian alphabet\r
- * all other usages of schwa are 0259\r
- * uppercase is 018E\r
- x (latin small letter schwa - 0259)\r
-01DE LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON\r
- : 00C4 0304\r
-01DF LATIN SMALL LETTER A WITH DIAERESIS AND MACRON\r
- * Livonian, Uralicist usage\r
- : 00E4 0304\r
-01E0 LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON\r
- : 0226 0304\r
-01E1 LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON\r
- * Uralicist usage\r
- : 0227 0304\r
-01E2 LATIN CAPITAL LETTER AE WITH MACRON (ash) *\r
- : 00C6 0304\r
-01E3 LATIN SMALL LETTER AE WITH MACRON (ash) *\r
- * Old Norse, Old English\r
- : 00E6 0304\r
-01E4 LATIN CAPITAL LETTER G WITH STROKE\r
-01E5 LATIN SMALL LETTER G WITH STROKE\r
- * Skolt Sámi\r
-01E6 LATIN CAPITAL LETTER G WITH CARON\r
- : 0047 030C\r
-01E7 LATIN SMALL LETTER G WITH CARON\r
- * Skolt Sámi\r
- x (latin small letter g with breve - 011F)\r
- : 0067 030C\r
-01E8 LATIN CAPITAL LETTER K WITH CARON\r
- : 004B 030C\r
-01E9 LATIN SMALL LETTER K WITH CARON\r
- * Skolt Sámi\r
- : 006B 030C\r
-01EA LATIN CAPITAL LETTER O WITH OGONEK\r
- : 004F 0328\r
-01EB LATIN SMALL LETTER O WITH OGONEK\r
- * Sámi, Iroquoian, Old Icelandic\r
- : 006F 0328\r
-01EC LATIN CAPITAL LETTER O WITH OGONEK AND MACRON\r
- : 01EA 0304\r
-01ED LATIN SMALL LETTER O WITH OGONEK AND MACRON\r
- * Old Icelandic\r
- : 01EB 0304\r
-01EE LATIN CAPITAL LETTER EZH WITH CARON\r
- : 01B7 030C\r
-01EF LATIN SMALL LETTER EZH WITH CARON\r
- * Skolt Sámi\r
- : 0292 030C\r
-01F0 LATIN SMALL LETTER J WITH CARON\r
- * IPA and many languages\r
- : 006A 030C\r
-01F1 LATIN CAPITAL LETTER DZ\r
- # 0044 005A\r
-01F2 LATIN CAPITAL LETTER D WITH SMALL LETTER Z\r
- # 0044 007A\r
-01F3 LATIN SMALL LETTER DZ\r
- # 0064 007A\r
-01F4 LATIN CAPITAL LETTER G WITH ACUTE\r
- : 0047 0301\r
-01F5 LATIN SMALL LETTER G WITH ACUTE\r
- * Macedonian and Serbian transliteration\r
- : 0067 0301\r
-01F6 LATIN CAPITAL LETTER HWAIR\r
- * lowercase is 0195\r
-01F7 LATIN CAPITAL LETTER WYNN\r
- = wen\r
- * lowercase is 01BF\r
-01F8 LATIN CAPITAL LETTER N WITH GRAVE\r
- : 004E 0300\r
-01F9 LATIN SMALL LETTER N WITH GRAVE\r
- * Pinyin\r
- : 006E 0300\r
-01FA LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE\r
- : 00C5 0301\r
-01FB LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE\r
- : 00E5 0301\r
-01FC LATIN CAPITAL LETTER AE WITH ACUTE (ash) *\r
- : 00C6 0301\r
-01FD LATIN SMALL LETTER AE WITH ACUTE (ash) *\r
- : 00E6 0301\r
-01FE LATIN CAPITAL LETTER O WITH STROKE AND ACUTE\r
- : 00D8 0301\r
-01FF LATIN SMALL LETTER O WITH STROKE AND ACUTE\r
- : 00F8 0301\r
-@ Additions for Slovenian and Croatian\r
-0200 LATIN CAPITAL LETTER A WITH DOUBLE GRAVE\r
- : 0041 030F\r
-0201 LATIN SMALL LETTER A WITH DOUBLE GRAVE\r
- : 0061 030F\r
-0202 LATIN CAPITAL LETTER A WITH INVERTED BREVE\r
- : 0041 0311\r
-0203 LATIN SMALL LETTER A WITH INVERTED BREVE\r
- : 0061 0311\r
-0204 LATIN CAPITAL LETTER E WITH DOUBLE GRAVE\r
- : 0045 030F\r
-0205 LATIN SMALL LETTER E WITH DOUBLE GRAVE\r
- : 0065 030F\r
-0206 LATIN CAPITAL LETTER E WITH INVERTED BREVE\r
- : 0045 0311\r
-0207 LATIN SMALL LETTER E WITH INVERTED BREVE\r
- : 0065 0311\r
-0208 LATIN CAPITAL LETTER I WITH DOUBLE GRAVE\r
- : 0049 030F\r
-0209 LATIN SMALL LETTER I WITH DOUBLE GRAVE\r
- : 0069 030F\r
-020A LATIN CAPITAL LETTER I WITH INVERTED BREVE\r
- : 0049 0311\r
-020B LATIN SMALL LETTER I WITH INVERTED BREVE\r
- : 0069 0311\r
-020C LATIN CAPITAL LETTER O WITH DOUBLE GRAVE\r
- : 004F 030F\r
-020D LATIN SMALL LETTER O WITH DOUBLE GRAVE\r
- : 006F 030F\r
-020E LATIN CAPITAL LETTER O WITH INVERTED BREVE\r
- : 004F 0311\r
-020F LATIN SMALL LETTER O WITH INVERTED BREVE\r
- : 006F 0311\r
-0210 LATIN CAPITAL LETTER R WITH DOUBLE GRAVE\r
- : 0052 030F\r
-0211 LATIN SMALL LETTER R WITH DOUBLE GRAVE\r
- : 0072 030F\r
-0212 LATIN CAPITAL LETTER R WITH INVERTED BREVE\r
- : 0052 0311\r
-0213 LATIN SMALL LETTER R WITH INVERTED BREVE\r
- : 0072 0311\r
-0214 LATIN CAPITAL LETTER U WITH DOUBLE GRAVE\r
- : 0055 030F\r
-0215 LATIN SMALL LETTER U WITH DOUBLE GRAVE\r
- : 0075 030F\r
-0216 LATIN CAPITAL LETTER U WITH INVERTED BREVE\r
- : 0055 0311\r
-0217 LATIN SMALL LETTER U WITH INVERTED BREVE\r
- : 0075 0311\r
-@ Additions for Romanian\r
-0218 LATIN CAPITAL LETTER S WITH COMMA BELOW *\r
- : 0053 0326\r
-0219 LATIN SMALL LETTER S WITH COMMA BELOW *\r
- * Romanian, when distinct comma below form is required\r
- x (latin small letter s with cedilla - 015F)\r
- : 0073 0326\r
-021A LATIN CAPITAL LETTER T WITH COMMA BELOW *\r
- : 0054 0326\r
-021B LATIN SMALL LETTER T WITH COMMA BELOW *\r
- * Romanian, when distinct comma below form is required\r
- x (latin small letter t with cedilla - 0163)\r
- : 0074 0326\r
-@ Miscellaneous additions\r
-021C LATIN CAPITAL LETTER YOGH\r
- x (latin capital letter ezh - 01B7)\r
-021D LATIN SMALL LETTER YOGH\r
- * Middle English, Scots\r
- x (latin small letter ezh - 0292)\r
- x (ounce sign - 2125)\r
-021E LATIN CAPITAL LETTER H WITH CARON\r
- : 0048 030C\r
-021F LATIN SMALL LETTER H WITH CARON\r
- * Finnish Romany\r
- : 0068 030C\r
-0222 LATIN CAPITAL LETTER OU\r
-0223 LATIN SMALL LETTER OU\r
- * Algonquin, Huron\r
- x (digit eight - 0038)\r
-0224 LATIN CAPITAL LETTER Z WITH HOOK\r
-0225 LATIN SMALL LETTER Z WITH HOOK\r
- * Middle High German\r
-0226 LATIN CAPITAL LETTER A WITH DOT ABOVE\r
- : 0041 0307\r
-0227 LATIN SMALL LETTER A WITH DOT ABOVE\r
- * Uralicist usage\r
- : 0061 0307\r
-0228 LATIN CAPITAL LETTER E WITH CEDILLA\r
- : 0045 0327\r
-0229 LATIN SMALL LETTER E WITH CEDILLA\r
- : 0065 0327\r
-@ Additions for Livonian\r
-022A LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON\r
- : 00D6 0304\r
-022B LATIN SMALL LETTER O WITH DIAERESIS AND MACRON\r
- * Livonian\r
- : 00F6 0304\r
-022C LATIN CAPITAL LETTER O WITH TILDE AND MACRON\r
- : 00D5 0304\r
-022D LATIN SMALL LETTER O WITH TILDE AND MACRON\r
- * Livonian\r
- : 00F5 0304\r
-022E LATIN CAPITAL LETTER O WITH DOT ABOVE\r
- : 004F 0307\r
-022F LATIN SMALL LETTER O WITH DOT ABOVE\r
- * Livonian\r
- : 006F 0307\r
-0230 LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON\r
- : 022E 0304\r
-0231 LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON\r
- * Livonian\r
- : 022F 0304\r
-0232 LATIN CAPITAL LETTER Y WITH MACRON\r
- : 0059 0304\r
-0233 LATIN SMALL LETTER Y WITH MACRON\r
- * Livonian, Cornish\r
- : 0079 0304\r
-@@ 0250 IPA Extensions 02AF\r
-@ IPA extensions\r
-@+ IPA includes basic Latin letters and a number of Latin letters from other blocks.\r
- x (latin small letter ae - 00E6)\r
- x (latin small letter c with cedilla - 00E7)\r
- x (latin small letter eth - 00F0)\r
- x (latin small letter o with stroke - 00F8)\r
- x (latin small letter h with stroke - 0127)\r
- x (latin small letter eng - 014B)\r
- x (latin small ligature oe - 0153)\r
- x (greek small letter beta - 03B2)\r
- x (greek small letter theta - 03B8)\r
- x (greek small letter lamda - 03BB)\r
- x (greek small letter chi - 03C7)\r
-0250 LATIN SMALL LETTER TURNED A\r
- * low central unrounded vowel\r
-0251 LATIN SMALL LETTER ALPHA\r
- = LATIN SMALL LETTER SCRIPT A\r
- * low back unrounded vowel\r
- x (greek small letter alpha - 03B1)\r
-0252 LATIN SMALL LETTER TURNED ALPHA\r
- * low back rounded vowel\r
-0253 LATIN SMALL LETTER B WITH HOOK\r
- * implosive bilabial stop\r
- * Pan-Nigerian alphabet\r
- x (latin capital letter b with hook - 0181)\r
-0254 LATIN SMALL LETTER OPEN O\r
- * typographically a turned c\r
- * lower-mid back rounded vowel\r
- x (latin capital letter open o - 0186)\r
-0255 LATIN SMALL LETTER C WITH CURL\r
- * voiceless alveolo-palatal laminal fricative\r
- * used in transcription of Mandarin Chinese\r
- * sound spelled with 015B in Polish\r
-0256 LATIN SMALL LETTER D WITH TAIL\r
- = LATIN SMALL LETTER D RETROFLEX HOOK\r
- * voiced retroflex stop\r
- x (latin capital letter african d - 0189)\r
-0257 LATIN SMALL LETTER D WITH HOOK\r
- * implosive dental or alveolar stop\r
- * Ewe, Pan-Nigerian alphabet\r
- x (latin capital letter d with hook - 018A)\r
-0258 LATIN SMALL LETTER REVERSED E\r
- * upper-mid central unrounded vowel\r
-0259 LATIN SMALL LETTER SCHWA\r
- * mid-central unrounded vowel\r
- * variant uppercase form 018E is associated with 01DD\r
- x (latin capital letter schwa - 018F)\r
- x (latin small letter turned e - 01DD)\r
- x (cyrillic small letter schwa - 04D9)\r
-025A LATIN SMALL LETTER SCHWA WITH HOOK\r
- * rhotacized schwa\r
-025B LATIN SMALL LETTER OPEN E\r
- = LATIN SMALL LETTER EPSILON\r
- * lower-mid front unrounded vowel\r
- x (latin capital letter open e - 0190)\r
- x (greek small letter epsilon - 03B5)\r
-025C LATIN SMALL LETTER REVERSED OPEN E\r
- * lower-mid central unrounded vowel\r
-025D LATIN SMALL LETTER REVERSED OPEN E WITH HOOK\r
- * rhotacized lower-mid central vowel\r
-025E LATIN SMALL LETTER CLOSED REVERSED OPEN E\r
- = LATIN SMALL LETTER CLOSED REVERSED EPSILON\r
- * lower-mid central rounded vowel\r
-025F LATIN SMALL LETTER DOTLESS J WITH STROKE\r
- * voiced palatal stop\r
- * typographically a turned f, but better thought of as a form of j\r
- * "gy" in Hungarian orthography\r
- * also archaic phonetic for palatoalveolar affricate 02A4\r
-0260 LATIN SMALL LETTER G WITH HOOK\r
- * implosive velar stop\r
- x (latin capital letter g with hook - 0193)\r
-0261 LATIN SMALL LETTER SCRIPT G\r
- * voiced velar stop\r
- x (latin small letter g - 0067)\r
-0262 LATIN LETTER SMALL CAPITAL G\r
- * voiced uvular stop\r
-0263 LATIN SMALL LETTER GAMMA\r
- * voiced velar fricative\r
- x (latin capital letter gamma - 0194)\r
- x (greek small letter gamma - 03B3)\r
-0264 LATIN SMALL LETTER RAMS HORN\r
- = LATIN SMALL LETTER BABY GAMMA\r
- * upper-mid back unrounded vowel\r
-0265 LATIN SMALL LETTER TURNED H\r
- * voiced rounded palatal approximant\r
-0266 LATIN SMALL LETTER H WITH HOOK\r
- * breathy-voiced glottal fricative\r
- x (modifier letter small h with hook - 02B1)\r
-0267 LATIN SMALL LETTER HENG WITH HOOK\r
- * voiceless coarticulated velar and palatoalveolar fricative\r
- * "tj" or "kj" or "sj" in some Swedish dialects\r
-0268 LATIN SMALL LETTER I WITH STROKE\r
- = barred i, i bar\r
- * high central unrounded vowel\r
- * ISO 6438 gives lowercase of 0197 as 026A, not 0268\r
-0269 LATIN SMALL LETTER IOTA\r
- * semi-high front unrounded vowel\r
-@+ * obsoleted by IPA in 1989\r
- * preferred use is 026A LATIN LETTER SMALL CAPITAL I\r
- x (latin capital letter iota - 0196)\r
- x (greek small letter iota - 03B9)\r
-026A LATIN LETTER SMALL CAPITAL I\r
- * semi-high front unrounded vowel\r
- * preferred IPA alternate for 0269\r
- x (latin capital letter i with stroke - 0197)\r
-026B LATIN SMALL LETTER L WITH MIDDLE TILDE\r
- * velarized voiced alveolar lateral approximant\r
-026C LATIN SMALL LETTER L WITH BELT\r
- * voiceless alveolar lateral fricative\r
-026D LATIN SMALL LETTER L WITH RETROFLEX HOOK\r
- * voiced retroflex lateral\r
-026E LATIN SMALL LETTER LEZH\r
- * voiced lateral fricative\r
- * "dhl" in Zulu orthography\r
-026F LATIN SMALL LETTER TURNED M\r
- * high back unrounded vowel\r
- x (latin capital letter turned m - 019C)\r
-0270 LATIN SMALL LETTER TURNED M WITH LONG LEG\r
- * voiced velar approximant\r
-0271 LATIN SMALL LETTER M WITH HOOK\r
- * voiced labiodental nasal\r
-0272 LATIN SMALL LETTER N WITH LEFT HOOK\r
- * voiced palatal nasal\r
- x (latin capital letter n with left hook - 019D)\r
-0273 LATIN SMALL LETTER N WITH RETROFLEX HOOK\r
- * voiced retroflex nasal\r
-0274 LATIN LETTER SMALL CAPITAL N\r
- * voiced uvular nasal\r
-0275 LATIN SMALL LETTER BARRED O\r
- = o bar\r
- * rounded mid-central vowel, i.e. rounded schwa\r
- * uppercase is 019F\r
- x (greek small letter theta - 03B8)\r
- x (cyrillic small letter fita - 0473)\r
- x (cyrillic small letter barred o - 04E9)\r
-0276 LATIN LETTER SMALL CAPITAL OE\r
- * low front rounded vowel\r
- x (latin small ligature oe - 0153)\r
-0277 LATIN SMALL LETTER CLOSED OMEGA\r
- * semi-high back rounded vowel\r
-@+ * obsoleted by IPA in 1989\r
- * preferred use is 028A latin small letter upsilon\r
-0278 LATIN SMALL LETTER PHI\r
- * voiceless bilabial fricative\r
- x (greek small letter phi - 03C6)\r
-0279 LATIN SMALL LETTER TURNED R\r
- * voiced alveolar approximant\r
- x (modifier letter small turned r - 02B4)\r
-027A LATIN SMALL LETTER TURNED R WITH LONG LEG\r
- * voiced lateral flap\r
-027B LATIN SMALL LETTER TURNED R WITH HOOK\r
- * voiced retroflex approximant\r
- x (modifier letter small turned r with hook - 02B5)\r
-027C LATIN SMALL LETTER R WITH LONG LEG\r
- * voiced strident apico-alveolar trill\r
-@+ * obsoleted by IPA in 1989\r
- * sound spelled with 0159 in Czech\r
- * preferred phonetic representation for Czech is 0072 031D\r
- * in current use in Gaelic types (as glyph variant of 0072)\r
-027D LATIN SMALL LETTER R WITH TAIL\r
- * voiced retroflex flap\r
-027E LATIN SMALL LETTER R WITH FISHHOOK\r
- * voiced alveolar flap or tap\r
-027F LATIN SMALL LETTER REVERSED R WITH FISHHOOK\r
- * apical dental vowel\r
- * used in Sinological tradition\r
- * IPA spelling - 007A 0329\r
-0280 LATIN LETTER SMALL CAPITAL R *\r
- * voiced uvular trill\r
- * Germanic, Old Norse\r
- * uppercase is 01A6\r
-0281 LATIN LETTER SMALL CAPITAL INVERTED R\r
- * voiced uvular fricative or approximant\r
- x (modifier letter small capital inverted r - 02B6)\r
-0282 LATIN SMALL LETTER S WITH HOOK\r
- * voiceless retroflex fricative\r
-0283 LATIN SMALL LETTER ESH\r
- * voiceless postalveolar fricative\r
- x (latin capital letter esh - 01A9)\r
- x (integral - 222B)\r
-0284 LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK\r
- * implosive palatal stop\r
- * typographically based on 025F, not on 0283\r
-0285 LATIN SMALL LETTER SQUAT REVERSED ESH\r
- * apical retroflex vowel\r
- * used in Sinological tradition\r
- * IPA spelling - 0290 0329\r
-0286 LATIN SMALL LETTER ESH WITH CURL\r
- * palatalized voiceless postalveolar fricative\r
- * suggested spelling - 0283 02B2\r
-0287 LATIN SMALL LETTER TURNED T\r
- * dental click (sound of "tsk tsk")\r
- x (latin letter dental click - 01C0)\r
-0288 LATIN SMALL LETTER T WITH RETROFLEX HOOK\r
- * voiceless retroflex stop\r
- x (latin capital letter t with retroflex hook - 01AE)\r
-0289 LATIN SMALL LETTER U BAR\r
- * high central rounded vowel\r
-028A LATIN SMALL LETTER UPSILON\r
- * semi-high back rounded vowel\r
- * preferred IPA alternate to 0277\r
- x (latin capital letter upsilon - 01B1)\r
- x (greek small letter upsilon - 03C5)\r
-028B LATIN SMALL LETTER V WITH HOOK\r
- = LATIN SMALL LETTER SCRIPT V\r
- * voiced labiodental approximant\r
- x (latin capital letter v with hook - 01B2)\r
- x (greek small letter upsilon - 03C5)\r
-028C LATIN SMALL LETTER TURNED V\r
- = caret, wedge\r
- * lower-mid back unrounded vowel\r
- x (greek capital letter lamda - 039B)\r
- x (caret - 2038)\r
- x (logical and - 2227)\r
-028D LATIN SMALL LETTER TURNED W\r
- * voiceless rounded labiovelar approximant\r
-028E LATIN SMALL LETTER TURNED Y\r
- * voiced lateral approximant\r
-028F LATIN LETTER SMALL CAPITAL Y\r
- * semi-high front rounded vowel\r
-0290 LATIN SMALL LETTER Z WITH RETROFLEX HOOK\r
- * voiced retroflex fricative\r
-0291 LATIN SMALL LETTER Z WITH CURL\r
- * voiced alveolo-palatal laminal fricative\r
- * sound spelled with 017A in Polish\r
-0292 LATIN SMALL LETTER EZH\r
- = LATIN SMALL LETTER YOGH\r
- = dram\r
- * voiced postalveolar fricative\r
- * uppercase is 01B7\r
- * Skolt Sámi\r
- x (latin small letter yogh - 021D)\r
- x (cyrillic small letter abkhasian dze - 04E1)\r
- x (ounce sign - 2125)\r
-0293 LATIN SMALL LETTER EZH WITH CURL\r
- * palatalized voiced postalveolar fricative\r
-0294 LATIN LETTER GLOTTAL STOP\r
- x (modifier letter glottal stop - 02C0)\r
-0295 LATIN LETTER PHARYNGEAL VOICED FRICATIVE\r
- = LATIN LETTER REVERSED GLOTTAL STOP\r
- * voiced pharyngeal fricative\r
- * ain\r
- x (latin small letter ezh reversed - 01B9)\r
- x (modifier letter reversed glottal stop - 02C1)\r
-0296 LATIN LETTER INVERTED GLOTTAL STOP\r
- * lateral click\r
- x (latin letter lateral click - 01C1)\r
-0297 LATIN LETTER STRETCHED C\r
- * palatal (or alveolar) click\r
- x (latin letter retroflex click - 01C3)\r
- x (complement - 2201)\r
-0298 LATIN LETTER BILABIAL CLICK\r
- = LATIN LETTER BULLSEYE\r
- x (circled dot operator - 2299)\r
-0299 LATIN LETTER SMALL CAPITAL B\r
- * bilabial trill\r
-029A LATIN SMALL LETTER CLOSED OPEN E\r
- = LATIN SMALL LETTER CLOSED EPSILON\r
- * lower-mid front rounded vowel\r
- * non-IPA alternate for the preferred 0153\r
-029B LATIN LETTER SMALL CAPITAL G WITH HOOK\r
- * voiced uvular implosive\r
-029C LATIN LETTER SMALL CAPITAL H\r
- * voiceless epiglottal fricative\r
-029D LATIN SMALL LETTER J WITH CROSSED-TAIL\r
- * voiced palatal fricative\r
-029E LATIN SMALL LETTER TURNED K\r
- * proposed for velar click\r
-@+ * withdrawn by IPA in 1970\r
-029F LATIN LETTER SMALL CAPITAL L\r
- * velar lateral approximant\r
-02A0 LATIN SMALL LETTER Q WITH HOOK\r
- * voiceless uvular implosive\r
-02A1 LATIN LETTER GLOTTAL STOP WITH STROKE\r
- * voiced epiglottal stop\r
-02A2 LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE\r
- * voiced epiglottal fricative\r
-02A3 LATIN SMALL LETTER DZ DIGRAPH\r
- * voiced dental affricate\r
-02A4 LATIN SMALL LETTER DEZH DIGRAPH\r
- * voiced postalveolar affricate\r
-02A5 LATIN SMALL LETTER DZ DIGRAPH WITH CURL\r
- * voiced alveolo-palatal affricate\r
-02A6 LATIN SMALL LETTER TS DIGRAPH\r
- * voiceless dental affricate\r
-02A7 LATIN SMALL LETTER TESH DIGRAPH\r
- * voiceless postalveolar affricate\r
-02A8 LATIN SMALL LETTER TC DIGRAPH WITH CURL\r
- * voiceless alveolo-palatal affricate\r
-@ IPA characters for disordered speech\r
-02A9 LATIN SMALL LETTER FENG DIGRAPH\r
- * velopharyngeal fricative\r
-02AA LATIN SMALL LETTER LS DIGRAPH\r
- * lateral alveolar fricative (lisp)\r
-02AB LATIN SMALL LETTER LZ DIGRAPH\r
- * voiced lateral alveolar fricative\r
-02AC LATIN LETTER BILABIAL PERCUSSIVE\r
- * audible lip smack\r
-02AD LATIN LETTER BIDENTAL PERCUSSIVE\r
- * audible teeth gnashing\r
-@@ 02B0 Spacing Modifier Letters 02FF\r
-@ Phonetic modifiers derived from Latin letters\r
-02B0 MODIFIER LETTER SMALL H\r
- * aspiration\r
- # <super> 0068\r
-02B1 MODIFIER LETTER SMALL H WITH HOOK\r
- * breathy voiced, murmured\r
- x (latin small letter h with hook - 0266)\r
- x (combining diaeresis below - 0324)\r
- # <super> 0266\r
-02B2 MODIFIER LETTER SMALL J\r
- * palatalization\r
- x (combining palatalized hook below - 0321)\r
- # <super> 006A\r
-02B3 MODIFIER LETTER SMALL R\r
- # <super> 0072\r
-02B4 MODIFIER LETTER SMALL TURNED R\r
- x (latin small letter turned r - 0279)\r
- # <super> 0279\r
-02B5 MODIFIER LETTER SMALL TURNED R WITH HOOK\r
- x (latin small letter turned r with hook - 027B)\r
- # <super> 027B\r
-02B6 MODIFIER LETTER SMALL CAPITAL INVERTED R\r
- * preceding four used for r-coloring or r-offglides\r
- x (latin letter small capital inverted r - 0281)\r
- # <super> 0281\r
-02B7 MODIFIER LETTER SMALL W\r
- * labialization\r
- x (combining inverted double arch below - 032B)\r
- # <super> 0077\r
-02B8 MODIFIER LETTER SMALL Y\r
- * palatalization\r
- * common Americanist substitution for 02B2\r
- # <super> 0079\r
-@ Miscellaneous phonetic modifiers\r
-02B9 MODIFIER LETTER PRIME\r
- * primary stress, emphasis\r
- * transliteration of mjagkij znak (Cyrillic soft sign: palatalization)\r
- x (apostrophe - 0027)\r
- x (acute accent - 00B4)\r
- x (modifier letter acute accent - 02CA)\r
- x (combining acute accent - 0301)\r
- x (greek numeral sign - 0374)\r
- x (prime - 2032)\r
-02BA MODIFIER LETTER DOUBLE PRIME\r
- * exaggerated stress, contrastive stress\r
- * transliteration of tverdyj znak (Cyrillic hard sign: no palatalization)\r
- x (quotation mark - 0022)\r
- x (combining double acute accent - 030B)\r
- x (double prime - 2033)\r
-02BB MODIFIER LETTER TURNED COMMA\r
- * typographical alternate for 02BD or 02BF\r
- x (combining turned comma above - 0312)\r
- x (left single quotation mark - 2018)\r
-02BC MODIFIER LETTER APOSTROPHE\r
- = apostrophe\r
- * glottal stop, glottalization, ejective\r
- * spacing clone of Greek smooth breathing mark\r
- * many languages use this as a letter of their alphabets\r
- x (apostrophe - 0027)\r
- x (combining comma above - 0313)\r
- x (combining comma above right - 0315)\r
- x (armenian apostrophe - 055A)\r
- x (right single quotation mark - 2019)\r
-02BD MODIFIER LETTER REVERSED COMMA\r
- * weak aspiration\r
- * spacing clone of Greek rough breathing mark\r
- x (combining reversed comma above - 0314)\r
- x (armenian modifier letter left half ring - 0559)\r
- x (single high-reversed-9 quotation mark - 201B)\r
-02BE MODIFIER LETTER RIGHT HALF RING\r
- * transliteration of Arabic hamza (glottal stop)\r
- x (armenian apostrophe - 055A)\r
- x (arabic letter hamza - 0621)\r
-02BF MODIFIER LETTER LEFT HALF RING\r
- * transliteration of Arabic ain (voiced pharyngeal fricative)\r
- x (armenian modifier letter left half ring - 0559)\r
- x (arabic letter ain - 0639)\r
-02C0 MODIFIER LETTER GLOTTAL STOP\r
- * ejective or glottalized\r
- * typographical alternate for 02BC or 02BE\r
- x (latin letter glottal stop - 0294)\r
- x (combining hook above - 0309)\r
-02C1 MODIFIER LETTER REVERSED GLOTTAL STOP\r
- * typographical alternate for 02BF\r
- x (latin letter pharyngeal voiced fricative - 0295)\r
-02C2 MODIFIER LETTER LEFT ARROWHEAD\r
- * fronted articulation\r
-02C3 MODIFIER LETTER RIGHT ARROWHEAD\r
- * backed articulation\r
-02C4 MODIFIER LETTER UP ARROWHEAD\r
- * raised articulation\r
- x (circumflex accent - 005E)\r
- x (up arrowhead - 2303)\r
-02C5 MODIFIER LETTER DOWN ARROWHEAD\r
- * lowered articulation\r
-02C6 MODIFIER LETTER CIRCUMFLEX ACCENT\r
- * rising-falling tone, falling tone, secondary stress, etc.\r
- x (circumflex accent - 005E)\r
- x (combining circumflex accent - 0302)\r
-02C7 CARON (Mandarin Chinese third tone)\r
- = hacek\r
- * falling-rising tone\r
- * Mandarin Chinese third tone\r
- x (combining caron - 030C)\r
-02C8 MODIFIER LETTER VERTICAL LINE\r
- * primary stress, downstep\r
- * precedes letter or syllable modified\r
- x (apostrophe - 0027)\r
- x (combining vertical line above - 030D)\r
-02C9 MODIFIER LETTER MACRON (Mandarin Chinese first tone)\r
- * high level tone\r
- * precedes or follows letter or syllable modified\r
- * Mandarin Chinese first tone\r
- x (macron - 00AF)\r
- x (combining macron - 0304)\r
-02CA MODIFIER LETTER ACUTE ACCENT (Mandarin Chinese second tone)\r
- * high-rising tone (IPA), high tone, primary stress\r
- * Mandarin Chinese second tone\r
- x (acute accent - 00B4)\r
- x (modifier letter prime - 02B9)\r
- x (combining acute accent - 0301)\r
- x (greek numeral sign - 0374)\r
- x (armenian emphasis mark - 055B)\r
-02CB MODIFIER LETTER GRAVE ACCENT (Mandarin Chinese fourth tone)\r
- * high-falling tone (IPA), low tone, secondary or tertiary stress\r
- * Mandarin Chinese fourth tone\r
- x (grave accent - 0060)\r
- x (combining grave accent - 0300)\r
- x (armenian comma - 055D)\r
-02CC MODIFIER LETTER LOW VERTICAL LINE\r
- * secondary stress\r
- * precedes letter or syllable modified\r
- x (combining vertical line below - 0329)\r
-02CD MODIFIER LETTER LOW MACRON\r
- * low level tone\r
- x (low line - 005F)\r
- x (combining macron below - 0331)\r
-02CE MODIFIER LETTER LOW GRAVE ACCENT\r
- * low-falling tone\r
-02CF MODIFIER LETTER LOW ACUTE ACCENT\r
- * low-rising tone\r
- x (greek lower numeral sign - 0375)\r
-02D0 MODIFIER LETTER TRIANGULAR COLON\r
- * length mark\r
- x (colon - 003A)\r
-02D1 MODIFIER LETTER HALF TRIANGULAR COLON\r
- * half-length mark\r
- x (middle dot - 00B7)\r
-02D2 MODIFIER LETTER CENTRED RIGHT HALF RING\r
- * more rounded articulation\r
-02D3 MODIFIER LETTER CENTRED LEFT HALF RING\r
- * less rounded articulation\r
-02D4 MODIFIER LETTER UP TACK\r
- * vowel raising or closing\r
- x (combining up tack below - 031D)\r
- x (combining dot below - 0323)\r
-02D5 MODIFIER LETTER DOWN TACK\r
- * vowel lowering or opening\r
- x (combining left half ring below - 031C)\r
- x (combining down tack below - 031E)\r
-02D6 MODIFIER LETTER PLUS SIGN\r
- * advanced or fronted articulation\r
- x (combining plus sign below - 031F)\r
-02D7 MODIFIER LETTER MINUS SIGN\r
- * retracted or backed articulation\r
- * glyph may have small end-serifs\r
- x (combining minus sign below - 0320)\r
-@ Spacing clones of diacritics\r
-02D8 BREVE\r
- x (combining breve - 0306)\r
- # 0020 0306\r
-02D9 DOT ABOVE (Mandarin Chinese light tone)\r
- * Mandarin Chinese fifth tone (light or neutral)\r
- x (combining dot above - 0307)\r
- # 0020 0307\r
-02DA RING ABOVE\r
- x (degree sign - 00B0)\r
- x (combining ring above - 030A)\r
- # 0020 030A\r
-02DB OGONEK\r
- x (combining ogonek - 0328)\r
- # 0020 0328\r
-02DC SMALL TILDE\r
- x (tilde - 007E)\r
- x (combining tilde - 0303)\r
- x (tilde operator - 223C)\r
- # 0020 0303\r
-02DD DOUBLE ACUTE ACCENT\r
- x (combining double acute accent - 030B)\r
- # 0020 030B\r
-@ Additions based on 1989 IPA\r
-02DE MODIFIER LETTER RHOTIC HOOK\r
- * rhotacization in vowel\r
- * often ligated: 025A = 0259 + 02DE; 025D = 025C + 02DE\r
-02DF MODIFIER LETTER CROSS ACCENT\r
- * Swedish grave accent\r
-02E0 MODIFIER LETTER SMALL GAMMA\r
- * these modifier letters are occasionally used in transcription of affricates\r
- # <super> 0263\r
-02E1 MODIFIER LETTER SMALL L\r
- # <super> 006C\r
-02E2 MODIFIER LETTER SMALL S\r
- # <super> 0073\r
-02E3 MODIFIER LETTER SMALL X\r
- # <super> 0078\r
-02E4 MODIFIER LETTER SMALL REVERSED GLOTTAL STOP\r
- # <super> 0295\r
-@ Tone letters\r
-02E5 MODIFIER LETTER EXTRA-HIGH TONE BAR\r
-02E6 MODIFIER LETTER HIGH TONE BAR\r
-02E7 MODIFIER LETTER MID TONE BAR\r
-02E8 MODIFIER LETTER LOW TONE BAR\r
-02E9 MODIFIER LETTER EXTRA-LOW TONE BAR\r
-02EA MODIFIER LETTER YIN DEPARTING TONE MARK\r
-02EB MODIFIER LETTER YANG DEPARTING TONE MARK\r
-@ IPA modifiers\r
-02EC MODIFIER LETTER VOICING\r
-02ED MODIFIER LETTER UNASPIRATED\r
-@ Other modifier letters\r
-02EE MODIFIER LETTER DOUBLE APOSTROPHE\r
-\r
-2000 EN QUAD\r
- : 2002 en space\r
-2001 EM QUAD\r
- = mutton quad\r
- : 2003 em space\r
-2002 EN SPACE\r
- = nut\r
- * half an em\r
- # 0020 space\r
-2003 EM SPACE\r
- = mutton\r
- * nominally, a space equal to the type size in points\r
- * may scale by the condensation factor of a font\r
- # 0020 space\r
-2004 THREE-PER-EM SPACE\r
- = thick space\r
- # 0020 space\r
-2005 FOUR-PER-EM SPACE\r
- = mid space\r
- # 0020 space\r
-2006 SIX-PER-EM SPACE\r
- * in computer typography sometimes equated to thin space\r
- # 0020 space\r
-2007 FIGURE SPACE\r
- * space equal to tabular width of a font\r
- * this is equivalent to the digit width of fonts with fixed-width digits\r
- # <noBreak> 0020\r
-2008 PUNCTUATION SPACE\r
- * space equal to narrow punctuation of a font\r
- # 0020 space\r
-2009 THIN SPACE\r
- * a fifth of an em (or sometimes a sixth)\r
- # 0020 space\r
-200A HAIR SPACE\r
- * thinner than a thin space\r
- * in traditional typography, the thinnest space available\r
- # 0020 space\r
-200B ZERO WIDTH SPACE\r
- * nominally zero width, but may expand in justification\r
-@ Formatting characters\r
-200C ZERO WIDTH NON-JOINER\r
- = ZWNJ\r
-200D ZERO WIDTH JOINER\r
- = ZWJ\r
-200E LEFT-TO-RIGHT MARK\r
- = LRM\r
-200F RIGHT-TO-LEFT MARK\r
- = RLM\r
-@ Dashes\r
-2010 HYPHEN\r
- x (hyphen-minus - 002D)\r
-2011 NON-BREAKING HYPHEN\r
- x (hyphen-minus - 002D)\r
- # <noBreak> 2010\r
-2012 FIGURE DASH\r
-2013 EN DASH\r
-2014 EM DASH\r
- * may be used in pairs to offset parenthetical text\r
- x (katakana-hiragana prolonged sound mark - 30FC)\r
-2015 HORIZONTAL BAR\r
- = QUOTATION DASH\r
- * long dash introducing quoted text\r
-@ General punctuation\r
-2016 DOUBLE VERTICAL LINE\r
- * used in pairs to indicate norm of a matrix\r
- x (parallel to - 2225)\r
-2017 DOUBLE LOW LINE\r
- * this is a spacing character\r
- x (low line - 005F)\r
- x (combining double low line - 0333)\r
- # 0020 0333\r
-2018 LEFT SINGLE QUOTATION MARK\r
- = SINGLE TURNED COMMA QUOTATION MARK\r
- * this is the preferred glyph (as opposed to 201B)\r
- x (apostrophe - 0027)\r
- x (modifier letter turned comma - 02BB)\r
- x (heavy single turned comma quotation mark ornament - 275B)\r
-2019 RIGHT SINGLE QUOTATION MARK\r
- = SINGLE COMMA QUOTATION MARK\r
- * this is the preferred character to use for apostrophe\r
- x (apostrophe - 0027)\r
- x (modifier letter apostrophe - 02BC)\r
- x (heavy single comma quotation mark ornament - 275C)\r
-201A SINGLE LOW-9 QUOTATION MARK\r
- = LOW SINGLE COMMA QUOTATION MARK\r
- * used as opening single quotation mark in some languages\r
-201B SINGLE HIGH-REVERSED-9 QUOTATION MARK\r
- = SINGLE REVERSED COMMA QUOTATION MARK\r
- * glyph variant of 2018\r
- x (modifier letter reversed comma - 02BD)\r
-201C LEFT DOUBLE QUOTATION MARK\r
- = DOUBLE TURNED COMMA QUOTATION MARK\r
- * this is the preferred glyph (as opposed to 201F)\r
- x (quotation mark - 0022)\r
- x (heavy double turned comma quotation mark ornament - 275D)\r
- x (reversed double prime quotation mark - 301D)\r
-201D RIGHT DOUBLE QUOTATION MARK\r
- = DOUBLE COMMA QUOTATION MARK\r
- x (quotation mark - 0022)\r
- x (double prime - 2033)\r
- x (heavy double comma quotation mark ornament - 275E)\r
- x (double prime quotation mark - 301E)\r
-201E DOUBLE LOW-9 QUOTATION MARK\r
- = LOW DOUBLE COMMA QUOTATION MARK\r
- * used as opening double quotation mark in some languages\r
- x (low double prime quotation mark - 301F)\r
-201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK\r
- = DOUBLE REVERSED COMMA QUOTATION MARK\r
- * glyph variant of 201C\r
-2020 DAGGER\r
- = obelisk, obelus, long cross\r
-2021 DOUBLE DAGGER\r
- = diesis, double obelisk\r
-2022 BULLET\r
- = black small circle\r
- x (middle dot - 00B7)\r
- x (one dot leader - 2024)\r
- x (bullet operator - 2219)\r
- x (inverse bullet - 25D8)\r
- x (white bullet - 25E6)\r
-2023 TRIANGULAR BULLET\r
- x (end of proof - 220E)\r
- x (black right-pointing small triangle - 25B8)\r
-2024 ONE DOT LEADER\r
- x (middle dot - 00B7)\r
- x (bullet - 2022)\r
- x (bullet operator - 2219)\r
- # 002E full stop\r
-2025 TWO DOT LEADER\r
- # 002E 002E\r
-2026 HORIZONTAL ELLIPSIS\r
- = three dot leader\r
- x (vertical ellipsis - 22EE)\r
- # 002E 002E 002E\r
-2027 HYPHENATION POINT\r
-@ Formatting characters\r
-2028 LINE SEPARATOR\r
- * may be used to represent this semantic unambiguously\r
-2029 PARAGRAPH SEPARATOR\r
- * may be used to represent this semantic unambiguously\r
-202A LEFT-TO-RIGHT EMBEDDING\r
- = LRE\r
-202B RIGHT-TO-LEFT EMBEDDING\r
- = RLE\r
-202C POP DIRECTIONAL FORMATTING\r
- = PDF\r
-202D LEFT-TO-RIGHT OVERRIDE\r
- = LRO\r
-202E RIGHT-TO-LEFT OVERRIDE\r
- = RLO\r
-202F NARROW NO-BREAK SPACE\r
- x (no-break space - 00A0)\r
- # <noBreak> 0020\r
-@ General punctuation\r
-2030 PER MILLE SIGN\r
- x (percent sign - 0025)\r
-2031 PER TEN THOUSAND SIGN\r
- x (percent sign - 0025)\r
-2032 PRIME\r
- = minutes, feet\r
- x (apostrophe - 0027)\r
- x (acute accent - 00B4)\r
- x (modifier letter prime - 02B9)\r
-2033 DOUBLE PRIME\r
- = seconds, inches\r
- x (quotation mark - 0022)\r
- x (modifier letter double prime - 02BA)\r
- x (right double quotation mark - 201D)\r
- x (ditto mark - 3003)\r
- x (double prime quotation mark - 301E)\r
- # 2032 2032\r
-2034 TRIPLE PRIME\r
- # 2032 2032 2032\r
-2035 REVERSED PRIME\r
- x (grave accent - 0060)\r
-2036 REVERSED DOUBLE PRIME\r
- x (reversed double prime quotation mark - 301D)\r
- # 2035 2035\r
-2037 REVERSED TRIPLE PRIME\r
- # 2035 2035 2035\r
-2038 CARET\r
- x (up arrowhead - 2303)\r
-2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK\r
- = LEFT POINTING SINGLE GUILLEMET\r
- * usually opening, sometimes closing\r
- x (less-than sign - 003C)\r
- x (left-pointing angle bracket - 2329)\r
- x (left angle bracket - 3008)\r
-203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK\r
- = RIGHT POINTING SINGLE GUILLEMET\r
- * usually closing, sometimes opening\r
- x (greater-than sign - 003E)\r
- x (right-pointing angle bracket - 232A)\r
- x (right angle bracket - 3009)\r
-203B REFERENCE MARK\r
- = Japanese kome\r
- = Urdu paragraph separator\r
- x (tibetan ku ru kha bzhi mig can - 0FBF)\r
-203C DOUBLE EXCLAMATION MARK\r
- x (exclamation mark - 0021)\r
- # 0021 0021\r
-203D INTERROBANG\r
- x (exclamation mark - 0021)\r
- x (question mark - 003F)\r
-203E OVERLINE\r
- = SPACING OVERSCORE\r
- # 0020 0305\r
-203F UNDERTIE (Enotikon)\r
- = Greek enotikon\r
- x (smile - 2323)\r
-2040 CHARACTER TIE\r
- x (frown - 2322)\r
-2041 CARET INSERTION POINT\r
- * proofreader's mark: insert here\r
- x (right semidirect product - 22CC)\r
-2042 ASTERISM\r
-2043 HYPHEN BULLET\r
-2044 FRACTION SLASH\r
- = solidus (in typography)\r
- * for composing arbitrary fractions\r
- x (solidus - 002F)\r
- x (division slash - 2215)\r
-2045 LEFT SQUARE BRACKET WITH QUILL\r
-2046 RIGHT SQUARE BRACKET WITH QUILL\r
-2048 QUESTION EXCLAMATION MARK\r
- * designed for use in vertical text\r
- # 003F 0021\r
-2049 EXCLAMATION QUESTION MARK\r
- * designed for use in vertical text\r
- # 0021 003F\r
-204A TIRONIAN SIGN ET\r
- * Irish Gaelic, ...\r
-204B REVERSED PILCROW SIGN\r
- x (pilcrow sign - 00B6)\r
-204C BLACK LEFTWARDS BULLET\r
-204D BLACK RIGHTWARDS BULLET\r
-@ Deprecated\r
-206A INHIBIT SYMMETRIC SWAPPING\r
-206B ACTIVATE SYMMETRIC SWAPPING\r
-206C INHIBIT ARABIC FORM SHAPING\r
-206D ACTIVATE ARABIC FORM SHAPING\r
-206E NATIONAL DIGIT SHAPES\r
-206F NOMINAL DIGIT SHAPES\r
-@@ 2070 Superscripts and Subscripts 209F\r
-@ Superscripts\r
-2070 SUPERSCRIPT ZERO\r
- # <super> 0030\r
-2071 <reserved>\r
- x (superscript one - 00B9)\r
-2072 <reserved>\r
- x (superscript two - 00B2)\r
-2073 <reserved>\r
- x (superscript three - 00B3)\r
-2074 SUPERSCRIPT FOUR\r
- # <super> 0034\r
-2075 SUPERSCRIPT FIVE\r
- # <super> 0035\r
-2076 SUPERSCRIPT SIX\r
- # <super> 0036\r
-2077 SUPERSCRIPT SEVEN\r
- # <super> 0037\r
-2078 SUPERSCRIPT EIGHT\r
- # <super> 0038\r
-2079 SUPERSCRIPT NINE\r
- # <super> 0039\r
-207A SUPERSCRIPT PLUS SIGN\r
- # <super> 002B\r
-207B SUPERSCRIPT MINUS\r
- # <super> 2212\r
-207C SUPERSCRIPT EQUALS SIGN\r
- # <super> 003D\r
-207D SUPERSCRIPT LEFT PARENTHESIS\r
- # <super> 0028\r
-207E SUPERSCRIPT RIGHT PARENTHESIS\r
- # <super> 0029\r
-207F SUPERSCRIPT LATIN SMALL LETTER N\r
- # <super> 006E\r
-@ Subscripts\r
-2080 SUBSCRIPT ZERO\r
- # <sub> 0030\r
-2081 SUBSCRIPT ONE\r
- # <sub> 0031\r
-2082 SUBSCRIPT TWO\r
- # <sub> 0032\r
-2083 SUBSCRIPT THREE\r
- # <sub> 0033\r
-2084 SUBSCRIPT FOUR\r
- # <sub> 0034\r
-2085 SUBSCRIPT FIVE\r
- # <sub> 0035\r
-2086 SUBSCRIPT SIX\r
- # <sub> 0036\r
-2087 SUBSCRIPT SEVEN\r
- # <sub> 0037\r
-2088 SUBSCRIPT EIGHT\r
- # <sub> 0038\r
-2089 SUBSCRIPT NINE\r
- # <sub> 0039\r
-208A SUBSCRIPT PLUS SIGN\r
- # <sub> 002B\r
-208B SUBSCRIPT MINUS\r
- # <sub> 2212\r
-208C SUBSCRIPT EQUALS SIGN\r
- # <sub> 003D\r
-208D SUBSCRIPT LEFT PARENTHESIS\r
- # <sub> 0028\r
-208E SUBSCRIPT RIGHT PARENTHESIS\r
- # <sub> 0029\r
-@@ 20A0 Currency Symbols 20CF\r
-@ Currency symbols\r
-@+ A number of currency symbols are found in other blocks.\r
- x (dollar sign - 0024)\r
- x (cent sign - 00A2)\r
- x (pound sign - 00A3)\r
- x (currency sign - 00A4)\r
- x (yen sign - 00A5)\r
- x (bengali rupee mark - 09F2)\r
- x (bengali rupee sign - 09F3)\r
- x (thai currency symbol baht - 0E3F)\r
- x (khmer currency symbol riel - 17DB)\r
-20A0 EURO-CURRENCY SIGN\r
- * intended for ECU, but not widely used\r
- * historical character, this is NOT the euro!\r
- x (euro sign - 20AC)\r
-20A1 COLON SIGN\r
- * Costa Rica, El Salvador\r
-20A2 CRUZEIRO SIGN\r
- * Brazil\r
-20A3 FRENCH FRANC SIGN\r
- * France\r
-20A4 LIRA SIGN\r
- * Italy, Turkey\r
- x (pound sign - 00A3)\r
-20A5 MILL SIGN\r
- * USA (1/10 cent)\r
-20A6 NAIRA SIGN\r
- * Nigeria\r
-20A7 PESETA SIGN\r
- * Spain\r
-20A8 RUPEE SIGN\r
- * India\r
- # 0052 0073\r
-20A9 WON SIGN\r
- * Korea\r
-20AA NEW SHEQEL SIGN\r
- * Israel\r
-20AB DONG SIGN\r
- * Vietnam\r
-20AC EURO SIGN\r
- * currency sign for the European Monetary Union\r
- * euro, not ECU\r
- x (euro-currency sign - 20A0)\r
-20AD KIP SIGN\r
- * Laos\r
-20AE TUGRIK SIGN\r
- * Mongolia\r
- * also transliterated as tugrug, tugric, tugrog, togrog\r
-20AF DRACHMA SIGN\r
- * Greece\r
-@@ 20D0 Combining Diacritical Marks for Symbols 20FF\r
-@ Combining diacritical marks for symbols\r
-20D0 COMBINING LEFT HARPOON ABOVE\r
-20D1 COMBINING RIGHT HARPOON ABOVE\r
- * vector\r
-20D2 COMBINING LONG VERTICAL LINE OVERLAY\r
-20D3 COMBINING SHORT VERTICAL LINE OVERLAY\r
- * negation\r
-20D4 COMBINING ANTICLOCKWISE ARROW ABOVE\r
-20D5 COMBINING CLOCKWISE ARROW ABOVE\r
- * rotation\r
-20D6 COMBINING LEFT ARROW ABOVE\r
-20D7 COMBINING RIGHT ARROW ABOVE\r
- * vector\r
-20D8 COMBINING RING OVERLAY\r
-20D9 COMBINING CLOCKWISE RING OVERLAY\r
-20DA COMBINING ANTICLOCKWISE RING OVERLAY\r
-20DB COMBINING THREE DOTS ABOVE\r
- = third derivative\r
-20DC COMBINING FOUR DOTS ABOVE\r
- = fourth derivative\r
-@ Enclosing diacritics\r
-20DD COMBINING ENCLOSING CIRCLE\r
- = JIS composition circle\r
- x (white circle - 25CB)\r
- x (large circle - 25EF)\r
- x (ideographic number zero - 3007)\r
-20DE COMBINING ENCLOSING SQUARE\r
- x (white square - 25A1)\r
-20DF COMBINING ENCLOSING DIAMOND\r
- x (white diamond - 25C7)\r
-20E0 COMBINING ENCLOSING CIRCLE BACKSLASH\r
- * prohibition\r
-@ Additional diacritical mark for symbols\r
-20E1 COMBINING LEFT RIGHT ARROW ABOVE\r
- * tensor\r
-@ Additional enclosing diacritics\r
-20E2 COMBINING ENCLOSING SCREEN\r
- x (clear screen symbol - 239A)\r
-20E3 COMBINING ENCLOSING KEYCAP\r
-\r
-*/\r
-\r
+//
+// CHARNAMES.CPP
+//
+// A header file that links Unicode character names to character numbers.
+// by James L. Hammons
+// (C) 2004 Underground Software
+//
+// JLH = James L. Hammons <jlhamm@acm.org>
+//
+// Who When What
+// --- ---------- -------------------------------------------------------------
+// JLH ??/??/200? Created this file
+//
+
+unsigned char macStdNames[] = {	// Packed glyph-name table: 258 records, each one length byte followed by that many name characters (no per-record terminator). NOTE(review): name and ordering suggest the standard Macintosh glyph set of the TrueType post table -- confirm against the code that reads it.
+ "\x06""notdef"	// record 0. NOTE(review): no leading dot here, unlike .null on the next line; the TrueType post table lists this name as .notdef -- confirm the spelling is intended.
+ "\x05"".null"	// The empty literal break after the length byte ends the hex escape; without it a following hex-digit letter (a-f, A-F) would be absorbed into the escape.
+ "\x02""CR"
+ "\x05""space"	// record 3
+ "\x06""exclam"
+ "\x08""quotedbl"
+ "\x0A""numbersign"
+ "\x06""dollar"
+ "\x07""percent"
+ "\x09""ampersand"
+ "\x0B""quotesingle"
+ "\x09""parenleft"
+ "\x0A""parenright"
+ "\x08""asterisk"
+ "\x04""plus"
+ "\x05""comma"
+ "\x06""hyphen"
+ "\x06""period"
+ "\x05""slash"
+ "\x04""zero"
+ "\x03""one"
+ "\x03""two"
+ "\x05""three"
+ "\x04""four"
+ "\x04""five"
+ "\x03""six"
+ "\x05""seven"
+ "\x05""eight"
+ "\x04""nine"
+ "\x05""colon"
+ "\x09""semicolon"
+ "\x04""less"
+ "\x05""equal"
+ "\x07""greater"
+ "\x08""question"
+ "\x02""at"
+ "\x01""A"	// record 36: upper-case letters start here
+ "\x01""B"
+ "\x01""C"
+ "\x01""D"
+ "\x01""E"
+ "\x01""F"
+ "\x01""G"
+ "\x01""H"
+ "\x01""I"
+ "\x01""J"
+ "\x01""K"
+ "\x01""L"
+ "\x01""M"
+ "\x01""N"
+ "\x01""O"
+ "\x01""P"
+ "\x01""Q"
+ "\x01""R"
+ "\x01""S"
+ "\x01""T"
+ "\x01""U"
+ "\x01""V"
+ "\x01""W"
+ "\x01""X"
+ "\x01""Y"
+ "\x01""Z"
+ "\x0B""bracketleft"
+ "\x09""backslash"
+ "\x0C""bracketright"
+ "\x0B""asciicircum"
+ "\x0A""underscore"
+ "\x05""grave"
+ "\x01""a"	// record 68: lower-case letters start here
+ "\x01""b"
+ "\x01""c"
+ "\x01""d"
+ "\x01""e"
+ "\x01""f"
+ "\x01""g"
+ "\x01""h"
+ "\x01""i"
+ "\x01""j"
+ "\x01""k"
+ "\x01""l"
+ "\x01""m"
+ "\x01""n"
+ "\x01""o"
+ "\x01""p"
+ "\x01""q"
+ "\x01""r"
+ "\x01""s"
+ "\x01""t"
+ "\x01""u"
+ "\x01""v"
+ "\x01""w"
+ "\x01""x"
+ "\x01""y"
+ "\x01""z"
+ "\x09""braceleft"
+ "\x03""bar"
+ "\x0A""braceright"
+ "\x0A""asciitilde"
+ "\x09""Adieresis"	// record 98: accented and symbol names follow
+ "\x05""Aring"
+ "\x08""Ccedilla"
+ "\x06""Eacute"
+ "\x06""Ntilde"
+ "\x09""Odieresis"
+ "\x09""Udieresis"
+ "\x06""aacute"
+ "\x06""agrave"
+ "\x0B""acircumflex"
+ "\x09""adieresis"
+ "\x06""atilde"
+ "\x05""aring"
+ "\x08""ccedilla"
+ "\x06""eacute"
+ "\x06""egrave"
+ "\x0B""ecircumflex"
+ "\x09""edieresis"
+ "\x06""iacute"
+ "\x06""igrave"
+ "\x0B""icircumflex"
+ "\x09""idieresis"
+ "\x06""ntilde"
+ "\x06""oacute"
+ "\x06""ograve"
+ "\x0B""ocircumflex"
+ "\x09""odieresis"
+ "\x06""otilde"
+ "\x06""uacute"
+ "\x06""ugrave"
+ "\x0B""ucircumflex"
+ "\x09""udieresis"
+ "\x06""dagger"
+ "\x06""degree"
+ "\x04""cent"
+ "\x08""sterling"
+ "\x07""section"
+ "\x06""bullet"
+ "\x09""paragraph"
+ "\x0A""germandbls"
+ "\x0A""registered"
+ "\x09""copyright"
+ "\x09""trademark"
+ "\x05""acute"
+ "\x08""dieresis"
+ "\x08""notequal"
+ "\x02""AE"
+ "\x06""Oslash"
+ "\x08""infinity"
+ "\x09""plusminus"
+ "\x09""lessequal"
+ "\x0C""greaterequal"
+ "\x03""yen"
+ "\x03""mu1"
+ "\x0B""partialdiff"
+ "\x09""summation"
+ "\x07""product"
+ "\x02""pi"
+ "\x08""integral"
+ "\x0B""ordfeminine"
+ "\x0C""ordmasculine"
+ "\x03""Ohm"
+ "\x02""ae"
+ "\x06""oslash"
+ "\x0C""questiondown"
+ "\x0A""exclamdown"
+ "\x0A""logicalnot"
+ "\x07""radical"
+ "\x06""florin"
+ "\x0B""approxequal"
+ "\x09""increment"
+ "\x0D""guillemotleft"
+ "\x0E""guillemotright"
+ "\x08""ellipsis"
+ "\x07""nbspace"
+ "\x06""Agrave"
+ "\x06""Atilde"
+ "\x06""Otilde"
+ "\x02""OE"
+ "\x02""oe"
+ "\x06""endash"
+ "\x06""emdash"
+ "\x0C""quotedblleft"
+ "\x0D""quotedblright"
+ "\x09""quoteleft"
+ "\x0A""quoteright"
+ "\x06""divide"
+ "\x07""lozenge"
+ "\x09""ydieresis"
+ "\x09""Ydieresis"
+ "\x08""fraction"
+ "\x08""currency"
+ "\x0D""guilsinglleft"
+ "\x0E""guilsinglright"
+ "\x02""fi"
+ "\x02""fl"
+ "\x09""daggerdbl"
+ "\x0E""periodcentered"
+ "\x0E""quotesinglbase"
+ "\x0C""quotedblbase"
+ "\x0B""perthousand"
+ "\x0B""Acircumflex"
+ "\x0B""Ecircumflex"
+ "\x06""Aacute"
+ "\x09""Edieresis"
+ "\x06""Egrave"
+ "\x06""Iacute"
+ "\x0B""Icircumflex"
+ "\x09""Idieresis"
+ "\x06""Igrave"
+ "\x06""Oacute"
+ "\x0B""Ocircumflex"
+ "\x09""applelogo"
+ "\x06""Ograve"
+ "\x06""Uacute"
+ "\x0B""Ucircumflex"
+ "\x06""Ugrave"
+ "\x08""dotlessi"
+ "\x0A""circumflex"
+ "\x05""tilde"
+ "\x09""overscore"
+ "\x05""breve"
+ "\x09""dotaccent"
+ "\x04""ring"
+ "\x07""cedilla"
+ "\x0C""hungarumlaut"
+ "\x06""ogonek"
+ "\x05""caron"
+ "\x06""Lslash"
+ "\x06""lslash"
+ "\x06""Scaron"
+ "\x06""scaron"
+ "\x06""Zcaron"
+ "\x06""zcaron"
+ "\x09""brokenbar"
+ "\x03""Eth"
+ "\x03""eth"
+ "\x06""Yacute"
+ "\x06""yacute"
+ "\x05""Thorn"
+ "\x05""thorn"
+ "\x05""minus"
+ "\x08""multiply"
+ "\x0B""onesuperior"
+ "\x0B""twosuperior"
+ "\x0D""threesuperior"
+ "\x07""onehalf"
+ "\x0A""onequarter"
+ "\x0D""threequarters"
+ "\x05""franc"
+ "\x06""Gbreve"
+ "\x06""gbreve"
+ "\x04""Idot"
+ "\x08""Scedilla"
+ "\x08""scedilla"
+ "\x06""Cacute"
+ "\x06""cacute"
+ "\x06""Ccaron"
+ "\x06""ccaron"
+ "\x07""dmacron"	// record 257: last record
+};	// Being initialised from a string literal, the array also holds one terminating NUL byte after the last record.
+
+/*struct unicodeChar
+{
+ int cNum;
+
+};*/
+
+unsigned char unicodeChars[] = {	// Packed name table: each record is two leading bytes, then a lower-case character name, then an explicit NUL.
+ "\x00\x20""space\0"	// The two leading bytes look like the character number, high byte first (0x0020 here) -- TODO confirm with the code that reads this table. The literal break after them ends the hex escape before the name text.
+ "\x00\x21""exclamation mark\0"
+ "\x00\x22""quotation mark\0"
+ "\x00\x23""number sign\0"	// Last record present. NOTE(review): the table looks unfinished -- the name list in the comment that follows carries on from 0023.
+
+};	// The string-literal initialiser appends one more NUL, so the data ends with two consecutive NUL bytes.
+
+/*
+
+0023 NUMBER SIGN
+ = pound sign, hash, crosshatch, octothorpe
+0024 DOLLAR SIGN
+ = milreis, escudo
+ * glyph may have one or two vertical bars
+ * other currency symbol characters: 20A0-20AF
+ x (currency sign - 00A4)
+0025 PERCENT SIGN
+ x (arabic percent sign - 066A)
+ x (per mille sign - 2030)
+ x (per ten thousand sign - 2031)
+0026 AMPERSAND
+0027 APOSTROPHE
+ = APOSTROPHE-QUOTE
+ = APL quote
+ * neutral (vertical) glyph having mixed usage
+ * preferred character for apostrophe is 2019
+ * preferred characters in English for paired quotation marks are 2018 & 2019
+ x (modifier letter prime - 02B9)
+ x (modifier letter apostrophe - 02BC)
+ x (modifier letter vertical line - 02C8)
+ x (combining acute accent - 0301)
+ x (prime - 2032)
+0028 LEFT PARENTHESIS
+ = OPENING PARENTHESIS
+0029 RIGHT PARENTHESIS
+ = CLOSING PARENTHESIS
+ * see discussion on semantics of paired bracketing characters
+002A ASTERISK
+ = star (on phone keypads)
+ x (arabic five pointed star - 066D)
+ x (asterisk operator - 2217)
+ x (heavy asterisk - 2731)
+002B PLUS SIGN
+002C COMMA
+ = decimal separator
+ x (arabic comma - 060C)
+ x (single low-9 quotation mark - 201A)
+ x (ideographic comma - 3001)
+002D HYPHEN-MINUS
+ = hyphen or minus sign
+ * used for either hyphen or minus sign
+ x (hyphen - 2010)
+ x (non-breaking hyphen - 2011)
+ x (figure dash - 2012)
+ x (en dash - 2013)
+ x (minus sign - 2212)
+002E FULL STOP
+ = PERIOD
+ = dot, decimal point
+ * may be rendered as a raised decimal point in old style numbers
+ x (arabic full stop - 06D4)
+ x (ideographic full stop - 3002)
+002F SOLIDUS
+ = SLASH
+ = virgule, shilling (British)
+ x (latin letter dental click - 01C0)
+ x (combining long solidus overlay - 0338)
+ x (fraction slash - 2044)
+ x (division slash - 2215)
+0030 DIGIT ZERO
+0031 DIGIT ONE
+0032 DIGIT TWO
+0033 DIGIT THREE
+0034 DIGIT FOUR
+0035 DIGIT FIVE
+0036 DIGIT SIX
+0037 DIGIT SEVEN
+0038 DIGIT EIGHT
+0039 DIGIT NINE
+003A COLON
+ x (armenian full stop - 0589)
+ x (hebrew punctuation sof pasuq - 05C3)
+ x (ratio - 2236)
+003B SEMICOLON
+ x (greek question mark - 037E)
+ x (arabic semicolon - 061B)
+003C LESS-THAN SIGN
+ x (single left-pointing angle quotation mark - 2039)
+ x (left-pointing angle bracket - 2329)
+ x (left angle bracket - 3008)
+003D EQUALS SIGN
+ * other related characters: 2241-2263
+ x (not equal to - 2260)
+ x (identical to - 2261)
+003E GREATER-THAN SIGN
+ x (single right-pointing angle quotation mark - 203A)
+ x (right-pointing angle bracket - 232A)
+ x (right angle bracket - 3009)
+003F QUESTION MARK
+ x (inverted question mark - 00BF)
+ x (greek question mark - 037E)
+ x (arabic question mark - 061F)
+ x (interrobang - 203D)
+ x (question exclamation mark - 2048)
+ x (exclamation question mark - 2049)
+0040 COMMERCIAL AT
+0041 LATIN CAPITAL LETTER A
+0042 LATIN CAPITAL LETTER B
+ x (script capital b - 212C)
+0043 LATIN CAPITAL LETTER C
+ x (double-struck capital c - 2102)
+ x (black-letter capital c - 212D)
+0044 LATIN CAPITAL LETTER D
+0045 LATIN CAPITAL LETTER E
+ x (euler constant - 2107)
+ x (script capital e - 2130)
+0046 LATIN CAPITAL LETTER F
+ x (script capital f - 2131)
+ x (turned capital f - 2132)
+0047 LATIN CAPITAL LETTER G
+0048 LATIN CAPITAL LETTER H
+ x (script capital h - 210B)
+ x (black-letter capital h - 210C)
+ x (double-struck capital h - 210D)
+0049 LATIN CAPITAL LETTER I
+ * Turkish and Azerbaijani use 0131 for lowercase
+ x (latin capital letter i with dot above - 0130)
+ x (cyrillic capital letter byelorussian-ukrainian i - 0406)
+ x (cyrillic letter palochka - 04C0)
+ x (script capital i - 2110)
+ x (black-letter capital i - 2111)
+ x (roman numeral one - 2160)
+004A LATIN CAPITAL LETTER J
+004B LATIN CAPITAL LETTER K
+ x (kelvin sign - 212A)
+004C LATIN CAPITAL LETTER L
+ x (script capital l - 2112)
+004D LATIN CAPITAL LETTER M
+ x (script capital m - 2133)
+004E LATIN CAPITAL LETTER N
+ x (double-struck capital n - 2115)
+004F LATIN CAPITAL LETTER O
+0050 LATIN CAPITAL LETTER P
+ x (double-struck capital p - 2119)
+0051 LATIN CAPITAL LETTER Q
+ x (double-struck capital q - 211A)
+0052 LATIN CAPITAL LETTER R
+ x (script capital r - 211B)
+ x (black-letter capital r - 211C)
+ x (double-struck capital r - 211D)
+0053 LATIN CAPITAL LETTER S
+0054 LATIN CAPITAL LETTER T
+0055 LATIN CAPITAL LETTER U
+0056 LATIN CAPITAL LETTER V
+0057 LATIN CAPITAL LETTER W
+0058 LATIN CAPITAL LETTER X
+0059 LATIN CAPITAL LETTER Y
+005A LATIN CAPITAL LETTER Z
+ x (double-struck capital z - 2124)
+ x (black-letter capital z - 2128)
+005B LEFT SQUARE BRACKET
+ = OPENING SQUARE BRACKET
+ * other bracket characters: 3008-301B
+005C REVERSE SOLIDUS
+ = BACKSLASH
+ x (set minus - 2216)
+005D RIGHT SQUARE BRACKET
+ = CLOSING SQUARE BRACKET
+005E CIRCUMFLEX ACCENT
+ * this is a spacing character
+ x (modifier letter up arrowhead - 02C4)
+ x (modifier letter circumflex accent - 02C6)
+ x (combining circumflex accent - 0302)
+ x (up arrowhead - 2303)
+005F LOW LINE
+ = SPACING UNDERSCORE
+ * this is a spacing character
+ x (modifier letter low macron - 02CD)
+ x (combining macron below - 0331)
+ x (combining low line - 0332)
+ x (double low line - 2017)
+0060 GRAVE ACCENT
+ * this is a spacing character
+ x (modifier letter grave accent - 02CB)
+ x (combining grave accent - 0300)
+ x (reversed prime - 2035)
+0061 LATIN SMALL LETTER A
+0062 LATIN SMALL LETTER B
+0063 LATIN SMALL LETTER C
+0064 LATIN SMALL LETTER D
+0065 LATIN SMALL LETTER E
+ x (estimated symbol - 212E)
+ x (script small e - 212F)
+0066 LATIN SMALL LETTER F
+0067 LATIN SMALL LETTER G
+ x (latin small letter script g - 0261)
+ x (script small g - 210A)
+0068 LATIN SMALL LETTER H
+ x (cyrillic small letter shha - 04BB)
+ x (planck constant - 210E)
+0069 LATIN SMALL LETTER I
+ * Turkish and Azerbaijani use 0130 for uppercase
+ x (latin small letter dotless i - 0131)
+006A LATIN SMALL LETTER J
+006B LATIN SMALL LETTER K
+006C LATIN SMALL LETTER L
+ x (script small l - 2113)
+006D LATIN SMALL LETTER M
+006E LATIN SMALL LETTER N
+ x (superscript latin small letter n - 207F)
+006F LATIN SMALL LETTER O
+ x (script small o - 2134)
+0070 LATIN SMALL LETTER P
+0071 LATIN SMALL LETTER Q
+0072 LATIN SMALL LETTER R
+0073 LATIN SMALL LETTER S
+0074 LATIN SMALL LETTER T
+0075 LATIN SMALL LETTER U
+0076 LATIN SMALL LETTER V
+0077 LATIN SMALL LETTER W
+0078 LATIN SMALL LETTER X
+0079 LATIN SMALL LETTER Y
+007A LATIN SMALL LETTER Z
+ x (latin small letter z with stroke - 01B6)
+007B LEFT CURLY BRACKET
+ = OPENING CURLY BRACKET
+ = opening brace
+007C VERTICAL LINE
+ = VERTICAL BAR
+ * used in pairs to indicate absolute value
+ x (latin letter dental click - 01C0)
+ x (hebrew punctuation paseq - 05C0)
+ x (divides - 2223)
+ x (light vertical bar - 2758)
+007D RIGHT CURLY BRACKET
+ = CLOSING CURLY BRACKET
+ = closing brace
+007E TILDE
+ * this is a spacing character
+ x (small tilde - 02DC)
+ x (combining tilde - 0303)
+ x (tilde operator - 223C)
+ x (fullwidth tilde - FF5E)
+007F <control>
+ = DELETE
+@@ 0080 C1 Controls and Latin-1 Supplement (Latin-1 Supplement) 00FF
+@ C1 controls
+@+ Alias names are those for ISO 6429.
+0080 <control>
+0081 <control>
+0082 <control>
+ = BREAK PERMITTED HERE
+0083 <control>
+ = NO BREAK HERE
+0084 <control>
+0085 <control>
+ = NEXT LINE
+0086 <control>
+ = START OF SELECTED AREA
+0087 <control>
+ = END OF SELECTED AREA
+0088 <control>
+ = CHARACTER TABULATION SET
+0089 <control>
+ = CHARACTER TABULATION WITH JUSTIFICATION
+008A <control>
+ = LINE TABULATION SET
+008B <control>
+ = PARTIAL LINE DOWN
+008C <control>
+ = PARTIAL LINE UP
+008D <control>
+ = REVERSE LINE FEED
+008E <control>
+ = SINGLE SHIFT TWO
+008F <control>
+ = SINGLE SHIFT THREE
+0090 <control>
+ = DEVICE CONTROL STRING
+0091 <control>
+ = PRIVATE USE ONE
+0092 <control>
+ = PRIVATE USE TWO
+0093 <control>
+ = SET TRANSMIT STATE
+0094 <control>
+ = CANCEL CHARACTER
+0095 <control>
+ = MESSAGE WAITING
+0096 <control>
+ = START OF GUARDED AREA
+0097 <control>
+ = END OF GUARDED AREA
+0098 <control>
+ = START OF STRING
+0099 <control>
+009A <control>
+ = SINGLE CHARACTER INTRODUCER
+009B <control>
+ = CONTROL SEQUENCE INTRODUCER
+009C <control>
+ = STRING TERMINATOR
+009D <control>
+ = OPERATING SYSTEM COMMAND
+009E <control>
+ = PRIVACY MESSAGE
+009F <control>
+ = APPLICATION PROGRAM COMMAND
+@ ISO 8859-1 (aka Latin-1)
+00A0 NO-BREAK SPACE
+ x (space - 0020)
+ x (figure space - 2007)
+ x (narrow no-break space - 202F)
+ x (zero width no-break space - FEFF)
+ # <noBreak> 0020
+00A1 INVERTED EXCLAMATION MARK
+ * Spanish, Asturian, Galician
+ x (exclamation mark - 0021)
+00A2 CENT SIGN
+00A3 POUND SIGN
+ = pound sterling, Irish punt
+ x (lira sign - 20A4)
+00A4 CURRENCY SIGN
+ = Filzlaus, Ricardi-Sonne (German names)
+ * other currency symbol characters: 20A0-20AF
+ x (dollar sign - 0024)
+00A5 YEN SIGN
+ = yuan sign
+ * glyph may have one or two crossbars
+00A6 BROKEN BAR
+ = BROKEN VERTICAL BAR
+ = parted rule (in typography)
+00A7 SECTION SIGN
+ * paragraph sign in some European usage
+00A8 DIAERESIS
+ * this is a spacing character
+ x (combining diaeresis - 0308)
+ # 0020 0308
+00A9 COPYRIGHT SIGN
+ x (sound recording copyright - 2117)
+00AA FEMININE ORDINAL INDICATOR
+ * Spanish
+ # <super> 0061
+00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK *
+ = LEFT POINTING GUILLEMET
+ = chevrons (in typography)
+ * usually opening, sometimes closing
+ x (much less-than - 226A)
+ x (left double angle bracket - 300A)
+00AC NOT SIGN
+ = angled dash (in typography)
+ x (reversed not sign - 2310)
+00AD SOFT HYPHEN
+ = discretionary hyphen
+ x (mongolian todo soft hyphen - 1806)
+00AE REGISTERED SIGN
+ = REGISTERED TRADE MARK SIGN
+00AF MACRON
+ = overline, APL overbar
+ * this is a spacing character
+ x (modifier letter macron - 02C9)
+ x (combining macron - 0304)
+ x (combining overline - 0305)
+ # 0020 0304
+00B0 DEGREE SIGN
+ * this is a spacing character
+ x (ring above - 02DA)
+ x (combining ring above - 030A)
+ x (superscript zero - 2070)
+ x (ring operator - 2218)
+00B1 PLUS-MINUS SIGN
+ x (minus-or-plus sign - 2213)
+00B2 SUPERSCRIPT TWO
+ = squared
+ * other superscript digit characters: 2070-2079
+ x (superscript one - 00B9)
+ # <super> 0032
+00B3 SUPERSCRIPT THREE
+ = cubed
+ x (superscript one - 00B9)
+ # <super> 0033
+00B4 ACUTE ACCENT
+ * this is a spacing character
+ x (modifier letter prime - 02B9)
+ x (modifier letter acute accent - 02CA)
+ x (combining acute accent - 0301)
+ x (prime - 2032)
+ # 0020 0301
+00B5 MICRO SIGN
+ # 03BC greek small letter mu
+00B6 PILCROW SIGN
+ = PARAGRAPH SIGN
+ * section sign in some European usage
+ x (reversed pilcrow sign - 204B)
+ x (curved stem paragraph sign ornament - 2761)
+00B7 MIDDLE DOT
+ = midpoint (in typography)
+ = Georgian comma
+ = Greek middle dot
+ x (bullet - 2022)
+ x (one dot leader - 2024)
+ x (hyphenation point - 2027)
+ x (bullet operator - 2219)
+ x (dot operator - 22C5)
+ x (katakana middle dot - 30FB)
+00B8 CEDILLA
+ * this is a spacing character
+ * other spacing accent characters: 02D8-02DB
+ x (combining cedilla - 0327)
+ # 0020 0327
+00B9 SUPERSCRIPT ONE
+ x (superscript two - 00B2)
+ x (superscript three - 00B3)
+ # <super> 0031
+00BA MASCULINE ORDINAL INDICATOR
+ * Spanish
+ # <super> 006F
+00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK *
+ = RIGHT POINTING GUILLEMET
+ * usually closing, sometimes opening
+ x (much greater-than - 226B)
+ x (right double angle bracket - 300B)
+00BC VULGAR FRACTION ONE QUARTER
+ * bar may be horizontal or slanted
+ * other fraction characters: 2153-215E
+ # 0031 2044 0034
+00BD VULGAR FRACTION ONE HALF
+ * bar may be horizontal or slanted
+ # 0031 2044 0032
+00BE VULGAR FRACTION THREE QUARTERS
+ * bar may be horizontal or slanted
+ # 0033 2044 0034
+00BF INVERTED QUESTION MARK
+ = turned question mark
+ * Spanish
+ x (question mark - 003F)
+00C0 LATIN CAPITAL LETTER A WITH GRAVE
+ : 0041 0300
+00C1 LATIN CAPITAL LETTER A WITH ACUTE
+ : 0041 0301
+00C2 LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+ : 0041 0302
+00C3 LATIN CAPITAL LETTER A WITH TILDE
+ : 0041 0303
+00C4 LATIN CAPITAL LETTER A WITH DIAERESIS
+ : 0041 0308
+00C5 LATIN CAPITAL LETTER A WITH RING ABOVE
+ x (angstrom sign - 212B)
+ : 0041 030A
+00C6 LATIN CAPITAL LETTER AE (ash) *
+ = LATIN CAPITAL LIGATURE AE
+00C7 LATIN CAPITAL LETTER C WITH CEDILLA
+ : 0043 0327
+00C8 LATIN CAPITAL LETTER E WITH GRAVE
+ : 0045 0300
+00C9 LATIN CAPITAL LETTER E WITH ACUTE
+ : 0045 0301
+00CA LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+ : 0045 0302
+00CB LATIN CAPITAL LETTER E WITH DIAERESIS
+ : 0045 0308
+00CC LATIN CAPITAL LETTER I WITH GRAVE
+ : 0049 0300
+00CD LATIN CAPITAL LETTER I WITH ACUTE
+ : 0049 0301
+00CE LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+ : 0049 0302
+00CF LATIN CAPITAL LETTER I WITH DIAERESIS
+ : 0049 0308
+00D0 LATIN CAPITAL LETTER ETH (Icelandic)
+ x (latin small letter eth - 00F0)
+ x (latin capital letter d with stroke - 0110)
+ x (latin capital letter african d - 0189)
+00D1 LATIN CAPITAL LETTER N WITH TILDE
+ : 004E 0303
+00D2 LATIN CAPITAL LETTER O WITH GRAVE
+ : 004F 0300
+00D3 LATIN CAPITAL LETTER O WITH ACUTE
+ : 004F 0301
+00D4 LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+ : 004F 0302
+00D5 LATIN CAPITAL LETTER O WITH TILDE
+ : 004F 0303
+00D6 LATIN CAPITAL LETTER O WITH DIAERESIS
+ : 004F 0308
+00D7 MULTIPLICATION SIGN
+ = z notation Cartesian product
+00D8 LATIN CAPITAL LETTER O WITH STROKE
+ = LATIN CAPITAL LETTER O SLASH
+ x (empty set - 2205)
+00D9 LATIN CAPITAL LETTER U WITH GRAVE
+ : 0055 0300
+00DA LATIN CAPITAL LETTER U WITH ACUTE
+ : 0055 0301
+00DB LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+ : 0055 0302
+00DC LATIN CAPITAL LETTER U WITH DIAERESIS
+ : 0055 0308
+00DD LATIN CAPITAL LETTER Y WITH ACUTE
+ : 0059 0301
+00DE LATIN CAPITAL LETTER THORN (Icelandic)
+00DF LATIN SMALL LETTER SHARP S (German)
+ = Eszett
+ * German
+ * uppercase is "SS"
+ * in origin a ligature of 017F and 0073
+ x (greek small letter beta - 03B2)
+00E0 LATIN SMALL LETTER A WITH GRAVE
+ : 0061 0300
+00E1 LATIN SMALL LETTER A WITH ACUTE
+ : 0061 0301
+00E2 LATIN SMALL LETTER A WITH CIRCUMFLEX
+ : 0061 0302
+00E3 LATIN SMALL LETTER A WITH TILDE
+ * Portuguese
+ : 0061 0303
+00E4 LATIN SMALL LETTER A WITH DIAERESIS
+ : 0061 0308
+00E5 LATIN SMALL LETTER A WITH RING ABOVE
+ * Danish, Norwegian, Swedish, Walloon
+ : 0061 030A
+00E6 LATIN SMALL LETTER AE (ash) *
+ = LATIN SMALL LIGATURE AE
+ = ash (from Old English æsc)
+ * Danish, Norwegian, Icelandic, Faroese, Old English, French, IPA
+ x (latin small ligature oe - 0153)
+ x (cyrillic small ligature a ie - 04D5)
+00E7 LATIN SMALL LETTER C WITH CEDILLA
+ : 0063 0327
+00E8 LATIN SMALL LETTER E WITH GRAVE
+ : 0065 0300
+00E9 LATIN SMALL LETTER E WITH ACUTE
+ : 0065 0301
+00EA LATIN SMALL LETTER E WITH CIRCUMFLEX
+ : 0065 0302
+00EB LATIN SMALL LETTER E WITH DIAERESIS
+ : 0065 0308
+00EC LATIN SMALL LETTER I WITH GRAVE
+ * Italian, Malagasy
+ : 0069 0300
+00ED LATIN SMALL LETTER I WITH ACUTE
+ : 0069 0301
+00EE LATIN SMALL LETTER I WITH CIRCUMFLEX
+ : 0069 0302
+00EF LATIN SMALL LETTER I WITH DIAERESIS
+ : 0069 0308
+00F0 LATIN SMALL LETTER ETH (Icelandic)
+ * Icelandic, Faroese, Old English, IPA
+ x (latin capital letter eth - 00D0)
+ x (greek small letter delta - 03B4)
+ x (partial differential - 2202)
+00F1 LATIN SMALL LETTER N WITH TILDE
+ : 006E 0303
+00F2 LATIN SMALL LETTER O WITH GRAVE
+ : 006F 0300
+00F3 LATIN SMALL LETTER O WITH ACUTE
+ : 006F 0301
+00F4 LATIN SMALL LETTER O WITH CIRCUMFLEX
+ : 006F 0302
+00F5 LATIN SMALL LETTER O WITH TILDE
+ * Portuguese, Estonian
+ : 006F 0303
+00F6 LATIN SMALL LETTER O WITH DIAERESIS
+ : 006F 0308
+00F7 DIVISION SIGN
+00F8 LATIN SMALL LETTER O WITH STROKE
+ = LATIN SMALL LETTER O SLASH
+ * Danish, Norwegian, Faroese, IPA
+00F9 LATIN SMALL LETTER U WITH GRAVE
+ * French, Italian
+ : 0075 0300
+00FA LATIN SMALL LETTER U WITH ACUTE
+ : 0075 0301
+00FB LATIN SMALL LETTER U WITH CIRCUMFLEX
+ : 0075 0302
+00FC LATIN SMALL LETTER U WITH DIAERESIS
+ : 0075 0308
+00FD LATIN SMALL LETTER Y WITH ACUTE
+ * Czech, Slovak, Icelandic, Faroese, Welsh, Malagasy
+ : 0079 0301
+00FE LATIN SMALL LETTER THORN (Icelandic)
+ * Icelandic, Old English, phonetics
+ * Runic letter borrowed into Latin script
+ x (runic letter thurisaz thurs thorn - 16A6)
+00FF LATIN SMALL LETTER Y WITH DIAERESIS
+ * French
+ x (latin capital letter y with diaeresis - 0178)
+ : 0079 0308
+@@ 0100 Latin Extended-A 017F
+@ European Latin
+0100 LATIN CAPITAL LETTER A WITH MACRON
+ : 0041 0304
+0101 LATIN SMALL LETTER A WITH MACRON
+ * Latvian, Latin, ...
+ : 0061 0304
+0102 LATIN CAPITAL LETTER A WITH BREVE
+ : 0041 0306
+0103 LATIN SMALL LETTER A WITH BREVE
+ * Romanian, Vietnamese, Latin, ...
+ : 0061 0306
+0104 LATIN CAPITAL LETTER A WITH OGONEK
+ : 0041 0328
+0105 LATIN SMALL LETTER A WITH OGONEK
+ * Polish, Lithuanian, ...
+ : 0061 0328
+0106 LATIN CAPITAL LETTER C WITH ACUTE
+ : 0043 0301
+0107 LATIN SMALL LETTER C WITH ACUTE
+ * Polish, Croatian, ...
+ x (cyrillic small letter tshe - 045B)
+ : 0063 0301
+0108 LATIN CAPITAL LETTER C WITH CIRCUMFLEX
+ : 0043 0302
+0109 LATIN SMALL LETTER C WITH CIRCUMFLEX
+ * Esperanto
+ : 0063 0302
+010A LATIN CAPITAL LETTER C WITH DOT ABOVE
+ : 0043 0307
+010B LATIN SMALL LETTER C WITH DOT ABOVE
+ * Maltese, Irish Gaelic (old orthography)
+ : 0063 0307
+010C LATIN CAPITAL LETTER C WITH CARON
+ : 0043 030C
+010D LATIN SMALL LETTER C WITH CARON
+ * Czech, Slovak, Slovenian, and many other languages
+ : 0063 030C
+010E LATIN CAPITAL LETTER D WITH CARON
+ * the form using caron/hacek is preferred in all contexts
+ : 0044 030C
+010F LATIN SMALL LETTER D WITH CARON
+ * Czech, Slovak
+ * the form using apostrophe is preferred in typesetting
+ : 0064 030C
+0110 LATIN CAPITAL LETTER D WITH STROKE
+ x (latin capital letter eth - 00D0)
+ x (latin small letter d with stroke - 0111)
+ x (latin capital letter african d - 0189)
+0111 LATIN SMALL LETTER D WITH STROKE
+ * Croatian, Vietnamese, Sámi
+ x (latin capital letter d with stroke - 0110)
+ x (cyrillic small letter dje - 0452)
+0112 LATIN CAPITAL LETTER E WITH MACRON
+ : 0045 0304
+0113 LATIN SMALL LETTER E WITH MACRON
+ * Latvian, Latin, ...
+ : 0065 0304
+0114 LATIN CAPITAL LETTER E WITH BREVE
+ : 0045 0306
+0115 LATIN SMALL LETTER E WITH BREVE
+ * Malay, Latin, ...
+ : 0065 0306
+0116 LATIN CAPITAL LETTER E WITH DOT ABOVE
+ : 0045 0307
+0117 LATIN SMALL LETTER E WITH DOT ABOVE
+ * Lithuanian
+ : 0065 0307
+0118 LATIN CAPITAL LETTER E WITH OGONEK
+ : 0045 0328
+0119 LATIN SMALL LETTER E WITH OGONEK
+ * Polish, Lithuanian, ...
+ : 0065 0328
+011A LATIN CAPITAL LETTER E WITH CARON
+ : 0045 030C
+011B LATIN SMALL LETTER E WITH CARON
+ * Czech, ...
+ : 0065 030C
+011C LATIN CAPITAL LETTER G WITH CIRCUMFLEX
+ : 0047 0302
+011D LATIN SMALL LETTER G WITH CIRCUMFLEX
+ * Esperanto
+ : 0067 0302
+011E LATIN CAPITAL LETTER G WITH BREVE
+ : 0047 0306
+011F LATIN SMALL LETTER G WITH BREVE
+ * Turkish, Azerbaijani
+ x (latin small letter g with caron - 01E7)
+ : 0067 0306
+0120 LATIN CAPITAL LETTER G WITH DOT ABOVE
+ : 0047 0307
+0121 LATIN SMALL LETTER G WITH DOT ABOVE
+ * Maltese, Irish Gaelic (old orthography)
+ : 0067 0307
+0122 LATIN CAPITAL LETTER G WITH CEDILLA
+ : 0047 0327
+0123 LATIN SMALL LETTER G WITH CEDILLA
+ * Latvian
+ * there are three major glyph variants
+ : 0067 0327
+0124 LATIN CAPITAL LETTER H WITH CIRCUMFLEX
+ : 0048 0302
+0125 LATIN SMALL LETTER H WITH CIRCUMFLEX
+ * Esperanto
+ : 0068 0302
+0126 LATIN CAPITAL LETTER H WITH STROKE
+0127 LATIN SMALL LETTER H WITH STROKE
+ * Maltese, IPA, ...
+ x (cyrillic small letter tshe - 045B)
+ x (planck constant over two pi - 210F)
+0128 LATIN CAPITAL LETTER I WITH TILDE
+ : 0049 0303
+0129 LATIN SMALL LETTER I WITH TILDE
+ * Greenlandic (old orthography)
+ : 0069 0303
+012A LATIN CAPITAL LETTER I WITH MACRON
+ : 0049 0304
+012B LATIN SMALL LETTER I WITH MACRON
+ * Latvian, Latin, ...
+ : 0069 0304
+012C LATIN CAPITAL LETTER I WITH BREVE
+ : 0049 0306
+012D LATIN SMALL LETTER I WITH BREVE
+ * Latin, ...
+ : 0069 0306
+012E LATIN CAPITAL LETTER I WITH OGONEK
+ : 0049 0328
+012F LATIN SMALL LETTER I WITH OGONEK
+ * Lithuanian, ...
+ : 0069 0328
+0130 LATIN CAPITAL LETTER I WITH DOT ABOVE
+ = LATIN CAPITAL LETTER I DOT
+ * Turkish, Azerbaijani
+ * lowercase is 0069
+ x (latin capital letter i - 0049)
+ : 0049 0307
+0131 LATIN SMALL LETTER DOTLESS I
+ * Turkish, Azerbaijani
+ * uppercase is 0049
+ x (latin small letter i - 0069)
+0132 LATIN CAPITAL LIGATURE IJ
+ # 0049 004A
+0133 LATIN SMALL LIGATURE IJ
+ * Dutch
+ # 0069 006A
+0134 LATIN CAPITAL LETTER J WITH CIRCUMFLEX
+ : 004A 0302
+0135 LATIN SMALL LETTER J WITH CIRCUMFLEX
+ * Esperanto
+ : 006A 0302
+0136 LATIN CAPITAL LETTER K WITH CEDILLA
+ : 004B 0327
+0137 LATIN SMALL LETTER K WITH CEDILLA
+ * Latvian
+ : 006B 0327
+0138 LATIN SMALL LETTER KRA (Greenlandic)
+ * Greenlandic (old orthography)
+0139 LATIN CAPITAL LETTER L WITH ACUTE
+ : 004C 0301
+013A LATIN SMALL LETTER L WITH ACUTE
+ * Slovak
+ : 006C 0301
+013B LATIN CAPITAL LETTER L WITH CEDILLA
+ : 004C 0327
+013C LATIN SMALL LETTER L WITH CEDILLA
+ * Latvian
+ : 006C 0327
+013D LATIN CAPITAL LETTER L WITH CARON
+ : 004C 030C
+013E LATIN SMALL LETTER L WITH CARON
+ * Slovak
+ * the form using apostrophe is preferred in typesetting
+ : 006C 030C
+013F LATIN CAPITAL LETTER L WITH MIDDLE DOT
+ * some fonts show the middle dot inside the L, but the preferred form has the dot following the L
+ # 004C 00B7
+0140 LATIN SMALL LETTER L WITH MIDDLE DOT
+ * Catalan
+ # 006C 00B7
+0141 LATIN CAPITAL LETTER L WITH STROKE
+0142 LATIN SMALL LETTER L WITH STROKE
+ * Polish, ...
+ x (latin small letter l with bar - 019A)
+0143 LATIN CAPITAL LETTER N WITH ACUTE
+ : 004E 0301
+0144 LATIN SMALL LETTER N WITH ACUTE
+ * Polish, ...
+ : 006E 0301
+0145 LATIN CAPITAL LETTER N WITH CEDILLA
+ : 004E 0327
+0146 LATIN SMALL LETTER N WITH CEDILLA
+ * Latvian
+ : 006E 0327
+0147 LATIN CAPITAL LETTER N WITH CARON
+ : 004E 030C
+0148 LATIN SMALL LETTER N WITH CARON
+ * Czech, Slovak
+ : 006E 030C
+0149 LATIN SMALL LETTER N PRECEDED BY APOSTROPHE
+ = LATIN SMALL LETTER APOSTROPHE N
+ * Afrikaans
+ * this is not actually a single letter
+ # 02BC 006E
+014A LATIN CAPITAL LETTER ENG (Sami)
+ * glyph may also have appearance of large form of the small letter
+014B LATIN SMALL LETTER ENG (Sami)
+ * Sámi, Mende, IPA, ...
+014C LATIN CAPITAL LETTER O WITH MACRON
+ : 004F 0304
+014D LATIN SMALL LETTER O WITH MACRON
+ * Latvian, Latin, ...
+ : 006F 0304
+014E LATIN CAPITAL LETTER O WITH BREVE
+ : 004F 0306
+014F LATIN SMALL LETTER O WITH BREVE
+ * Latin
+ : 006F 0306
+0150 LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
+ : 004F 030B
+0151 LATIN SMALL LETTER O WITH DOUBLE ACUTE
+ * Hungarian
+ : 006F 030B
+0152 LATIN CAPITAL LIGATURE OE
+0153 LATIN SMALL LIGATURE OE
+ = LATIN SMALL LETTER O E
+ = ethel (from Old English eðel)
+ * French, IPA, Old Icelandic, Old English, ...
+ x (latin small letter ae - 00E6)
+ x (latin letter small capital oe - 0276)
+0154 LATIN CAPITAL LETTER R WITH ACUTE
+ : 0052 0301
+0155 LATIN SMALL LETTER R WITH ACUTE
+ * Slovak, ...
+ : 0072 0301
+0156 LATIN CAPITAL LETTER R WITH CEDILLA
+ : 0052 0327
+0157 LATIN SMALL LETTER R WITH CEDILLA
+ * Latvian
+ : 0072 0327
+0158 LATIN CAPITAL LETTER R WITH CARON
+ : 0052 030C
+0159 LATIN SMALL LETTER R WITH CARON
+ * Czech, ...
+ : 0072 030C
+015A LATIN CAPITAL LETTER S WITH ACUTE
+ : 0053 0301
+015B LATIN SMALL LETTER S WITH ACUTE
+ * Polish, Indic transliteration, ...
+ : 0073 0301
+015C LATIN CAPITAL LETTER S WITH CIRCUMFLEX
+ : 0053 0302
+015D LATIN SMALL LETTER S WITH CIRCUMFLEX
+ * Esperanto
+ : 0073 0302
+015E LATIN CAPITAL LETTER S WITH CEDILLA *
+ : 0053 0327
+015F LATIN SMALL LETTER S WITH CEDILLA *
+ * Turkish, Azerbaijani, Romanian, ...
+ * this character is used in both Turkish and Romanian data
+ * a glyph variant with comma below is preferred for Romanian
+ x (latin small letter s with comma below - 0219)
+ : 0073 0327
+0160 LATIN CAPITAL LETTER S WITH CARON
+ : 0053 030C
+0161 LATIN SMALL LETTER S WITH CARON
+ * Czech, Estonian, Finnish, Slovak, and many other languages
+ : 0073 030C
+0162 LATIN CAPITAL LETTER T WITH CEDILLA *
+ : 0054 0327
+0163 LATIN SMALL LETTER T WITH CEDILLA *
+ * Romanian, Semitic transliteration, ...
+ * this character is used in Romanian data
+ * a glyph variant with comma below is preferred for Romanian
+ x (latin small letter t with comma below - 021B)
+ : 0074 0327
+0164 LATIN CAPITAL LETTER T WITH CARON
+ * the form using caron/hacek is preferred in all contexts
+ : 0054 030C
+0165 LATIN SMALL LETTER T WITH CARON
+ * Czech, Slovak
+ * the form using apostrophe is preferred in typesetting
+ : 0074 030C
+0166 LATIN CAPITAL LETTER T WITH STROKE
+0167 LATIN SMALL LETTER T WITH STROKE
+ * Sámi
+0168 LATIN CAPITAL LETTER U WITH TILDE
+ : 0055 0303
+0169 LATIN SMALL LETTER U WITH TILDE
+ * Greenlandic (old orthography)
+ : 0075 0303
+016A LATIN CAPITAL LETTER U WITH MACRON
+ : 0055 0304
+016B LATIN SMALL LETTER U WITH MACRON
+ * Latvian, Lithuanian, Latin, ...
+ : 0075 0304
+016C LATIN CAPITAL LETTER U WITH BREVE
+ : 0055 0306
+016D LATIN SMALL LETTER U WITH BREVE
+ * Latin, Esperanto, ...
+ : 0075 0306
+016E LATIN CAPITAL LETTER U WITH RING ABOVE
+ : 0055 030A
+016F LATIN SMALL LETTER U WITH RING ABOVE
+ * Czech, ...
+ : 0075 030A
+0170 LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
+ : 0055 030B
+0171 LATIN SMALL LETTER U WITH DOUBLE ACUTE
+ * Hungarian
+ : 0075 030B
+0172 LATIN CAPITAL LETTER U WITH OGONEK
+ : 0055 0328
+0173 LATIN SMALL LETTER U WITH OGONEK
+ * Lithuanian
+ : 0075 0328
+0174 LATIN CAPITAL LETTER W WITH CIRCUMFLEX
+ : 0057 0302
+0175 LATIN SMALL LETTER W WITH CIRCUMFLEX
+ * Welsh
+ : 0077 0302
+0176 LATIN CAPITAL LETTER Y WITH CIRCUMFLEX
+ : 0059 0302
+0177 LATIN SMALL LETTER Y WITH CIRCUMFLEX
+ * Welsh
+ : 0079 0302
+0178 LATIN CAPITAL LETTER Y WITH DIAERESIS
+ * French, Igbo
+ x (latin small letter y with diaeresis - 00FF)
+ : 0059 0308
+0179 LATIN CAPITAL LETTER Z WITH ACUTE
+ : 005A 0301
+017A LATIN SMALL LETTER Z WITH ACUTE
+ * Polish, ...
+ : 007A 0301
+017B LATIN CAPITAL LETTER Z WITH DOT ABOVE
+ : 005A 0307
+017C LATIN SMALL LETTER Z WITH DOT ABOVE
+ * Polish, ...
+ : 007A 0307
+017D LATIN CAPITAL LETTER Z WITH CARON
+ : 005A 030C
+017E LATIN SMALL LETTER Z WITH CARON
+ * Czech, Estonian, Finnish, Slovak, Slovenian, and many other languages
+ : 007A 030C
+017F LATIN SMALL LETTER LONG S
+ * in common use in Roman types until the 18th century
+ * in current use in Fraktur and Gaelic types
+ # 0073 latin small letter s
+@@ 0180 Latin Extended-B 024F
+@ Latin extended-B
+0180 LATIN SMALL LETTER B WITH STROKE
+ * Americanist and Indo-Europeanist usage for phonetic beta
+ * Old Saxon
+ x (greek small letter beta - 03B2)
+ x (blank symbol - 2422)
+0181 LATIN CAPITAL LETTER B WITH HOOK
+ * Zulu, Pan-Nigerian alphabet
+ x (latin small letter b with hook - 0253)
+0182 LATIN CAPITAL LETTER B WITH TOPBAR
+0183 LATIN SMALL LETTER B WITH TOPBAR
+ * Zhuang
+ * former Soviet minority language scripts
+ x (cyrillic capital letter be - 0411)
+0184 LATIN CAPITAL LETTER TONE SIX
+0185 LATIN SMALL LETTER TONE SIX
+ * Zhuang
+ * Zhuang tone three is Cyrillic ze
+ * Zhuang tone four is Cyrillic che
+ x (latin small letter tone two - 01A8)
+ x (latin small letter tone five - 01BD)
+ x (cyrillic small letter ze - 0437)
+ x (cyrillic small letter che - 0447)
+ x (cyrillic small letter soft sign - 044C)
+0186 LATIN CAPITAL LETTER OPEN O
+ * typographically a turned C
+ x (latin small letter open o - 0254)
+0187 LATIN CAPITAL LETTER C WITH HOOK
+0188 LATIN SMALL LETTER C WITH HOOK
+ * African
+0189 LATIN CAPITAL LETTER AFRICAN D *
+ * Ewe
+ x (latin capital letter eth - 00D0)
+ x (latin capital letter d with stroke - 0110)
+ x (latin small letter d with tail - 0256)
+018A LATIN CAPITAL LETTER D WITH HOOK
+ * Pan-Nigerian alphabet
+ x (latin small letter d with hook - 0257)
+018B LATIN CAPITAL LETTER D WITH TOPBAR
+018C LATIN SMALL LETTER D WITH TOPBAR
+ * former-Soviet minority language scripts
+018D LATIN SMALL LETTER TURNED DELTA
+ * archaic phonetic for labialized dental fricative
+ * recommended spellings 007A 02B7 or 007A 032B
+018E LATIN CAPITAL LETTER REVERSED E
+ = LATIN CAPITAL LETTER TURNED E
+ * Pan-Nigerian alphabet
+ * lowercase is 01DD
+018F LATIN CAPITAL LETTER SCHWA
+ * Azerbaijani, ...
+ x (latin small letter schwa - 0259)
+ x (cyrillic capital letter schwa - 04D8)
+0190 LATIN CAPITAL LETTER OPEN E
+ = LATIN CAPITAL LETTER EPSILON
+ * African
+ x (latin small letter open e - 025B)
+ x (euler constant - 2107)
+0191 LATIN CAPITAL LETTER F WITH HOOK
+ * African
+0192 LATIN SMALL LETTER F WITH HOOK
+ = LATIN SMALL LETTER SCRIPT F
+ = Florin currency symbol (Netherlands)
+ = function symbol
+ = abbreviation convention for folder
+0193 LATIN CAPITAL LETTER G WITH HOOK
+ * African
+ x (latin small letter g with hook - 0260)
+0194 LATIN CAPITAL LETTER GAMMA
+ * African
+ x (latin small letter gamma - 0263)
+0195 LATIN SMALL LETTER HV (hwair)
+ * Gothic transliteration
+ * uppercase is 01F6
+0196 LATIN CAPITAL LETTER IOTA
+ * African
+ x (latin small letter iota - 0269)
+0197 LATIN CAPITAL LETTER I WITH STROKE
+ = barred i, i bar
+ * African
+ * ISO 6438 gives lowercase as 026A, not 0268
+ x (latin letter small capital i - 026A)
+0198 LATIN CAPITAL LETTER K WITH HOOK
+0199 LATIN SMALL LETTER K WITH HOOK
+ * Hausa, Pan-Nigerian alphabet
+019A LATIN SMALL LETTER L WITH BAR
+ = barred l
+ * Americanist phonetic usage for 026C
+ x (latin small letter l with stroke - 0142)
+019B LATIN SMALL LETTER LAMBDA WITH STROKE
+ = barred lambda, lambda bar
+ * Americanist phonetic usage
+019C LATIN CAPITAL LETTER TURNED M
+ * Zhuang
+ x (latin small letter turned m - 026F)
+019D LATIN CAPITAL LETTER N WITH LEFT HOOK
+ * African
+ x (latin small letter n with left hook - 0272)
+019E LATIN SMALL LETTER N WITH LONG RIGHT LEG
+ * archaic phonetic for Japanese syllabic "n"
+ * recommended spelling 006E 0329
+019F LATIN CAPITAL LETTER O WITH MIDDLE TILDE *
+ = barred o, o bar
+ * lowercase is 0275
+ * African
+ x (cyrillic capital letter barred o - 04E8)
+01A0 LATIN CAPITAL LETTER O WITH HORN
+ : 004F 031B
+01A1 LATIN SMALL LETTER O WITH HORN
+ * Vietnamese
+ : 006F 031B
+01A2 LATIN CAPITAL LETTER OI (gha)
+01A3 LATIN SMALL LETTER OI (gha)
+ = gha
+ * Pan-Turkic Latin alphabets
+01A4 LATIN CAPITAL LETTER P WITH HOOK
+01A5 LATIN SMALL LETTER P WITH HOOK
+ * African
+01A6 LATIN LETTER YR *
+ * old Norse
+ * from German Standard DIN 31624 and ISO 5246-2
+ * lowercase is 0280
+01A7 LATIN CAPITAL LETTER TONE TWO
+01A8 LATIN SMALL LETTER TONE TWO
+ * Zhuang
+ * typographically a reversed S
+ x (latin small letter tone six - 0185)
+01A9 LATIN CAPITAL LETTER ESH
+ * African
+ x (latin small letter esh - 0283)
+ x (greek capital letter sigma - 03A3)
+01AA LATIN LETTER REVERSED ESH LOOP
+ * archaic phonetic for labialized palatoalveolar or palatal fricative
+ * Twi
+ * recommended spellings 0283 02B7, 00E7 02B7, 0068 0265, etc.
+01AB LATIN SMALL LETTER T WITH PALATAL HOOK
+ * archaic phonetic for palatalized alveolar or dental stop
+ * recommended spelling 0074 02B2
+01AC LATIN CAPITAL LETTER T WITH HOOK
+01AD LATIN SMALL LETTER T WITH HOOK
+ * African
+01AE LATIN CAPITAL LETTER T WITH RETROFLEX HOOK
+ * African
+ x (latin small letter t with retroflex hook - 0288)
+01AF LATIN CAPITAL LETTER U WITH HORN
+ : 0055 031B
+01B0 LATIN SMALL LETTER U WITH HORN
+ * Vietnamese
+ : 0075 031B
+01B1 LATIN CAPITAL LETTER UPSILON
+ * African
+ * typographically based on turned capital Greek omega
+ x (latin small letter upsilon - 028A)
+ x (inverted ohm sign - 2127)
+01B2 LATIN CAPITAL LETTER V WITH HOOK
+ = LATIN CAPITAL LETTER SCRIPT V
+ * African
+ x (latin small letter v with hook - 028B)
+01B3 LATIN CAPITAL LETTER Y WITH HOOK
+01B4 LATIN SMALL LETTER Y WITH HOOK
+ * Bini, Esoko, and other Edo languages in West Africa
+01B5 LATIN CAPITAL LETTER Z WITH STROKE
+01B6 LATIN SMALL LETTER Z WITH STROKE
+ = barred z, z bar
+ * Pan-Turkic Latin orthography
+ * handwritten variant of Latin "z"
+ x (latin small letter z - 007A)
+01B7 LATIN CAPITAL LETTER EZH
+ * African, Skolt Sámi
+ * lowercase is 0292
+ x (latin capital letter yogh - 021C)
+ x (cyrillic capital letter abkhasian dze - 04E0)
+01B8 LATIN CAPITAL LETTER EZH REVERSED
+01B9 LATIN SMALL LETTER EZH REVERSED
+ * archaic phonetic for voiced pharyngeal fricative
+ * sometimes typographically rendered with a turned digit 3
+ * recommended spelling 0295
+ x (latin letter pharyngeal voiced fricative - 0295)
+ x (arabic letter ain - 0639)
+01BA LATIN SMALL LETTER EZH WITH TAIL
+ * archaic phonetic for labialized voiced palatoalveolar or palatal fricative
+ * Twi
+ * recommended spellings 0292 02B7 or 006A 02B7
+01BB LATIN LETTER TWO WITH STROKE
+ * archaic phonetic for [dz] affricate
+ * recommended spellings 0292 or 0064 007A
+01BC LATIN CAPITAL LETTER TONE FIVE
+01BD LATIN SMALL LETTER TONE FIVE
+ * Zhuang
+ x (latin small letter tone six - 0185)
+01BE LATIN LETTER INVERTED GLOTTAL STOP WITH STROKE
+ * archaic phonetic for [ts] affricate
+ * recommended spelling 0074 0073
+ * letter form is actually derived from ligation of ts, rather than inverted glottal stop
+01BF LATIN LETTER WYNN
+ = wen
+ * Runic letter borrowed into Latin script
+ * replaced by "w" in modern transcriptions of Old English
+ * uppercase is 01F7
+ x (runic letter wunjo wynn w - 16B9)
+01C0 LATIN LETTER DENTAL CLICK
+ = pipe
+ * Khoisan tradition
+ * "c" in Zulu orthography
+ x (solidus - 002F)
+ x (vertical line - 007C)
+ x (latin small letter turned t - 0287)
+ x (divides - 2223)
+01C1 LATIN LETTER LATERAL CLICK
+ = double pipe
+ * Khoisan tradition
+ * "x" in Zulu orthography
+ x (latin letter inverted glottal stop - 0296)
+ x (parallel to - 2225)
+01C2 LATIN LETTER ALVEOLAR CLICK
+ = double-barred pipe
+ * Khoisan tradition
+ x (not equal to - 2260)
+01C3 LATIN LETTER RETROFLEX CLICK
+ = LATIN LETTER EXCLAMATION MARK
+ * Khoisan tradition
+ * "q" in Zulu orthography
+ x (exclamation mark - 0021)
+ x (latin letter stretched c - 0297)
+@ Croatian digraphs matching Serbian Cyrillic letters
+01C4 LATIN CAPITAL LETTER DZ WITH CARON
+ # 0044 017D
+01C5 LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON
+ # 0044 017E
+01C6 LATIN SMALL LETTER DZ WITH CARON
+ x (cyrillic small letter dzhe - 045F)
+ # 0064 017E
+01C7 LATIN CAPITAL LETTER LJ
+ # 004C 004A
+01C8 LATIN CAPITAL LETTER L WITH SMALL LETTER J
+ # 004C 006A
+01C9 LATIN SMALL LETTER LJ
+ x (cyrillic small letter lje - 0459)
+ # 006C 006A
+01CA LATIN CAPITAL LETTER NJ
+ # 004E 004A
+01CB LATIN CAPITAL LETTER N WITH SMALL LETTER J
+ # 004E 006A
+01CC LATIN SMALL LETTER NJ
+ x (cyrillic small letter nje - 045A)
+ # 006E 006A
+@ Pinyin diacritic-vowel combinations
+01CD LATIN CAPITAL LETTER A WITH CARON
+ : 0041 030C
+01CE LATIN SMALL LETTER A WITH CARON
+ * Pinyin third tone
+ : 0061 030C
+01CF LATIN CAPITAL LETTER I WITH CARON
+ : 0049 030C
+01D0 LATIN SMALL LETTER I WITH CARON
+ * Pinyin third tone
+ : 0069 030C
+01D1 LATIN CAPITAL LETTER O WITH CARON
+ : 004F 030C
+01D2 LATIN SMALL LETTER O WITH CARON
+ * Pinyin third tone
+ : 006F 030C
+01D3 LATIN CAPITAL LETTER U WITH CARON
+ : 0055 030C
+01D4 LATIN SMALL LETTER U WITH CARON
+ * Pinyin third tone
+ : 0075 030C
+01D5 LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON
+ : 00DC 0304
+01D6 LATIN SMALL LETTER U WITH DIAERESIS AND MACRON
+ * Pinyin first tone
+ : 00FC 0304
+01D7 LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE
+ : 00DC 0301
+01D8 LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE
+ * Pinyin second tone
+ : 00FC 0301
+01D9 LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON
+ : 00DC 030C
+01DA LATIN SMALL LETTER U WITH DIAERESIS AND CARON
+ * Pinyin third tone
+ : 00FC 030C
+01DB LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE
+ : 00DC 0300
+01DC LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE
+ * Pinyin fourth tone
+ : 00FC 0300
+@ Additions
+01DD LATIN SMALL LETTER TURNED E
+ * Pan-Nigerian alphabet
+ * all other usages of schwa are 0259
+ * uppercase is 018E
+ x (latin small letter schwa - 0259)
+01DE LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON
+ : 00C4 0304
+01DF LATIN SMALL LETTER A WITH DIAERESIS AND MACRON
+ * Livonian, Uralicist usage
+ : 00E4 0304
+01E0 LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON
+ : 0226 0304
+01E1 LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON
+ * Uralicist usage
+ : 0227 0304
+01E2 LATIN CAPITAL LETTER AE WITH MACRON (ash) *
+ : 00C6 0304
+01E3 LATIN SMALL LETTER AE WITH MACRON (ash) *
+ * Old Norse, Old English
+ : 00E6 0304
+01E4 LATIN CAPITAL LETTER G WITH STROKE
+01E5 LATIN SMALL LETTER G WITH STROKE
+ * Skolt Sámi
+01E6 LATIN CAPITAL LETTER G WITH CARON
+ : 0047 030C
+01E7 LATIN SMALL LETTER G WITH CARON
+ * Skolt Sámi
+ x (latin small letter g with breve - 011F)
+ : 0067 030C
+01E8 LATIN CAPITAL LETTER K WITH CARON
+ : 004B 030C
+01E9 LATIN SMALL LETTER K WITH CARON
+ * Skolt Sámi
+ : 006B 030C
+01EA LATIN CAPITAL LETTER O WITH OGONEK
+ : 004F 0328
+01EB LATIN SMALL LETTER O WITH OGONEK
+ * Sámi, Iroquoian, Old Icelandic
+ : 006F 0328
+01EC LATIN CAPITAL LETTER O WITH OGONEK AND MACRON
+ : 01EA 0304
+01ED LATIN SMALL LETTER O WITH OGONEK AND MACRON
+ * Old Icelandic
+ : 01EB 0304
+01EE LATIN CAPITAL LETTER EZH WITH CARON
+ : 01B7 030C
+01EF LATIN SMALL LETTER EZH WITH CARON
+ * Skolt Sámi
+ : 0292 030C
+01F0 LATIN SMALL LETTER J WITH CARON
+ * IPA and many languages
+ : 006A 030C
+01F1 LATIN CAPITAL LETTER DZ
+ # 0044 005A
+01F2 LATIN CAPITAL LETTER D WITH SMALL LETTER Z
+ # 0044 007A
+01F3 LATIN SMALL LETTER DZ
+ # 0064 007A
+01F4 LATIN CAPITAL LETTER G WITH ACUTE
+ : 0047 0301
+01F5 LATIN SMALL LETTER G WITH ACUTE
+ * Macedonian and Serbian transliteration
+ : 0067 0301
+01F6 LATIN CAPITAL LETTER HWAIR
+ * lowercase is 0195
+01F7 LATIN CAPITAL LETTER WYNN
+ = wen
+ * lowercase is 01BF
+01F8 LATIN CAPITAL LETTER N WITH GRAVE
+ : 004E 0300
+01F9 LATIN SMALL LETTER N WITH GRAVE
+ * Pinyin
+ : 006E 0300
+01FA LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE
+ : 00C5 0301
+01FB LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE
+ : 00E5 0301
+01FC LATIN CAPITAL LETTER AE WITH ACUTE (ash) *
+ : 00C6 0301
+01FD LATIN SMALL LETTER AE WITH ACUTE (ash) *
+ : 00E6 0301
+01FE LATIN CAPITAL LETTER O WITH STROKE AND ACUTE
+ : 00D8 0301
+01FF LATIN SMALL LETTER O WITH STROKE AND ACUTE
+ : 00F8 0301
+@ Additions for Slovenian and Croatian
+0200 LATIN CAPITAL LETTER A WITH DOUBLE GRAVE
+ : 0041 030F
+0201 LATIN SMALL LETTER A WITH DOUBLE GRAVE
+ : 0061 030F
+0202 LATIN CAPITAL LETTER A WITH INVERTED BREVE
+ : 0041 0311
+0203 LATIN SMALL LETTER A WITH INVERTED BREVE
+ : 0061 0311
+0204 LATIN CAPITAL LETTER E WITH DOUBLE GRAVE
+ : 0045 030F
+0205 LATIN SMALL LETTER E WITH DOUBLE GRAVE
+ : 0065 030F
+0206 LATIN CAPITAL LETTER E WITH INVERTED BREVE
+ : 0045 0311
+0207 LATIN SMALL LETTER E WITH INVERTED BREVE
+ : 0065 0311
+0208 LATIN CAPITAL LETTER I WITH DOUBLE GRAVE
+ : 0049 030F
+0209 LATIN SMALL LETTER I WITH DOUBLE GRAVE
+ : 0069 030F
+020A LATIN CAPITAL LETTER I WITH INVERTED BREVE
+ : 0049 0311
+020B LATIN SMALL LETTER I WITH INVERTED BREVE
+ : 0069 0311
+020C LATIN CAPITAL LETTER O WITH DOUBLE GRAVE
+ : 004F 030F
+020D LATIN SMALL LETTER O WITH DOUBLE GRAVE
+ : 006F 030F
+020E LATIN CAPITAL LETTER O WITH INVERTED BREVE
+ : 004F 0311
+020F LATIN SMALL LETTER O WITH INVERTED BREVE
+ : 006F 0311
+0210 LATIN CAPITAL LETTER R WITH DOUBLE GRAVE
+ : 0052 030F
+0211 LATIN SMALL LETTER R WITH DOUBLE GRAVE
+ : 0072 030F
+0212 LATIN CAPITAL LETTER R WITH INVERTED BREVE
+ : 0052 0311
+0213 LATIN SMALL LETTER R WITH INVERTED BREVE
+ : 0072 0311
+0214 LATIN CAPITAL LETTER U WITH DOUBLE GRAVE
+ : 0055 030F
+0215 LATIN SMALL LETTER U WITH DOUBLE GRAVE
+ : 0075 030F
+0216 LATIN CAPITAL LETTER U WITH INVERTED BREVE
+ : 0055 0311
+0217 LATIN SMALL LETTER U WITH INVERTED BREVE
+ : 0075 0311
+@ Additions for Romanian
+0218 LATIN CAPITAL LETTER S WITH COMMA BELOW *
+ : 0053 0326
+0219 LATIN SMALL LETTER S WITH COMMA BELOW *
+ * Romanian, when distinct comma below form is required
+ x (latin small letter s with cedilla - 015F)
+ : 0073 0326
+021A LATIN CAPITAL LETTER T WITH COMMA BELOW *
+ : 0054 0326
+021B LATIN SMALL LETTER T WITH COMMA BELOW *
+ * Romanian, when distinct comma below form is required
+ x (latin small letter t with cedilla - 0163)
+ : 0074 0326
+@ Miscellaneous additions
+021C LATIN CAPITAL LETTER YOGH
+ x (latin capital letter ezh - 01B7)
+021D LATIN SMALL LETTER YOGH
+ * Middle English, Scots
+ x (latin small letter ezh - 0292)
+ x (ounce sign - 2125)
+021E LATIN CAPITAL LETTER H WITH CARON
+ : 0048 030C
+021F LATIN SMALL LETTER H WITH CARON
+ * Finnish Romany
+ : 0068 030C
+0222 LATIN CAPITAL LETTER OU
+0223 LATIN SMALL LETTER OU
+ * Algonquin, Huron
+ x (digit eight - 0038)
+0224 LATIN CAPITAL LETTER Z WITH HOOK
+0225 LATIN SMALL LETTER Z WITH HOOK
+ * Middle High German
+0226 LATIN CAPITAL LETTER A WITH DOT ABOVE
+ : 0041 0307
+0227 LATIN SMALL LETTER A WITH DOT ABOVE
+ * Uralicist usage
+ : 0061 0307
+0228 LATIN CAPITAL LETTER E WITH CEDILLA
+ : 0045 0327
+0229 LATIN SMALL LETTER E WITH CEDILLA
+ : 0065 0327
+@ Additions for Livonian
+022A LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON
+ : 00D6 0304
+022B LATIN SMALL LETTER O WITH DIAERESIS AND MACRON
+ * Livonian
+ : 00F6 0304
+022C LATIN CAPITAL LETTER O WITH TILDE AND MACRON
+ : 00D5 0304
+022D LATIN SMALL LETTER O WITH TILDE AND MACRON
+ * Livonian
+ : 00F5 0304
+022E LATIN CAPITAL LETTER O WITH DOT ABOVE
+ : 004F 0307
+022F LATIN SMALL LETTER O WITH DOT ABOVE
+ * Livonian
+ : 006F 0307
+0230 LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON
+ : 022E 0304
+0231 LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON
+ * Livonian
+ : 022F 0304
+0232 LATIN CAPITAL LETTER Y WITH MACRON
+ : 0059 0304
+0233 LATIN SMALL LETTER Y WITH MACRON
+ * Livonian, Cornish
+ : 0079 0304
+@@ 0250 IPA Extensions 02AF
+@ IPA extensions
+@+ IPA includes basic Latin letters and a number of Latin letters from other blocks.
+ x (latin small letter ae - 00E6)
+ x (latin small letter c with cedilla - 00E7)
+ x (latin small letter eth - 00F0)
+ x (latin small letter o with stroke - 00F8)
+ x (latin small letter h with stroke - 0127)
+ x (latin small letter eng - 014B)
+ x (latin small ligature oe - 0153)
+ x (greek small letter beta - 03B2)
+ x (greek small letter theta - 03B8)
+ x (greek small letter lamda - 03BB)
+ x (greek small letter chi - 03C7)
+0250 LATIN SMALL LETTER TURNED A
+ * low central unrounded vowel
+0251 LATIN SMALL LETTER ALPHA
+ = LATIN SMALL LETTER SCRIPT A
+ * low back unrounded vowel
+ x (greek small letter alpha - 03B1)
+0252 LATIN SMALL LETTER TURNED ALPHA
+ * low back rounded vowel
+0253 LATIN SMALL LETTER B WITH HOOK
+ * implosive bilabial stop
+ * Pan-Nigerian alphabet
+ x (latin capital letter b with hook - 0181)
+0254 LATIN SMALL LETTER OPEN O
+ * typographically a turned c
+ * lower-mid back rounded vowel
+ x (latin capital letter open o - 0186)
+0255 LATIN SMALL LETTER C WITH CURL
+ * voiceless alveolo-palatal laminal fricative
+ * used in transcription of Mandarin Chinese
+ * sound spelled with 015B in Polish
+0256 LATIN SMALL LETTER D WITH TAIL
+ = LATIN SMALL LETTER D RETROFLEX HOOK
+ * voiced retroflex stop
+ x (latin capital letter african d - 0189)
+0257 LATIN SMALL LETTER D WITH HOOK
+ * implosive dental or alveolar stop
+ * Ewe, Pan-Nigerian alphabet
+ x (latin capital letter d with hook - 018A)
+0258 LATIN SMALL LETTER REVERSED E
+ * upper-mid central unrounded vowel
+0259 LATIN SMALL LETTER SCHWA
+ * mid-central unrounded vowel
+ * variant uppercase form 018E is associated with 01DD
+ x (latin capital letter schwa - 018F)
+ x (latin small letter turned e - 01DD)
+ x (cyrillic small letter schwa - 04D9)
+025A LATIN SMALL LETTER SCHWA WITH HOOK
+ * rhotacized schwa
+025B LATIN SMALL LETTER OPEN E
+ = LATIN SMALL LETTER EPSILON
+ * lower-mid front unrounded vowel
+ x (latin capital letter open e - 0190)
+ x (greek small letter epsilon - 03B5)
+025C LATIN SMALL LETTER REVERSED OPEN E
+ * lower-mid central unrounded vowel
+025D LATIN SMALL LETTER REVERSED OPEN E WITH HOOK
+ * rhotacized lower-mid central vowel
+025E LATIN SMALL LETTER CLOSED REVERSED OPEN E
+ = LATIN SMALL LETTER CLOSED REVERSED EPSILON
+ * lower-mid central rounded vowel
+025F LATIN SMALL LETTER DOTLESS J WITH STROKE
+ * voiced palatal stop
+ * typographically a turned f, but better thought of as a form of j
+ * "gy" in Hungarian orthography
+ * also archaic phonetic for palatoalveolar affricate 02A4
+0260 LATIN SMALL LETTER G WITH HOOK
+ * implosive velar stop
+ x (latin capital letter g with hook - 0193)
+0261 LATIN SMALL LETTER SCRIPT G
+ * voiced velar stop
+ x (latin small letter g - 0067)
+0262 LATIN LETTER SMALL CAPITAL G
+ * voiced uvular stop
+0263 LATIN SMALL LETTER GAMMA
+ * voiced velar fricative
+ x (latin capital letter gamma - 0194)
+ x (greek small letter gamma - 03B3)
+0264 LATIN SMALL LETTER RAMS HORN
+ = LATIN SMALL LETTER BABY GAMMA
+ * upper-mid back unrounded vowel
+0265 LATIN SMALL LETTER TURNED H
+ * voiced rounded palatal approximant
+0266 LATIN SMALL LETTER H WITH HOOK
+ * breathy-voiced glottal fricative
+ x (modifier letter small h with hook - 02B1)
+0267 LATIN SMALL LETTER HENG WITH HOOK
+ * voiceless coarticulated velar and palatoalveolar fricative
+ * "tj" or "kj" or "sj" in some Swedish dialects
+0268 LATIN SMALL LETTER I WITH STROKE
+ = barred i, i bar
+ * high central unrounded vowel
+ * ISO 6438 gives lowercase of 0197 as 026A, not 0268
+0269 LATIN SMALL LETTER IOTA
+ * semi-high front unrounded vowel
+@+ * obsoleted by IPA in 1989
+ * preferred use is 026A LATIN LETTER SMALL CAPITAL I
+ x (latin capital letter iota - 0196)
+ x (greek small letter iota - 03B9)
+026A LATIN LETTER SMALL CAPITAL I
+ * semi-high front unrounded vowel
+ * preferred IPA alternate for 0269
+ x (latin capital letter i with stroke - 0197)
+026B LATIN SMALL LETTER L WITH MIDDLE TILDE
+ * velarized voiced alveolar lateral approximant
+026C LATIN SMALL LETTER L WITH BELT
+ * voiceless alveolar lateral fricative
+026D LATIN SMALL LETTER L WITH RETROFLEX HOOK
+ * voiced retroflex lateral
+026E LATIN SMALL LETTER LEZH
+ * voiced lateral fricative
+ * "dhl" in Zulu orthography
+026F LATIN SMALL LETTER TURNED M
+ * high back unrounded vowel
+ x (latin capital letter turned m - 019C)
+0270 LATIN SMALL LETTER TURNED M WITH LONG LEG
+ * voiced velar approximant
+0271 LATIN SMALL LETTER M WITH HOOK
+ * voiced labiodental nasal
+0272 LATIN SMALL LETTER N WITH LEFT HOOK
+ * voiced palatal nasal
+ x (latin capital letter n with left hook - 019D)
+0273 LATIN SMALL LETTER N WITH RETROFLEX HOOK
+ * voiced retroflex nasal
+0274 LATIN LETTER SMALL CAPITAL N
+ * voiced uvular nasal
+0275 LATIN SMALL LETTER BARRED O
+ = o bar
+ * rounded mid-central vowel, i.e. rounded schwa
+ * uppercase is 019F
+ x (greek small letter theta - 03B8)
+ x (cyrillic small letter fita - 0473)
+ x (cyrillic small letter barred o - 04E9)
+0276 LATIN LETTER SMALL CAPITAL OE
+ * low front rounded vowel
+ x (latin small ligature oe - 0153)
+0277 LATIN SMALL LETTER CLOSED OMEGA
+ * semi-high back rounded vowel
+@+ * obsoleted by IPA in 1989
+ * preferred use is 028A latin small letter upsilon
+0278 LATIN SMALL LETTER PHI
+ * voiceless bilabial fricative
+ x (greek small letter phi - 03C6)
+0279 LATIN SMALL LETTER TURNED R
+ * voiced alveolar approximant
+ x (modifier letter small turned r - 02B4)
+027A LATIN SMALL LETTER TURNED R WITH LONG LEG
+ * voiced lateral flap
+027B LATIN SMALL LETTER TURNED R WITH HOOK
+ * voiced retroflex approximant
+ x (modifier letter small turned r with hook - 02B5)
+027C LATIN SMALL LETTER R WITH LONG LEG
+ * voiced strident apico-alveolar trill
+@+ * obsoleted by IPA in 1989
+ * sound spelled with 0159 in Czech
+ * preferred phonetic representation for Czech is 0072 031D
+ * in current use in Gaelic types (as glyph variant of 0072)
+027D LATIN SMALL LETTER R WITH TAIL
+ * voiced retroflex flap
+027E LATIN SMALL LETTER R WITH FISHHOOK
+ * voiced alveolar flap or tap
+027F LATIN SMALL LETTER REVERSED R WITH FISHHOOK
+ * apical dental vowel
+ * used in Sinological tradition
+ * IPA spelling - 007A 0329
+0280 LATIN LETTER SMALL CAPITAL R *
+ * voiced uvular trill
+ * Germanic, Old Norse
+ * uppercase is 01A6
+0281 LATIN LETTER SMALL CAPITAL INVERTED R
+ * voiced uvular fricative or approximant
+ x (modifier letter small capital inverted r - 02B6)
+0282 LATIN SMALL LETTER S WITH HOOK
+ * voiceless retroflex fricative
+0283 LATIN SMALL LETTER ESH
+ * voiceless postalveolar fricative
+ x (latin capital letter esh - 01A9)
+ x (integral - 222B)
+0284 LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK
+ * implosive palatal stop
+ * typographically based on 025F, not on 0283
+0285 LATIN SMALL LETTER SQUAT REVERSED ESH
+ * apical retroflex vowel
+ * used in Sinological tradition
+ * IPA spelling - 0290 0329
+0286 LATIN SMALL LETTER ESH WITH CURL
+ * palatalized voiceless postalveolar fricative
+ * suggested spelling - 0283 02B2
+0287 LATIN SMALL LETTER TURNED T
+ * dental click (sound of "tsk tsk")
+ x (latin letter dental click - 01C0)
+0288 LATIN SMALL LETTER T WITH RETROFLEX HOOK
+ * voiceless retroflex stop
+ x (latin capital letter t with retroflex hook - 01AE)
+0289 LATIN SMALL LETTER U BAR
+ * high central rounded vowel
+028A LATIN SMALL LETTER UPSILON
+ * semi-high back rounded vowel
+ * preferred IPA alternate to 0277
+ x (latin capital letter upsilon - 01B1)
+ x (greek small letter upsilon - 03C5)
+028B LATIN SMALL LETTER V WITH HOOK
+ = LATIN SMALL LETTER SCRIPT V
+ * voiced labiodental approximant
+ x (latin capital letter v with hook - 01B2)
+ x (greek small letter upsilon - 03C5)
+028C LATIN SMALL LETTER TURNED V
+ = caret, wedge
+ * lower-mid back unrounded vowel
+ x (greek capital letter lamda - 039B)
+ x (caret - 2038)
+ x (logical and - 2227)
+028D LATIN SMALL LETTER TURNED W
+ * voiceless rounded labiovelar approximant
+028E LATIN SMALL LETTER TURNED Y
+ * voiced lateral approximant
+028F LATIN LETTER SMALL CAPITAL Y
+ * semi-high front rounded vowel
+0290 LATIN SMALL LETTER Z WITH RETROFLEX HOOK
+ * voiced retroflex fricative
+0291 LATIN SMALL LETTER Z WITH CURL
+ * voiced alveolo-palatal laminal fricative
+ * sound spelled with 017A in Polish
+0292 LATIN SMALL LETTER EZH
+ = LATIN SMALL LETTER YOGH
+ = dram
+ * voiced postalveolar fricative
+ * uppercase is 01B7
+ * Skolt Sámi
+ x (latin small letter yogh - 021D)
+ x (cyrillic small letter abkhasian dze - 04E1)
+ x (ounce sign - 2125)
+0293 LATIN SMALL LETTER EZH WITH CURL
+ * palatalized voiced postalveolar fricative
+0294 LATIN LETTER GLOTTAL STOP
+ x (modifier letter glottal stop - 02C0)
+0295 LATIN LETTER PHARYNGEAL VOICED FRICATIVE
+ = LATIN LETTER REVERSED GLOTTAL STOP
+ * voiced pharyngeal fricative
+ * ain
+ x (latin small letter ezh reversed - 01B9)
+ x (modifier letter reversed glottal stop - 02C1)
+0296 LATIN LETTER INVERTED GLOTTAL STOP
+ * lateral click
+ x (latin letter lateral click - 01C1)
+0297 LATIN LETTER STRETCHED C
+ * palatal (or alveolar) click
+ x (latin letter retroflex click - 01C3)
+ x (complement - 2201)
+0298 LATIN LETTER BILABIAL CLICK
+ = LATIN LETTER BULLSEYE
+ x (circled dot operator - 2299)
+0299 LATIN LETTER SMALL CAPITAL B
+ * bilabial trill
+029A LATIN SMALL LETTER CLOSED OPEN E
+ = LATIN SMALL LETTER CLOSED EPSILON
+ * lower-mid front rounded vowel
+ * non-IPA alternate for the preferred 0153
+029B LATIN LETTER SMALL CAPITAL G WITH HOOK
+ * voiced uvular implosive
+029C LATIN LETTER SMALL CAPITAL H
+ * voiceless epiglottal fricative
+029D LATIN SMALL LETTER J WITH CROSSED-TAIL
+ * voiced palatal fricative
+029E LATIN SMALL LETTER TURNED K
+ * proposed for velar click
+@+ * withdrawn by IPA in 1970
+029F LATIN LETTER SMALL CAPITAL L
+ * velar lateral approximant
+02A0 LATIN SMALL LETTER Q WITH HOOK
+ * voiceless uvular implosive
+02A1 LATIN LETTER GLOTTAL STOP WITH STROKE
+ * voiced epiglottal stop
+02A2 LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE
+ * voiced epiglottal fricative
+02A3 LATIN SMALL LETTER DZ DIGRAPH
+ * voiced dental affricate
+02A4 LATIN SMALL LETTER DEZH DIGRAPH
+ * voiced postalveolar affricate
+02A5 LATIN SMALL LETTER DZ DIGRAPH WITH CURL
+ * voiced alveolo-palatal affricate
+02A6 LATIN SMALL LETTER TS DIGRAPH
+ * voiceless dental affricate
+02A7 LATIN SMALL LETTER TESH DIGRAPH
+ * voiceless postalveolar affricate
+02A8 LATIN SMALL LETTER TC DIGRAPH WITH CURL
+ * voiceless alveolo-palatal affricate
+@ IPA characters for disordered speech
+02A9 LATIN SMALL LETTER FENG DIGRAPH
+ * velopharyngeal fricative
+02AA LATIN SMALL LETTER LS DIGRAPH
+ * lateral alveolar fricative (lisp)
+02AB LATIN SMALL LETTER LZ DIGRAPH
+ * voiced lateral alveolar fricative
+02AC LATIN LETTER BILABIAL PERCUSSIVE
+ * audible lip smack
+02AD LATIN LETTER BIDENTAL PERCUSSIVE
+ * audible teeth gnashing
+@@ 02B0 Spacing Modifier Letters 02FF
+@ Phonetic modifiers derived from Latin letters
+02B0 MODIFIER LETTER SMALL H
+ * aspiration
+ # <super> 0068
+02B1 MODIFIER LETTER SMALL H WITH HOOK
+ * breathy voiced, murmured
+ x (latin small letter h with hook - 0266)
+ x (combining diaeresis below - 0324)
+ # <super> 0266
+02B2 MODIFIER LETTER SMALL J
+ * palatalization
+ x (combining palatalized hook below - 0321)
+ # <super> 006A
+02B3 MODIFIER LETTER SMALL R
+ # <super> 0072
+02B4 MODIFIER LETTER SMALL TURNED R
+ x (latin small letter turned r - 0279)
+ # <super> 0279
+02B5 MODIFIER LETTER SMALL TURNED R WITH HOOK
+ x (latin small letter turned r with hook - 027B)
+ # <super> 027B
+02B6 MODIFIER LETTER SMALL CAPITAL INVERTED R
+ * preceding four used for r-coloring or r-offglides
+ x (latin letter small capital inverted r - 0281)
+ # <super> 0281
+02B7 MODIFIER LETTER SMALL W
+ * labialization
+ x (combining inverted double arch below - 032B)
+ # <super> 0077
+02B8 MODIFIER LETTER SMALL Y
+ * palatalization
+ * common Americanist substitution for 02B2
+ # <super> 0079
+@ Miscellaneous phonetic modifiers
+02B9 MODIFIER LETTER PRIME
+ * primary stress, emphasis
+ * transliteration of mjagkij znak (Cyrillic soft sign: palatalization)
+ x (apostrophe - 0027)
+ x (acute accent - 00B4)
+ x (modifier letter acute accent - 02CA)
+ x (combining acute accent - 0301)
+ x (greek numeral sign - 0374)
+ x (prime - 2032)
+02BA MODIFIER LETTER DOUBLE PRIME
+ * exaggerated stress, contrastive stress
+ * transliteration of tverdyj znak (Cyrillic hard sign: no palatalization)
+ x (quotation mark - 0022)
+ x (combining double acute accent - 030B)
+ x (double prime - 2033)
+02BB MODIFIER LETTER TURNED COMMA
+ * typographical alternate for 02BD or 02BF
+ x (combining turned comma above - 0312)
+ x (left single quotation mark - 2018)
+02BC MODIFIER LETTER APOSTROPHE
+ = apostrophe
+ * glottal stop, glottalization, ejective
+ * spacing clone of Greek smooth breathing mark
+ * many languages use this as a letter of their alphabets
+ x (apostrophe - 0027)
+ x (combining comma above - 0313)
+ x (combining comma above right - 0315)
+ x (armenian apostrophe - 055A)
+ x (right single quotation mark - 2019)
+02BD MODIFIER LETTER REVERSED COMMA
+ * weak aspiration
+ * spacing clone of Greek rough breathing mark
+ x (combining reversed comma above - 0314)
+ x (armenian modifier letter left half ring - 0559)
+ x (single high-reversed-9 quotation mark - 201B)
+02BE MODIFIER LETTER RIGHT HALF RING
+ * transliteration of Arabic hamza (glottal stop)
+ x (armenian apostrophe - 055A)
+ x (arabic letter hamza - 0621)
+02BF MODIFIER LETTER LEFT HALF RING
+ * transliteration of Arabic ain (voiced pharyngeal fricative)
+ x (armenian modifier letter left half ring - 0559)
+ x (arabic letter ain - 0639)
+02C0 MODIFIER LETTER GLOTTAL STOP
+ * ejective or glottalized
+ * typographical alternate for 02BC or 02BE
+ x (latin letter glottal stop - 0294)
+ x (combining hook above - 0309)
+02C1 MODIFIER LETTER REVERSED GLOTTAL STOP
+ * typographical alternate for 02BF
+ x (latin letter pharyngeal voiced fricative - 0295)
+02C2 MODIFIER LETTER LEFT ARROWHEAD
+ * fronted articulation
+02C3 MODIFIER LETTER RIGHT ARROWHEAD
+ * backed articulation
+02C4 MODIFIER LETTER UP ARROWHEAD
+ * raised articulation
+ x (circumflex accent - 005E)
+ x (up arrowhead - 2303)
+02C5 MODIFIER LETTER DOWN ARROWHEAD
+ * lowered articulation
+02C6 MODIFIER LETTER CIRCUMFLEX ACCENT
+ * rising-falling tone, falling tone, secondary stress, etc.
+ x (circumflex accent - 005E)
+ x (combining circumflex accent - 0302)
+02C7 CARON (Mandarin Chinese third tone)
+ = hacek
+ * falling-rising tone
+ * Mandarin Chinese third tone
+ x (combining caron - 030C)
+02C8 MODIFIER LETTER VERTICAL LINE
+ * primary stress, downstep
+ * precedes letter or syllable modified
+ x (apostrophe - 0027)
+ x (combining vertical line above - 030D)
+02C9 MODIFIER LETTER MACRON (Mandarin Chinese first tone)
+ * high level tone
+ * precedes or follows letter or syllable modified
+ * Mandarin Chinese first tone
+ x (macron - 00AF)
+ x (combining macron - 0304)
+02CA MODIFIER LETTER ACUTE ACCENT (Mandarin Chinese second tone)
+ * high-rising tone (IPA), high tone, primary stress
+ * Mandarin Chinese second tone
+ x (acute accent - 00B4)
+ x (modifier letter prime - 02B9)
+ x (combining acute accent - 0301)
+ x (greek numeral sign - 0374)
+ x (armenian emphasis mark - 055B)
+02CB MODIFIER LETTER GRAVE ACCENT (Mandarin Chinese fourth tone)
+ * high-falling tone (IPA), low tone, secondary or tertiary stress
+ * Mandarin Chinese fourth tone
+ x (grave accent - 0060)
+ x (combining grave accent - 0300)
+ x (armenian comma - 055D)
+02CC MODIFIER LETTER LOW VERTICAL LINE
+ * secondary stress
+ * precedes letter or syllable modified
+ x (combining vertical line below - 0329)
+02CD MODIFIER LETTER LOW MACRON
+ * low level tone
+ x (low line - 005F)
+ x (combining macron below - 0331)
+02CE MODIFIER LETTER LOW GRAVE ACCENT
+ * low-falling tone
+02CF MODIFIER LETTER LOW ACUTE ACCENT
+ * low-rising tone
+ x (greek lower numeral sign - 0375)
+02D0 MODIFIER LETTER TRIANGULAR COLON
+ * length mark
+ x (colon - 003A)
+02D1 MODIFIER LETTER HALF TRIANGULAR COLON
+ * half-length mark
+ x (middle dot - 00B7)
+02D2 MODIFIER LETTER CENTRED RIGHT HALF RING
+ * more rounded articulation
+02D3 MODIFIER LETTER CENTRED LEFT HALF RING
+ * less rounded articulation
+02D4 MODIFIER LETTER UP TACK
+ * vowel raising or closing
+ x (combining up tack below - 031D)
+ x (combining dot below - 0323)
+02D5 MODIFIER LETTER DOWN TACK
+ * vowel lowering or opening
+ x (combining left half ring below - 031C)
+ x (combining down tack below - 031E)
+02D6 MODIFIER LETTER PLUS SIGN
+ * advanced or fronted articulation
+ x (combining plus sign below - 031F)
+02D7 MODIFIER LETTER MINUS SIGN
+ * retracted or backed articulation
+ * glyph may have small end-serifs
+ x (combining minus sign below - 0320)
+@ Spacing clones of diacritics
+02D8 BREVE
+ x (combining breve - 0306)
+ # 0020 0306
+02D9 DOT ABOVE (Mandarin Chinese light tone)
+ * Mandarin Chinese fifth tone (light or neutral)
+ x (combining dot above - 0307)
+ # 0020 0307
+02DA RING ABOVE
+ x (degree sign - 00B0)
+ x (combining ring above - 030A)
+ # 0020 030A
+02DB OGONEK
+ x (combining ogonek - 0328)
+ # 0020 0328
+02DC SMALL TILDE
+ x (tilde - 007E)
+ x (combining tilde - 0303)
+ x (tilde operator - 223C)
+ # 0020 0303
+02DD DOUBLE ACUTE ACCENT
+ x (combining double acute accent - 030B)
+ # 0020 030B
+@ Additions based on 1989 IPA
+02DE MODIFIER LETTER RHOTIC HOOK
+ * rhotacization in vowel
+ * often ligated: 025A = 0259 + 02DE; 025D = 025C + 02DE
+02DF MODIFIER LETTER CROSS ACCENT
+ * Swedish grave accent
+02E0 MODIFIER LETTER SMALL GAMMA
+ * these modifier letters are occasionally used in transcription of affricates
+ # <super> 0263
+02E1 MODIFIER LETTER SMALL L
+ # <super> 006C
+02E2 MODIFIER LETTER SMALL S
+ # <super> 0073
+02E3 MODIFIER LETTER SMALL X
+ # <super> 0078
+02E4 MODIFIER LETTER SMALL REVERSED GLOTTAL STOP
+ # <super> 0295
+@ Tone letters
+02E5 MODIFIER LETTER EXTRA-HIGH TONE BAR
+02E6 MODIFIER LETTER HIGH TONE BAR
+02E7 MODIFIER LETTER MID TONE BAR
+02E8 MODIFIER LETTER LOW TONE BAR
+02E9 MODIFIER LETTER EXTRA-LOW TONE BAR
+02EA MODIFIER LETTER YIN DEPARTING TONE MARK
+02EB MODIFIER LETTER YANG DEPARTING TONE MARK
+@ IPA modifiers
+02EC MODIFIER LETTER VOICING
+02ED MODIFIER LETTER UNASPIRATED
+@ Other modifier letters
+02EE MODIFIER LETTER DOUBLE APOSTROPHE
+
+2000 EN QUAD
+ : 2002 en space
+2001 EM QUAD
+ = mutton quad
+ : 2003 em space
+2002 EN SPACE
+ = nut
+ * half an em
+ # 0020 space
+2003 EM SPACE
+ = mutton
+ * nominally, a space equal to the type size in points
+ * may scale by the condensation factor of a font
+ # 0020 space
+2004 THREE-PER-EM SPACE
+ = thick space
+ # 0020 space
+2005 FOUR-PER-EM SPACE
+ = mid space
+ # 0020 space
+2006 SIX-PER-EM SPACE
+ * in computer typography sometimes equated to thin space
+ # 0020 space
+2007 FIGURE SPACE
+ * space equal to tabular width of a font
+ * this is equivalent to the digit width of fonts with fixed-width digits
+ # <noBreak> 0020
+2008 PUNCTUATION SPACE
+ * space equal to narrow punctuation of a font
+ # 0020 space
+2009 THIN SPACE
+ * a fifth of an em (or sometimes a sixth)
+ # 0020 space
+200A HAIR SPACE
+ * thinner than a thin space
+ * in traditional typography, the thinnest space available
+ # 0020 space
+200B ZERO WIDTH SPACE
+ * nominally zero width, but may expand in justification
+@ Formatting characters
+200C ZERO WIDTH NON-JOINER
+ = ZWNJ
+200D ZERO WIDTH JOINER
+ = ZWJ
+200E LEFT-TO-RIGHT MARK
+ = LRM
+200F RIGHT-TO-LEFT MARK
+ = RLM
+@ Dashes
+2010 HYPHEN
+ x (hyphen-minus - 002D)
+2011 NON-BREAKING HYPHEN
+ x (hyphen-minus - 002D)
+ # <noBreak> 2010
+2012 FIGURE DASH
+2013 EN DASH
+2014 EM DASH
+ * may be used in pairs to offset parenthetical text
+ x (katakana-hiragana prolonged sound mark - 30FC)
+2015 HORIZONTAL BAR
+ = QUOTATION DASH
+ * long dash introducing quoted text
+@ General punctuation
+2016 DOUBLE VERTICAL LINE
+ * used in pairs to indicate norm of a matrix
+ x (parallel to - 2225)
+2017 DOUBLE LOW LINE
+ * this is a spacing character
+ x (low line - 005F)
+ x (combining double low line - 0333)
+ # 0020 0333
+2018 LEFT SINGLE QUOTATION MARK
+ = SINGLE TURNED COMMA QUOTATION MARK
+ * this is the preferred glyph (as opposed to 201B)
+ x (apostrophe - 0027)
+ x (modifier letter turned comma - 02BB)
+ x (heavy single turned comma quotation mark ornament - 275B)
+2019 RIGHT SINGLE QUOTATION MARK
+ = SINGLE COMMA QUOTATION MARK
+ * this is the preferred character to use for apostrophe
+ x (apostrophe - 0027)
+ x (modifier letter apostrophe - 02BC)
+ x (heavy single comma quotation mark ornament - 275C)
+201A SINGLE LOW-9 QUOTATION MARK
+ = LOW SINGLE COMMA QUOTATION MARK
+ * used as opening single quotation mark in some languages
+201B SINGLE HIGH-REVERSED-9 QUOTATION MARK
+ = SINGLE REVERSED COMMA QUOTATION MARK
+ * glyph variant of 2018
+ x (modifier letter reversed comma - 02BD)
+201C LEFT DOUBLE QUOTATION MARK
+ = DOUBLE TURNED COMMA QUOTATION MARK
+ * this is the preferred glyph (as opposed to 201F)
+ x (quotation mark - 0022)
+ x (heavy double turned comma quotation mark ornament - 275D)
+ x (reversed double prime quotation mark - 301D)
+201D RIGHT DOUBLE QUOTATION MARK
+ = DOUBLE COMMA QUOTATION MARK
+ x (quotation mark - 0022)
+ x (double prime - 2033)
+ x (heavy double comma quotation mark ornament - 275E)
+ x (double prime quotation mark - 301E)
+201E DOUBLE LOW-9 QUOTATION MARK
+ = LOW DOUBLE COMMA QUOTATION MARK
+ * used as opening double quotation mark in some languages
+ x (low double prime quotation mark - 301F)
+201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK
+ = DOUBLE REVERSED COMMA QUOTATION MARK
+ * glyph variant of 201C
+2020 DAGGER
+ = obelisk, obelus, long cross
+2021 DOUBLE DAGGER
+ = diesis, double obelisk
+2022 BULLET
+ = black small circle
+ x (middle dot - 00B7)
+ x (one dot leader - 2024)
+ x (bullet operator - 2219)
+ x (inverse bullet - 25D8)
+ x (white bullet - 25E6)
+2023 TRIANGULAR BULLET
+ x (end of proof - 220E)
+ x (black right-pointing small triangle - 25B8)
+2024 ONE DOT LEADER
+ x (middle dot - 00B7)
+ x (bullet - 2022)
+ x (bullet operator - 2219)
+ # 002E full stop
+2025 TWO DOT LEADER
+ # 002E 002E
+2026 HORIZONTAL ELLIPSIS
+ = three dot leader
+ x (vertical ellipsis - 22EE)
+ # 002E 002E 002E
+2027 HYPHENATION POINT
+@ Formatting characters
+2028 LINE SEPARATOR
+ * may be used to represent this semantic unambiguously
+2029 PARAGRAPH SEPARATOR
+ * may be used to represent this semantic unambiguously
+202A LEFT-TO-RIGHT EMBEDDING
+ = LRE
+202B RIGHT-TO-LEFT EMBEDDING
+ = RLE
+202C POP DIRECTIONAL FORMATTING
+ = PDF
+202D LEFT-TO-RIGHT OVERRIDE
+ = LRO
+202E RIGHT-TO-LEFT OVERRIDE
+ = RLO
+202F NARROW NO-BREAK SPACE
+ x (no-break space - 00A0)
+ # <noBreak> 0020
+@ General punctuation
+2030 PER MILLE SIGN
+ x (percent sign - 0025)
+2031 PER TEN THOUSAND SIGN
+ x (percent sign - 0025)
+2032 PRIME
+ = minutes, feet
+ x (apostrophe - 0027)
+ x (acute accent - 00B4)
+ x (modifier letter prime - 02B9)
+2033 DOUBLE PRIME
+ = seconds, inches
+ x (quotation mark - 0022)
+ x (modifier letter double prime - 02BA)
+ x (right double quotation mark - 201D)
+ x (ditto mark - 3003)
+ x (double prime quotation mark - 301E)
+ # 2032 2032
+2034 TRIPLE PRIME
+ # 2032 2032 2032
+2035 REVERSED PRIME
+ x (grave accent - 0060)
+2036 REVERSED DOUBLE PRIME
+ x (reversed double prime quotation mark - 301D)
+ # 2035 2035
+2037 REVERSED TRIPLE PRIME
+ # 2035 2035 2035
+2038 CARET
+ x (up arrowhead - 2303)
+2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK
+ = LEFT POINTING SINGLE GUILLEMET
+ * usually opening, sometimes closing
+ x (less-than sign - 003C)
+ x (left-pointing angle bracket - 2329)
+ x (left angle bracket - 3008)
+203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
+ = RIGHT POINTING SINGLE GUILLEMET
+ * usually closing, sometimes opening
+ x (greater-than sign - 003E)
+ x (right-pointing angle bracket - 232A)
+ x (right angle bracket - 3009)
+203B REFERENCE MARK
+ = Japanese kome
+ = Urdu paragraph separator
+ x (tibetan ku ru kha bzhi mig can - 0FBF)
+203C DOUBLE EXCLAMATION MARK
+ x (exclamation mark - 0021)
+ # 0021 0021
+203D INTERROBANG
+ x (exclamation mark - 0021)
+ x (question mark - 003F)
+203E OVERLINE
+ = SPACING OVERSCORE
+ # 0020 0305
+203F UNDERTIE (Enotikon)
+ = Greek enotikon
+ x (smile - 2323)
+2040 CHARACTER TIE
+ x (frown - 2322)
+2041 CARET INSERTION POINT
+ * proofreader's mark: insert here
+ x (right semidirect product - 22CC)
+2042 ASTERISM
+2043 HYPHEN BULLET
+2044 FRACTION SLASH
+ = solidus (in typography)
+ * for composing arbitrary fractions
+ x (solidus - 002F)
+ x (division slash - 2215)
+2045 LEFT SQUARE BRACKET WITH QUILL
+2046 RIGHT SQUARE BRACKET WITH QUILL
+2048 QUESTION EXCLAMATION MARK
+ * designed for use in vertical text
+ # 003F 0021
+2049 EXCLAMATION QUESTION MARK
+ * designed for use in vertical text
+ # 0021 003F
+204A TIRONIAN SIGN ET
+ * Irish Gaelic, ...
+204B REVERSED PILCROW SIGN
+ x (pilcrow sign - 00B6)
+204C BLACK LEFTWARDS BULLET
+204D BLACK RIGHTWARDS BULLET
+@ Deprecated
+206A INHIBIT SYMMETRIC SWAPPING
+206B ACTIVATE SYMMETRIC SWAPPING
+206C INHIBIT ARABIC FORM SHAPING
+206D ACTIVATE ARABIC FORM SHAPING
+206E NATIONAL DIGIT SHAPES
+206F NOMINAL DIGIT SHAPES
+@@ 2070 Superscripts and Subscripts 209F
+@ Superscripts
+2070 SUPERSCRIPT ZERO
+ # <super> 0030
+2071 <reserved>
+ x (superscript one - 00B9)
+2072 <reserved>
+ x (superscript two - 00B2)
+2073 <reserved>
+ x (superscript three - 00B3)
+2074 SUPERSCRIPT FOUR
+ # <super> 0034
+2075 SUPERSCRIPT FIVE
+ # <super> 0035
+2076 SUPERSCRIPT SIX
+ # <super> 0036
+2077 SUPERSCRIPT SEVEN
+ # <super> 0037
+2078 SUPERSCRIPT EIGHT
+ # <super> 0038
+2079 SUPERSCRIPT NINE
+ # <super> 0039
+207A SUPERSCRIPT PLUS SIGN
+ # <super> 002B
+207B SUPERSCRIPT MINUS
+ # <super> 2212
+207C SUPERSCRIPT EQUALS SIGN
+ # <super> 003D
+207D SUPERSCRIPT LEFT PARENTHESIS
+ # <super> 0028
+207E SUPERSCRIPT RIGHT PARENTHESIS
+ # <super> 0029
+207F SUPERSCRIPT LATIN SMALL LETTER N
+ # <super> 006E
+@ Subscripts
+2080 SUBSCRIPT ZERO
+ # <sub> 0030
+2081 SUBSCRIPT ONE
+ # <sub> 0031
+2082 SUBSCRIPT TWO
+ # <sub> 0032
+2083 SUBSCRIPT THREE
+ # <sub> 0033
+2084 SUBSCRIPT FOUR
+ # <sub> 0034
+2085 SUBSCRIPT FIVE
+ # <sub> 0035
+2086 SUBSCRIPT SIX
+ # <sub> 0036
+2087 SUBSCRIPT SEVEN
+ # <sub> 0037
+2088 SUBSCRIPT EIGHT
+ # <sub> 0038
+2089 SUBSCRIPT NINE
+ # <sub> 0039
+208A SUBSCRIPT PLUS SIGN
+ # <sub> 002B
+208B SUBSCRIPT MINUS
+ # <sub> 2212
+208C SUBSCRIPT EQUALS SIGN
+ # <sub> 003D
+208D SUBSCRIPT LEFT PARENTHESIS
+ # <sub> 0028
+208E SUBSCRIPT RIGHT PARENTHESIS
+ # <sub> 0029
+@@ 20A0 Currency Symbols 20CF
+@ Currency symbols
+@+ A number of currency symbols are found in other blocks.
+ x (dollar sign - 0024)
+ x (cent sign - 00A2)
+ x (pound sign - 00A3)
+ x (currency sign - 00A4)
+ x (yen sign - 00A5)
+ x (bengali rupee mark - 09F2)
+ x (bengali rupee sign - 09F3)
+ x (thai currency symbol baht - 0E3F)
+ x (khmer currency symbol riel - 17DB)
+20A0 EURO-CURRENCY SIGN
+ * intended for ECU, but not widely used
+ * historical character, this is NOT the euro!
+ x (euro sign - 20AC)
+20A1 COLON SIGN
+ * Costa Rica, El Salvador
+20A2 CRUZEIRO SIGN
+ * Brazil
+20A3 FRENCH FRANC SIGN
+ * France
+20A4 LIRA SIGN
+ * Italy, Turkey
+ x (pound sign - 00A3)
+20A5 MILL SIGN
+ * USA (1/10 cent)
+20A6 NAIRA SIGN
+ * Nigeria
+20A7 PESETA SIGN
+ * Spain
+20A8 RUPEE SIGN
+ * India
+ # 0052 0073
+20A9 WON SIGN
+ * Korea
+20AA NEW SHEQEL SIGN
+ * Israel
+20AB DONG SIGN
+ * Vietnam
+20AC EURO SIGN
+ * currency sign for the European Monetary Union
+ * euro, not ECU
+ x (euro-currency sign - 20A0)
+20AD KIP SIGN
+ * Laos
+20AE TUGRIK SIGN
+ * Mongolia
+ * also transliterated as tugrug, tugric, tugrog, togrog
+20AF DRACHMA SIGN
+ * Greece
+@@ 20D0 Combining Diacritical Marks for Symbols 20FF
+@ Combining diacritical marks for symbols
+20D0 COMBINING LEFT HARPOON ABOVE
+20D1 COMBINING RIGHT HARPOON ABOVE
+ * vector
+20D2 COMBINING LONG VERTICAL LINE OVERLAY
+20D3 COMBINING SHORT VERTICAL LINE OVERLAY
+ * negation
+20D4 COMBINING ANTICLOCKWISE ARROW ABOVE
+20D5 COMBINING CLOCKWISE ARROW ABOVE
+ * rotation
+20D6 COMBINING LEFT ARROW ABOVE
+20D7 COMBINING RIGHT ARROW ABOVE
+ * vector
+20D8 COMBINING RING OVERLAY
+20D9 COMBINING CLOCKWISE RING OVERLAY
+20DA COMBINING ANTICLOCKWISE RING OVERLAY
+20DB COMBINING THREE DOTS ABOVE
+ = third derivative
+20DC COMBINING FOUR DOTS ABOVE
+ = fourth derivative
+@ Enclosing diacritics
+20DD COMBINING ENCLOSING CIRCLE
+ = JIS composition circle
+ x (white circle - 25CB)
+ x (large circle - 25EF)
+ x (ideographic number zero - 3007)
+20DE COMBINING ENCLOSING SQUARE
+ x (white square - 25A1)
+20DF COMBINING ENCLOSING DIAMOND
+ x (white diamond - 25C7)
+20E0 COMBINING ENCLOSING CIRCLE BACKSLASH
+ * prohibition
+@ Additional diacritical mark for symbols
+20E1 COMBINING LEFT RIGHT ARROW ABOVE
+ * tensor
+@ Additional enclosing diacritics
+20E2 COMBINING ENCLOSING SCREEN
+ x (clear screen symbol - 239A)
+20E3 COMBINING ENCLOSING KEYCAP
+
+*/
+