//
// CHARNAMES.CPP
//
// A header file that links Unicode character names to character numbers.
// by James L. Hammons
// (C) 2004 Underground Software
//
// JLH = James L. Hammons <jlhamm@acm.org>
//
// Who When What
// --- ---------- -------------------------------------------------------------
// JLH ??/??/200? Created this file
//

//
// macStdNames: table of glyph names stored as length-prefixed strings.
//
// Layout: each entry is one length byte followed by exactly that many name
// characters; entries are packed back to back with no per-entry terminator.
// Because the initializer is a single (concatenated) string literal, the
// compiler appends one 0 byte after the last entry, which reads as a
// zero-length entry and can serve as an end-of-table marker.
//
// The table holds 258 entries, and their order follows the standard Macintosh
// glyph ordering (index 0 = ".notdef" ... index 257). Several names use older
// spellings ("CR", "mu1", "Ohm", "increment", "nbspace", "applelogo",
// "overscore", "Idot", "dmacron"); they are kept exactly as they were.
// NOTE(review): confirm whether consumers expect these older spellings.
//
// Each length byte is written as its own literal ("\x07" ".notdef") on
// purpose: a \x escape consumes every following hex digit, so a name that
// starts with a-f / A-F must not share a literal with the escape.
//
unsigned char macStdNames[] = {
    // 0-2: special glyphs
    "\x07" ".notdef"
    "\x05" ".null"
    "\x02" "CR"
    // 3-97: space through asciitilde
    "\x05" "space"
    "\x06" "exclam"
    "\x08" "quotedbl"
    "\x0A" "numbersign"
    "\x06" "dollar"
    "\x07" "percent"
    "\x09" "ampersand"
    "\x0B" "quotesingle"
    "\x09" "parenleft"
    "\x0A" "parenright"
    "\x08" "asterisk"
    "\x04" "plus"
    "\x05" "comma"
    "\x06" "hyphen"
    "\x06" "period"
    "\x05" "slash"
    "\x04" "zero"
    "\x03" "one"
    "\x03" "two"
    "\x05" "three"
    "\x04" "four"
    "\x04" "five"
    "\x03" "six"
    "\x05" "seven"
    "\x05" "eight"
    "\x04" "nine"
    "\x05" "colon"
    "\x09" "semicolon"
    "\x04" "less"
    "\x05" "equal"
    "\x07" "greater"
    "\x08" "question"
    "\x02" "at"
    "\x01" "A"
    "\x01" "B"
    "\x01" "C"
    "\x01" "D"
    "\x01" "E"
    "\x01" "F"
    "\x01" "G"
    "\x01" "H"
    "\x01" "I"
    "\x01" "J"
    "\x01" "K"
    "\x01" "L"
    "\x01" "M"
    "\x01" "N"
    "\x01" "O"
    "\x01" "P"
    "\x01" "Q"
    "\x01" "R"
    "\x01" "S"
    "\x01" "T"
    "\x01" "U"
    "\x01" "V"
    "\x01" "W"
    "\x01" "X"
    "\x01" "Y"
    "\x01" "Z"
    "\x0B" "bracketleft"
    "\x09" "backslash"
    "\x0C" "bracketright"
    "\x0B" "asciicircum"
    "\x0A" "underscore"
    "\x05" "grave"
    "\x01" "a"
    "\x01" "b"
    "\x01" "c"
    "\x01" "d"
    "\x01" "e"
    "\x01" "f"
    "\x01" "g"
    "\x01" "h"
    "\x01" "i"
    "\x01" "j"
    "\x01" "k"
    "\x01" "l"
    "\x01" "m"
    "\x01" "n"
    "\x01" "o"
    "\x01" "p"
    "\x01" "q"
    "\x01" "r"
    "\x01" "s"
    "\x01" "t"
    "\x01" "u"
    "\x01" "v"
    "\x01" "w"
    "\x01" "x"
    "\x01" "y"
    "\x01" "z"
    "\x09" "braceleft"
    "\x03" "bar"
    "\x0A" "braceright"
    "\x0A" "asciitilde"
    // 98-257: accented letters, symbols and punctuation
    "\x09" "Adieresis"
    "\x05" "Aring"
    "\x08" "Ccedilla"
    "\x06" "Eacute"
    "\x06" "Ntilde"
    "\x09" "Odieresis"
    "\x09" "Udieresis"
    "\x06" "aacute"
    "\x06" "agrave"
    "\x0B" "acircumflex"
    "\x09" "adieresis"
    "\x06" "atilde"
    "\x05" "aring"
    "\x08" "ccedilla"
    "\x06" "eacute"
    "\x06" "egrave"
    "\x0B" "ecircumflex"
    "\x09" "edieresis"
    "\x06" "iacute"
    "\x06" "igrave"
    "\x0B" "icircumflex"
    "\x09" "idieresis"
    "\x06" "ntilde"
    "\x06" "oacute"
    "\x06" "ograve"
    "\x0B" "ocircumflex"
    "\x09" "odieresis"
    "\x06" "otilde"
    "\x06" "uacute"
    "\x06" "ugrave"
    "\x0B" "ucircumflex"
    "\x09" "udieresis"
    "\x06" "dagger"
    "\x06" "degree"
    "\x04" "cent"
    "\x08" "sterling"
    "\x07" "section"
    "\x06" "bullet"
    "\x09" "paragraph"
    "\x0A" "germandbls"
    "\x0A" "registered"
    "\x09" "copyright"
    "\x09" "trademark"
    "\x05" "acute"
    "\x08" "dieresis"
    "\x08" "notequal"
    "\x02" "AE"
    "\x06" "Oslash"
    "\x08" "infinity"
    "\x09" "plusminus"
    "\x09" "lessequal"
    "\x0C" "greaterequal"
    "\x03" "yen"
    "\x03" "mu1"
    "\x0B" "partialdiff"
    "\x09" "summation"
    "\x07" "product"
    "\x02" "pi"
    "\x08" "integral"
    "\x0B" "ordfeminine"
    "\x0C" "ordmasculine"
    "\x03" "Ohm"
    "\x02" "ae"
    "\x06" "oslash"
    "\x0C" "questiondown"
    "\x0A" "exclamdown"
    "\x0A" "logicalnot"
    "\x07" "radical"
    "\x06" "florin"
    "\x0B" "approxequal"
    "\x09" "increment"
    "\x0D" "guillemotleft"
    "\x0E" "guillemotright"
    "\x08" "ellipsis"
    "\x07" "nbspace"
    "\x06" "Agrave"
    "\x06" "Atilde"
    "\x06" "Otilde"
    "\x02" "OE"
    "\x02" "oe"
    "\x06" "endash"
    "\x06" "emdash"
    "\x0C" "quotedblleft"
    "\x0D" "quotedblright"
    "\x09" "quoteleft"
    "\x0A" "quoteright"
    "\x06" "divide"
    "\x07" "lozenge"
    "\x09" "ydieresis"
    "\x09" "Ydieresis"
    "\x08" "fraction"
    "\x08" "currency"
    "\x0D" "guilsinglleft"
    "\x0E" "guilsinglright"
    "\x02" "fi"
    "\x02" "fl"
    "\x09" "daggerdbl"
    "\x0E" "periodcentered"
    "\x0E" "quotesinglbase"
    "\x0C" "quotedblbase"
    "\x0B" "perthousand"
    "\x0B" "Acircumflex"
    "\x0B" "Ecircumflex"
    "\x06" "Aacute"
    "\x09" "Edieresis"
    "\x06" "Egrave"
    "\x06" "Iacute"
    "\x0B" "Icircumflex"
    "\x09" "Idieresis"
    "\x06" "Igrave"
    "\x06" "Oacute"
    "\x0B" "Ocircumflex"
    "\x09" "applelogo"
    "\x06" "Ograve"
    "\x06" "Uacute"
    "\x0B" "Ucircumflex"
    "\x06" "Ugrave"
    "\x08" "dotlessi"
    "\x0A" "circumflex"
    "\x05" "tilde"
    "\x09" "overscore"
    "\x05" "breve"
    "\x09" "dotaccent"
    "\x04" "ring"
    "\x07" "cedilla"
    "\x0C" "hungarumlaut"
    "\x06" "ogonek"
    "\x05" "caron"
    "\x06" "Lslash"
    "\x06" "lslash"
    "\x06" "Scaron"
    "\x06" "scaron"
    "\x06" "Zcaron"
    "\x06" "zcaron"
    "\x09" "brokenbar"
    "\x03" "Eth"
    "\x03" "eth"
    "\x06" "Yacute"
    "\x06" "yacute"
    "\x05" "Thorn"
    "\x05" "thorn"
    "\x05" "minus"
    "\x08" "multiply"
    "\x0B" "onesuperior"
    "\x0B" "twosuperior"
    "\x0D" "threesuperior"
    "\x07" "onehalf"
    "\x0A" "onequarter"
    "\x0D" "threequarters"
    "\x05" "franc"
    "\x06" "Gbreve"
    "\x06" "gbreve"
    "\x04" "Idot"
    "\x08" "Scedilla"
    "\x08" "scedilla"
    "\x06" "Cacute"
    "\x06" "cacute"
    "\x06" "Ccaron"
    "\x06" "ccaron"
    "\x07" "dmacron"
};

/*struct unicodeChar
{
    int cNum;

};*/

//
// unicodeChars: packed table of character numbers and lowercase names.
//
// Each record is two bytes of character number, high byte first (0x00 0x20
// for "space"), followed by the name and an explicit NUL terminator. Records
// are packed back to back. The initializer is one concatenated string
// literal, so the compiler adds one more 0 byte after the last record.
//
// The code-point bytes are kept in their own literal, separate from the name:
// a \x escape consumes every following hex digit, and a name such as
// "exclamation mark" begins with one.
//
// Only 0x0020-0x0023 are present so far.
//
unsigned char unicodeChars[] = {
    "\x00\x20" "space\0"
    "\x00\x21" "exclamation mark\0"
    "\x00\x22" "quotation mark\0"
    "\x00\x23" "number sign\0"
};

/*
+\r
+0023 NUMBER SIGN\r
+ = pound sign, hash, crosshatch, octothorpe\r
+0024 DOLLAR SIGN\r
+ = milreis, escudo\r
+ * glyph may have one or two vertical bars\r
+ * other currency symbol characters: 20A0-20AF\r
+ x (currency sign - 00A4)\r
+0025 PERCENT SIGN\r
+ x (arabic percent sign - 066A)\r
+ x (per mille sign - 2030)\r
+ x (per ten thousand sign - 2031)\r
+0026 AMPERSAND\r
+0027 APOSTROPHE\r
+ = APOSTROPHE-QUOTE\r
+ = APL quote\r
+ * neutral (vertical) glyph having mixed usage\r
+ * preferred character for apostrophe is 2019\r
+ * preferred characters in English for paired quotation marks are 2018 & 2019\r
+ x (modifier letter prime - 02B9)\r
+ x (modifier letter apostrophe - 02BC)\r
+ x (modifier letter vertical line - 02C8)\r
+ x (combining acute accent - 0301)\r
+ x (prime - 2032)\r
+0028 LEFT PARENTHESIS\r
+ = OPENING PARENTHESIS\r
+0029 RIGHT PARENTHESIS\r
+ = CLOSING PARENTHESIS\r
+ * see discussion on semantics of paired bracketing characters\r
+002A ASTERISK\r
+ = star (on phone keypads)\r
+ x (arabic five pointed star - 066D)\r
+ x (asterisk operator - 2217)\r
+ x (heavy asterisk - 2731)\r
+002B PLUS SIGN\r
+002C COMMA\r
+ = decimal separator\r
+ x (arabic comma - 060C)\r
+ x (single low-9 quotation mark - 201A)\r
+ x (ideographic comma - 3001)\r
+002D HYPHEN-MINUS\r
+ = hyphen or minus sign\r
+ * used for either hyphen or minus sign\r
+ x (hyphen - 2010)\r
+ x (non-breaking hyphen - 2011)\r
+ x (figure dash - 2012)\r
+ x (en dash - 2013)\r
+ x (minus sign - 2212)\r
+002E FULL STOP\r
+ = PERIOD\r
+ = dot, decimal point\r
+ * may be rendered as a raised decimal point in old style numbers\r
+ x (arabic full stop - 06D4)\r
+ x (ideographic full stop - 3002)\r
+002F SOLIDUS\r
+ = SLASH\r
+ = virgule, shilling (British)\r
+ x (latin letter dental click - 01C0)\r
+ x (combining long solidus overlay - 0338)\r
+ x (fraction slash - 2044)\r
+ x (division slash - 2215)\r
+0030 DIGIT ZERO\r
+0031 DIGIT ONE\r
+0032 DIGIT TWO\r
+0033 DIGIT THREE\r
+0034 DIGIT FOUR\r
+0035 DIGIT FIVE\r
+0036 DIGIT SIX\r
+0037 DIGIT SEVEN\r
+0038 DIGIT EIGHT\r
+0039 DIGIT NINE\r
+003A COLON\r
+ x (armenian full stop - 0589)\r
+ x (hebrew punctuation sof pasuq - 05C3)\r
+ x (ratio - 2236)\r
+003B SEMICOLON\r
+ x (greek question mark - 037E)\r
+ x (arabic semicolon - 061B)\r
+003C LESS-THAN SIGN\r
+ x (single left-pointing angle quotation mark - 2039)\r
+ x (left-pointing angle bracket - 2329)\r
+ x (left angle bracket - 3008)\r
+003D EQUALS SIGN\r
+ * other related characters: 2241-2263\r
+ x (not equal to - 2260)\r
+ x (identical to - 2261)\r
+003E GREATER-THAN SIGN\r
+ x (single right-pointing angle quotation mark - 203A)\r
+ x (right-pointing angle bracket - 232A)\r
+ x (right angle bracket - 3009)\r
+003F QUESTION MARK\r
+ x (inverted question mark - 00BF)\r
+ x (greek question mark - 037E)\r
+ x (arabic question mark - 061F)\r
+ x (interrobang - 203D)\r
+ x (question exclamation mark - 2048)\r
+ x (exclamation question mark - 2049)\r
+0040 COMMERCIAL AT\r
+0041 LATIN CAPITAL LETTER A\r
+0042 LATIN CAPITAL LETTER B\r
+ x (script capital b - 212C)\r
+0043 LATIN CAPITAL LETTER C\r
+ x (double-struck capital c - 2102)\r
+ x (black-letter capital c - 212D)\r
+0044 LATIN CAPITAL LETTER D\r
+0045 LATIN CAPITAL LETTER E\r
+ x (euler constant - 2107)\r
+ x (script capital e - 2130)\r
+0046 LATIN CAPITAL LETTER F\r
+ x (script capital f - 2131)\r
+ x (turned capital f - 2132)\r
+0047 LATIN CAPITAL LETTER G\r
+0048 LATIN CAPITAL LETTER H\r
+ x (script capital h - 210B)\r
+ x (black-letter capital h - 210C)\r
+ x (double-struck capital h - 210D)\r
+0049 LATIN CAPITAL LETTER I\r
+ * Turkish and Azerbaijani use 0131 for lowercase\r
+ x (latin capital letter i with dot above - 0130)\r
+ x (cyrillic capital letter byelorussian-ukrainian i - 0406)\r
+ x (cyrillic letter palochka - 04C0)\r
+ x (script capital i - 2110)\r
+ x (black-letter capital i - 2111)\r
+ x (roman numeral one - 2160)\r
+004A LATIN CAPITAL LETTER J\r
+004B LATIN CAPITAL LETTER K\r
+ x (kelvin sign - 212A)\r
+004C LATIN CAPITAL LETTER L\r
+ x (script capital l - 2112)\r
+004D LATIN CAPITAL LETTER M\r
+ x (script capital m - 2133)\r
+004E LATIN CAPITAL LETTER N\r
+ x (double-struck capital n - 2115)\r
+004F LATIN CAPITAL LETTER O\r
+0050 LATIN CAPITAL LETTER P\r
+ x (double-struck capital p - 2119)\r
+0051 LATIN CAPITAL LETTER Q\r
+ x (double-struck capital q - 211A)\r
+0052 LATIN CAPITAL LETTER R\r
+ x (script capital r - 211B)\r
+ x (black-letter capital r - 211C)\r
+ x (double-struck capital r - 211D)\r
+0053 LATIN CAPITAL LETTER S\r
+0054 LATIN CAPITAL LETTER T\r
+0055 LATIN CAPITAL LETTER U\r
+0056 LATIN CAPITAL LETTER V\r
+0057 LATIN CAPITAL LETTER W\r
+0058 LATIN CAPITAL LETTER X\r
+0059 LATIN CAPITAL LETTER Y\r
+005A LATIN CAPITAL LETTER Z\r
+ x (double-struck capital z - 2124)\r
+ x (black-letter capital z - 2128)\r
+005B LEFT SQUARE BRACKET\r
+ = OPENING SQUARE BRACKET\r
+ * other bracket characters: 3008-301B\r
+005C REVERSE SOLIDUS\r
+ = BACKSLASH\r
+ x (set minus - 2216)\r
+005D RIGHT SQUARE BRACKET\r
+ = CLOSING SQUARE BRACKET\r
+005E CIRCUMFLEX ACCENT\r
+ * this is a spacing character\r
+ x (modifier letter up arrowhead - 02C4)\r
+ x (modifier letter circumflex accent - 02C6)\r
+ x (combining circumflex accent - 0302)\r
+ x (up arrowhead - 2303)\r
+005F LOW LINE\r
+ = SPACING UNDERSCORE\r
+ * this is a spacing character\r
+ x (modifier letter low macron - 02CD)\r
+ x (combining macron below - 0331)\r
+ x (combining low line - 0332)\r
+ x (double low line - 2017)\r
+0060 GRAVE ACCENT\r
+ * this is a spacing character\r
+ x (modifier letter grave accent - 02CB)\r
+ x (combining grave accent - 0300)\r
+ x (reversed prime - 2035)\r
+0061 LATIN SMALL LETTER A\r
+0062 LATIN SMALL LETTER B\r
+0063 LATIN SMALL LETTER C\r
+0064 LATIN SMALL LETTER D\r
+0065 LATIN SMALL LETTER E\r
+ x (estimated symbol - 212E)\r
+ x (script small e - 212F)\r
+0066 LATIN SMALL LETTER F\r
+0067 LATIN SMALL LETTER G\r
+ x (latin small letter script g - 0261)\r
+ x (script small g - 210A)\r
+0068 LATIN SMALL LETTER H\r
+ x (cyrillic small letter shha - 04BB)\r
+ x (planck constant - 210E)\r
+0069 LATIN SMALL LETTER I\r
+ * Turkish and Azerbaijani use 0130 for uppercase\r
+ x (latin small letter dotless i - 0131)\r
+006A LATIN SMALL LETTER J\r
+006B LATIN SMALL LETTER K\r
+006C LATIN SMALL LETTER L\r
+ x (script small l - 2113)\r
+006D LATIN SMALL LETTER M\r
+006E LATIN SMALL LETTER N\r
+ x (superscript latin small letter n - 207F)\r
+006F LATIN SMALL LETTER O\r
+ x (script small o - 2134)\r
+0070 LATIN SMALL LETTER P\r
+0071 LATIN SMALL LETTER Q\r
+0072 LATIN SMALL LETTER R\r
+0073 LATIN SMALL LETTER S\r
+0074 LATIN SMALL LETTER T\r
+0075 LATIN SMALL LETTER U\r
+0076 LATIN SMALL LETTER V\r
+0077 LATIN SMALL LETTER W\r
+0078 LATIN SMALL LETTER X\r
+0079 LATIN SMALL LETTER Y\r
+007A LATIN SMALL LETTER Z\r
+ x (latin small letter z with stroke - 01B6)\r
+007B LEFT CURLY BRACKET\r
+ = OPENING CURLY BRACKET\r
+ = opening brace\r
+007C VERTICAL LINE\r
+ = VERTICAL BAR\r
+ * used in pairs to indicate absolute value\r
+ x (latin letter dental click - 01C0)\r
+ x (hebrew punctuation paseq - 05C0)\r
+ x (divides - 2223)\r
+ x (light vertical bar - 2758)\r
+007D RIGHT CURLY BRACKET\r
+ = CLOSING CURLY BRACKET\r
+ = closing brace\r
+007E TILDE\r
+ * this is a spacing character\r
+ x (small tilde - 02DC)\r
+ x (combining tilde - 0303)\r
+ x (tilde operator - 223C)\r
+ x (fullwidth tilde - FF5E)\r
+007F <control>\r
+ = DELETE\r
+@@ 0080 C1 Controls and Latin-1 Supplement (Latin-1 Supplement) 00FF\r
+@ C1 controls\r
+@+ Alias names are those for ISO 6429.\r
+0080 <control>\r
+0081 <control>\r
+0082 <control>\r
+ = BREAK PERMITTED HERE\r
+0083 <control>\r
+ = NO BREAK HERE\r
+0084 <control>\r
+0085 <control>\r
+ = NEXT LINE\r
+0086 <control>\r
+ = START OF SELECTED AREA\r
+0087 <control>\r
+ = END OF SELECTED AREA\r
+0088 <control>\r
+ = CHARACTER TABULATION SET\r
+0089 <control>\r
+ = CHARACTER TABULATION WITH JUSTIFICATION\r
+008A <control>\r
+ = LINE TABULATION SET\r
+008B <control>\r
+ = PARTIAL LINE DOWN\r
+008C <control>\r
+ = PARTIAL LINE UP\r
+008D <control>\r
+ = REVERSE LINE FEED\r
+008E <control>\r
+ = SINGLE SHIFT TWO\r
+008F <control>\r
+ = SINGLE SHIFT THREE\r
+0090 <control>\r
+ = DEVICE CONTROL STRING\r
+0091 <control>\r
+ = PRIVATE USE ONE\r
+0092 <control>\r
+ = PRIVATE USE TWO\r
+0093 <control>\r
+ = SET TRANSMIT STATE\r
+0094 <control>\r
+ = CANCEL CHARACTER\r
+0095 <control>\r
+ = MESSAGE WAITING\r
+0096 <control>\r
+ = START OF GUARDED AREA\r
+0097 <control>\r
+ = END OF GUARDED AREA\r
+0098 <control>\r
+ = START OF STRING\r
+0099 <control>\r
+009A <control>\r
+ = SINGLE CHARACTER INTRODUCER\r
+009B <control>\r
+ = CONTROL SEQUENCE INTRODUCER\r
+009C <control>\r
+ = STRING TERMINATOR\r
+009D <control>\r
+ = OPERATING SYSTEM COMMAND\r
+009E <control>\r
+ = PRIVACY MESSAGE\r
+009F <control>\r
+ = APPLICATION PROGRAM COMMAND\r
+@ ISO 8859-1 (aka Latin-1)\r
+00A0 NO-BREAK SPACE\r
+ x (space - 0020)\r
+ x (figure space - 2007)\r
+ x (narrow no-break space - 202F)\r
+ x (zero width no-break space - FEFF)\r
+ # <noBreak> 0020\r
+00A1 INVERTED EXCLAMATION MARK\r
+ * Spanish, Asturian, Galician\r
+ x (exclamation mark - 0021)\r
+00A2 CENT SIGN\r
+00A3 POUND SIGN\r
+ = pound sterling, Irish punt\r
+ x (lira sign - 20A4)\r
+00A4 CURRENCY SIGN\r
+ = Filzlaus, Ricardi-Sonne (German names)\r
+ * other currency symbol characters: 20A0-20AF\r
+ x (dollar sign - 0024)\r
+00A5 YEN SIGN\r
+ = yuan sign\r
+ * glyph may have one or two crossbars\r
+00A6 BROKEN BAR\r
+ = BROKEN VERTICAL BAR\r
+ = parted rule (in typography)\r
+00A7 SECTION SIGN\r
+ * paragraph sign in some European usage\r
+00A8 DIAERESIS\r
+ * this is a spacing character\r
+ x (combining diaeresis - 0308)\r
+ # 0020 0308\r
+00A9 COPYRIGHT SIGN\r
+ x (sound recording copyright - 2117)\r
+00AA FEMININE ORDINAL INDICATOR\r
+ * Spanish\r
+ # <super> 0061\r
+00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK *\r
+ = LEFT POINTING GUILLEMET\r
+ = chevrons (in typography)\r
+ * usually opening, sometimes closing\r
+ x (much less-than - 226A)\r
+ x (left double angle bracket - 300A)\r
+00AC NOT SIGN\r
+ = angled dash (in typography)\r
+ x (reversed not sign - 2310)\r
+00AD SOFT HYPHEN\r
+ = discretionary hyphen\r
+ x (mongolian todo soft hyphen - 1806)\r
+00AE REGISTERED SIGN\r
+ = REGISTERED TRADE MARK SIGN\r
+00AF MACRON\r
+ = overline, APL overbar\r
+ * this is a spacing character\r
+ x (modifier letter macron - 02C9)\r
+ x (combining macron - 0304)\r
+ x (combining overline - 0305)\r
+ # 0020 0304\r
+00B0 DEGREE SIGN\r
+ * this is a spacing character\r
+ x (ring above - 02DA)\r
+ x (combining ring above - 030A)\r
+ x (superscript zero - 2070)\r
+ x (ring operator - 2218)\r
+00B1 PLUS-MINUS SIGN\r
+ x (minus-or-plus sign - 2213)\r
+00B2 SUPERSCRIPT TWO\r
+ = squared\r
+ * other superscript digit characters: 2070-2079\r
+ x (superscript one - 00B9)\r
+ # <super> 0032\r
+00B3 SUPERSCRIPT THREE\r
+ = cubed\r
+ x (superscript one - 00B9)\r
+ # <super> 0033\r
+00B4 ACUTE ACCENT\r
+ * this is a spacing character\r
+ x (modifier letter prime - 02B9)\r
+ x (modifier letter acute accent - 02CA)\r
+ x (combining acute accent - 0301)\r
+ x (prime - 2032)\r
+ # 0020 0301\r
+00B5 MICRO SIGN\r
+ # 03BC greek small letter mu\r
+00B6 PILCROW SIGN\r
+ = PARAGRAPH SIGN\r
+ * section sign in some European usage\r
+ x (reversed pilcrow sign - 204B)\r
+ x (curved stem paragraph sign ornament - 2761)\r
+00B7 MIDDLE DOT\r
+ = midpoint (in typography)\r
+ = Georgian comma\r
+ = Greek middle dot\r
+ x (bullet - 2022)\r
+ x (one dot leader - 2024)\r
+ x (hyphenation point - 2027)\r
+ x (bullet operator - 2219)\r
+ x (dot operator - 22C5)\r
+ x (katakana middle dot - 30FB)\r
+00B8 CEDILLA\r
+ * this is a spacing character\r
+ * other spacing accent characters: 02D8-02DB\r
+ x (combining cedilla - 0327)\r
+ # 0020 0327\r
+00B9 SUPERSCRIPT ONE\r
+ x (superscript two - 00B2)\r
+ x (superscript three - 00B3)\r
+ # <super> 0031\r
+00BA MASCULINE ORDINAL INDICATOR\r
+ * Spanish\r
+ # <super> 006F\r
+00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK *\r
+ = RIGHT POINTING GUILLEMET\r
+ * usually closing, sometimes opening\r
+ x (much greater-than - 226B)\r
+ x (right double angle bracket - 300B)\r
+00BC VULGAR FRACTION ONE QUARTER\r
+ * bar may be horizontal or slanted\r
+ * other fraction characters: 2153-215E\r
+ # 0031 2044 0034\r
+00BD VULGAR FRACTION ONE HALF\r
+ * bar may be horizontal or slanted\r
+ # 0031 2044 0032\r
+00BE VULGAR FRACTION THREE QUARTERS\r
+ * bar may be horizontal or slanted\r
+ # 0033 2044 0034\r
+00BF INVERTED QUESTION MARK\r
+ = turned question mark\r
+ * Spanish\r
+ x (question mark - 003F)\r
+00C0 LATIN CAPITAL LETTER A WITH GRAVE\r
+ : 0041 0300\r
+00C1 LATIN CAPITAL LETTER A WITH ACUTE\r
+ : 0041 0301\r
+00C2 LATIN CAPITAL LETTER A WITH CIRCUMFLEX\r
+ : 0041 0302\r
+00C3 LATIN CAPITAL LETTER A WITH TILDE\r
+ : 0041 0303\r
+00C4 LATIN CAPITAL LETTER A WITH DIAERESIS\r
+ : 0041 0308\r
+00C5 LATIN CAPITAL LETTER A WITH RING ABOVE\r
+ x (angstrom sign - 212B)\r
+ : 0041 030A\r
+00C6 LATIN CAPITAL LETTER AE (ash) *\r
+ = LATIN CAPITAL LIGATURE AE\r
+00C7 LATIN CAPITAL LETTER C WITH CEDILLA\r
+ : 0043 0327\r
+00C8 LATIN CAPITAL LETTER E WITH GRAVE\r
+ : 0045 0300\r
+00C9 LATIN CAPITAL LETTER E WITH ACUTE\r
+ : 0045 0301\r
+00CA LATIN CAPITAL LETTER E WITH CIRCUMFLEX\r
+ : 0045 0302\r
+00CB LATIN CAPITAL LETTER E WITH DIAERESIS\r
+ : 0045 0308\r
+00CC LATIN CAPITAL LETTER I WITH GRAVE\r
+ : 0049 0300\r
+00CD LATIN CAPITAL LETTER I WITH ACUTE\r
+ : 0049 0301\r
+00CE LATIN CAPITAL LETTER I WITH CIRCUMFLEX\r
+ : 0049 0302\r
+00CF LATIN CAPITAL LETTER I WITH DIAERESIS\r
+ : 0049 0308\r
+00D0 LATIN CAPITAL LETTER ETH (Icelandic)\r
+ x (latin small letter eth - 00F0)\r
+ x (latin capital letter d with stroke - 0110)\r
+ x (latin capital letter african d - 0189)\r
+00D1 LATIN CAPITAL LETTER N WITH TILDE\r
+ : 004E 0303\r
+00D2 LATIN CAPITAL LETTER O WITH GRAVE\r
+ : 004F 0300\r
+00D3 LATIN CAPITAL LETTER O WITH ACUTE\r
+ : 004F 0301\r
+00D4 LATIN CAPITAL LETTER O WITH CIRCUMFLEX\r
+ : 004F 0302\r
+00D5 LATIN CAPITAL LETTER O WITH TILDE\r
+ : 004F 0303\r
+00D6 LATIN CAPITAL LETTER O WITH DIAERESIS\r
+ : 004F 0308\r
+00D7 MULTIPLICATION SIGN\r
+ = z notation Cartesian product\r
+00D8 LATIN CAPITAL LETTER O WITH STROKE\r
+ = LATIN CAPITAL LETTER O SLASH\r
+ x (empty set - 2205)\r
+00D9 LATIN CAPITAL LETTER U WITH GRAVE\r
+ : 0055 0300\r
+00DA LATIN CAPITAL LETTER U WITH ACUTE\r
+ : 0055 0301\r
+00DB LATIN CAPITAL LETTER U WITH CIRCUMFLEX\r
+ : 0055 0302\r
+00DC LATIN CAPITAL LETTER U WITH DIAERESIS\r
+ : 0055 0308\r
+00DD LATIN CAPITAL LETTER Y WITH ACUTE\r
+ : 0059 0301\r
+00DE LATIN CAPITAL LETTER THORN (Icelandic)\r
+00DF LATIN SMALL LETTER SHARP S (German)\r
+ = Eszett\r
+ * German\r
+ * uppercase is "SS"\r
+ * in origin a ligature of 017F and 0073\r
+ x (greek small letter beta - 03B2)\r
+00E0 LATIN SMALL LETTER A WITH GRAVE\r
+ : 0061 0300\r
+00E1 LATIN SMALL LETTER A WITH ACUTE\r
+ : 0061 0301\r
+00E2 LATIN SMALL LETTER A WITH CIRCUMFLEX\r
+ : 0061 0302\r
+00E3 LATIN SMALL LETTER A WITH TILDE\r
+ * Portuguese\r
+ : 0061 0303\r
+00E4 LATIN SMALL LETTER A WITH DIAERESIS\r
+ : 0061 0308\r
+00E5 LATIN SMALL LETTER A WITH RING ABOVE\r
+ * Danish, Norwegian, Swedish, Walloon\r
+ : 0061 030A\r
+00E6 LATIN SMALL LETTER AE (ash) *\r
+ = LATIN SMALL LIGATURE AE\r
+ = ash (from Old English æsc)\r
+ * Danish, Norwegian, Icelandic, Faroese, Old English, French, IPA\r
+ x (latin small ligature oe - 0153)\r
+ x (cyrillic small ligature a ie - 04D5)\r
+00E7 LATIN SMALL LETTER C WITH CEDILLA\r
+ : 0063 0327\r
+00E8 LATIN SMALL LETTER E WITH GRAVE\r
+ : 0065 0300\r
+00E9 LATIN SMALL LETTER E WITH ACUTE\r
+ : 0065 0301\r
+00EA LATIN SMALL LETTER E WITH CIRCUMFLEX\r
+ : 0065 0302\r
+00EB LATIN SMALL LETTER E WITH DIAERESIS\r
+ : 0065 0308\r
+00EC LATIN SMALL LETTER I WITH GRAVE\r
+ * Italian, Malagasy\r
+ : 0069 0300\r
+00ED LATIN SMALL LETTER I WITH ACUTE\r
+ : 0069 0301\r
+00EE LATIN SMALL LETTER I WITH CIRCUMFLEX\r
+ : 0069 0302\r
+00EF LATIN SMALL LETTER I WITH DIAERESIS\r
+ : 0069 0308\r
+00F0 LATIN SMALL LETTER ETH (Icelandic)\r
+ * Icelandic, Faroese, Old English, IPA\r
+ x (latin capital letter eth - 00D0)\r
+ x (greek small letter delta - 03B4)\r
+ x (partial differential - 2202)\r
+00F1 LATIN SMALL LETTER N WITH TILDE\r
+ : 006E 0303\r
+00F2 LATIN SMALL LETTER O WITH GRAVE\r
+ : 006F 0300\r
+00F3 LATIN SMALL LETTER O WITH ACUTE\r
+ : 006F 0301\r
+00F4 LATIN SMALL LETTER O WITH CIRCUMFLEX\r
+ : 006F 0302\r
+00F5 LATIN SMALL LETTER O WITH TILDE\r
+ * Portuguese, Estonian\r
+ : 006F 0303\r
+00F6 LATIN SMALL LETTER O WITH DIAERESIS\r
+ : 006F 0308\r
+00F7 DIVISION SIGN\r
+00F8 LATIN SMALL LETTER O WITH STROKE\r
+ = LATIN SMALL LETTER O SLASH\r
+ * Danish, Norwegian, Faroese, IPA\r
+00F9 LATIN SMALL LETTER U WITH GRAVE\r
+ * French, Italian\r
+ : 0075 0300\r
+00FA LATIN SMALL LETTER U WITH ACUTE\r
+ : 0075 0301\r
+00FB LATIN SMALL LETTER U WITH CIRCUMFLEX\r
+ : 0075 0302\r
+00FC LATIN SMALL LETTER U WITH DIAERESIS\r
+ : 0075 0308\r
+00FD LATIN SMALL LETTER Y WITH ACUTE\r
+ * Czech, Slovak, Icelandic, Faroese, Welsh, Malagasy\r
+ : 0079 0301\r
+00FE LATIN SMALL LETTER THORN (Icelandic)\r
+ * Icelandic, Old English, phonetics\r
+ * Runic letter borrowed into Latin script\r
+ x (runic letter thurisaz thurs thorn - 16A6)\r
+00FF LATIN SMALL LETTER Y WITH DIAERESIS\r
+ * French\r
+ x (latin capital letter y with diaeresis - 0178)\r
+ : 0079 0308\r
+@@ 0100 Latin Extended-A 017F\r
+@ European Latin\r
+0100 LATIN CAPITAL LETTER A WITH MACRON\r
+ : 0041 0304\r
+0101 LATIN SMALL LETTER A WITH MACRON\r
+ * Latvian, Latin, ...\r
+ : 0061 0304\r
+0102 LATIN CAPITAL LETTER A WITH BREVE\r
+ : 0041 0306\r
+0103 LATIN SMALL LETTER A WITH BREVE\r
+ * Romanian, Vietnamese, Latin, ...\r
+ : 0061 0306\r
+0104 LATIN CAPITAL LETTER A WITH OGONEK\r
+ : 0041 0328\r
+0105 LATIN SMALL LETTER A WITH OGONEK\r
+ * Polish, Lithuanian, ...\r
+ : 0061 0328\r
+0106 LATIN CAPITAL LETTER C WITH ACUTE\r
+ : 0043 0301\r
+0107 LATIN SMALL LETTER C WITH ACUTE\r
+ * Polish, Croatian, ...\r
+ x (cyrillic small letter tshe - 045B)\r
+ : 0063 0301\r
+0108 LATIN CAPITAL LETTER C WITH CIRCUMFLEX\r
+ : 0043 0302\r
+0109 LATIN SMALL LETTER C WITH CIRCUMFLEX\r
+ * Esperanto\r
+ : 0063 0302\r
+010A LATIN CAPITAL LETTER C WITH DOT ABOVE\r
+ : 0043 0307\r
+010B LATIN SMALL LETTER C WITH DOT ABOVE\r
+ * Maltese, Irish Gaelic (old orthography)\r
+ : 0063 0307\r
+010C LATIN CAPITAL LETTER C WITH CARON\r
+ : 0043 030C\r
+010D LATIN SMALL LETTER C WITH CARON\r
+ * Czech, Slovak, Slovenian, and many other languages\r
+ : 0063 030C\r
+010E LATIN CAPITAL LETTER D WITH CARON\r
+ * the form using caron/hacek is preferred in all contexts\r
+ : 0044 030C\r
+010F LATIN SMALL LETTER D WITH CARON\r
+ * Czech, Slovak\r
+ * the form using apostrophe is preferred in typesetting\r
+ : 0064 030C\r
+0110 LATIN CAPITAL LETTER D WITH STROKE\r
+ x (latin capital letter eth - 00D0)\r
+ x (latin small letter d with stroke - 0111)\r
+ x (latin capital letter african d - 0189)\r
+0111 LATIN SMALL LETTER D WITH STROKE\r
+ * Croatian, Vietnamese, Sámi\r
+ x (latin capital letter d with stroke - 0110)\r
+ x (cyrillic small letter dje - 0452)\r
+0112 LATIN CAPITAL LETTER E WITH MACRON\r
+ : 0045 0304\r
+0113 LATIN SMALL LETTER E WITH MACRON\r
+ * Latvian, Latin, ...\r
+ : 0065 0304\r
+0114 LATIN CAPITAL LETTER E WITH BREVE\r
+ : 0045 0306\r
+0115 LATIN SMALL LETTER E WITH BREVE\r
+ * Malay, Latin, ...\r
+ : 0065 0306\r
+0116 LATIN CAPITAL LETTER E WITH DOT ABOVE\r
+ : 0045 0307\r
+0117 LATIN SMALL LETTER E WITH DOT ABOVE\r
+ * Lithuanian\r
+ : 0065 0307\r
+0118 LATIN CAPITAL LETTER E WITH OGONEK\r
+ : 0045 0328\r
+0119 LATIN SMALL LETTER E WITH OGONEK\r
+ * Polish, Lithuanian, ...\r
+ : 0065 0328\r
+011A LATIN CAPITAL LETTER E WITH CARON\r
+ : 0045 030C\r
+011B LATIN SMALL LETTER E WITH CARON\r
+ * Czech, ...\r
+ : 0065 030C\r
+011C LATIN CAPITAL LETTER G WITH CIRCUMFLEX\r
+ : 0047 0302\r
+011D LATIN SMALL LETTER G WITH CIRCUMFLEX\r
+ * Esperanto\r
+ : 0067 0302\r
+011E LATIN CAPITAL LETTER G WITH BREVE\r
+ : 0047 0306\r
+011F LATIN SMALL LETTER G WITH BREVE\r
+ * Turkish, Azerbaijani\r
+ x (latin small letter g with caron - 01E7)\r
+ : 0067 0306\r
+0120 LATIN CAPITAL LETTER G WITH DOT ABOVE\r
+ : 0047 0307\r
+0121 LATIN SMALL LETTER G WITH DOT ABOVE\r
+ * Maltese, Irish Gaelic (old orthography)\r
+ : 0067 0307\r
+0122 LATIN CAPITAL LETTER G WITH CEDILLA\r
+ : 0047 0327\r
+0123 LATIN SMALL LETTER G WITH CEDILLA\r
+ * Latvian\r
+ * there are three major glyph variants\r
+ : 0067 0327\r
+0124 LATIN CAPITAL LETTER H WITH CIRCUMFLEX\r
+ : 0048 0302\r
+0125 LATIN SMALL LETTER H WITH CIRCUMFLEX\r
+ * Esperanto\r
+ : 0068 0302\r
+0126 LATIN CAPITAL LETTER H WITH STROKE\r
+0127 LATIN SMALL LETTER H WITH STROKE\r
+ * Maltese, IPA, ...\r
+ x (cyrillic small letter tshe - 045B)\r
+ x (planck constant over two pi - 210F)\r
+0128 LATIN CAPITAL LETTER I WITH TILDE\r
+ : 0049 0303\r
+0129 LATIN SMALL LETTER I WITH TILDE\r
+ * Greenlandic (old orthography)\r
+ : 0069 0303\r
+012A LATIN CAPITAL LETTER I WITH MACRON\r
+ : 0049 0304\r
+012B LATIN SMALL LETTER I WITH MACRON\r
+ * Latvian, Latin, ...\r
+ : 0069 0304\r
+012C LATIN CAPITAL LETTER I WITH BREVE\r
+ : 0049 0306\r
+012D LATIN SMALL LETTER I WITH BREVE\r
+ * Latin, ...\r
+ : 0069 0306\r
+012E LATIN CAPITAL LETTER I WITH OGONEK\r
+ : 0049 0328\r
+012F LATIN SMALL LETTER I WITH OGONEK\r
+ * Lithuanian, ...\r
+ : 0069 0328\r
+0130 LATIN CAPITAL LETTER I WITH DOT ABOVE\r
+ = LATIN CAPITAL LETTER I DOT\r
+ * Turkish, Azerbaijani\r
+ * lowercase is 0069\r
+ x (latin capital letter i - 0049)\r
+ : 0049 0307\r
+0131 LATIN SMALL LETTER DOTLESS I\r
+ * Turkish, Azerbaijani\r
+ * uppercase is 0049\r
+ x (latin small letter i - 0069)\r
+0132 LATIN CAPITAL LIGATURE IJ\r
+ # 0049 004A\r
+0133 LATIN SMALL LIGATURE IJ\r
+ * Dutch\r
+ # 0069 006A\r
+0134 LATIN CAPITAL LETTER J WITH CIRCUMFLEX\r
+ : 004A 0302\r
+0135 LATIN SMALL LETTER J WITH CIRCUMFLEX\r
+ * Esperanto\r
+ : 006A 0302\r
+0136 LATIN CAPITAL LETTER K WITH CEDILLA\r
+ : 004B 0327\r
+0137 LATIN SMALL LETTER K WITH CEDILLA\r
+ * Latvian\r
+ : 006B 0327\r
+0138 LATIN SMALL LETTER KRA (Greenlandic)\r
+ * Greenlandic (old orthography)\r
+0139 LATIN CAPITAL LETTER L WITH ACUTE\r
+ : 004C 0301\r
+013A LATIN SMALL LETTER L WITH ACUTE\r
+ * Slovak\r
+ : 006C 0301\r
+013B LATIN CAPITAL LETTER L WITH CEDILLA\r
+ : 004C 0327\r
+013C LATIN SMALL LETTER L WITH CEDILLA\r
+ * Latvian\r
+ : 006C 0327\r
+013D LATIN CAPITAL LETTER L WITH CARON\r
+ : 004C 030C\r
+013E LATIN SMALL LETTER L WITH CARON\r
+ * Slovak\r
+ * the form using apostrophe is preferred in typesetting\r
+ : 006C 030C\r
+013F LATIN CAPITAL LETTER L WITH MIDDLE DOT\r
+ * some fonts show the middle dot inside the L, but the preferred form has the dot following the L\r
+ # 004C 00B7\r
+0140 LATIN SMALL LETTER L WITH MIDDLE DOT\r
+ * Catalan\r
+ # 006C 00B7\r
+0141 LATIN CAPITAL LETTER L WITH STROKE\r
+0142 LATIN SMALL LETTER L WITH STROKE\r
+ * Polish, ...\r
+ x (latin small letter l with bar - 019A)\r
+0143 LATIN CAPITAL LETTER N WITH ACUTE\r
+ : 004E 0301\r
+0144 LATIN SMALL LETTER N WITH ACUTE\r
+ * Polish, ...\r
+ : 006E 0301\r
+0145 LATIN CAPITAL LETTER N WITH CEDILLA\r
+ : 004E 0327\r
+0146 LATIN SMALL LETTER N WITH CEDILLA\r
+ * Latvian\r
+ : 006E 0327\r
+0147 LATIN CAPITAL LETTER N WITH CARON\r
+ : 004E 030C\r
+0148 LATIN SMALL LETTER N WITH CARON\r
+ * Czech, Slovak\r
+ : 006E 030C\r
+0149 LATIN SMALL LETTER N PRECEDED BY APOSTROPHE\r
+ = LATIN SMALL LETTER APOSTROPHE N\r
+ * Afrikaans\r
+ * this is not actually a single letter\r
+ # 02BC 006E\r
+014A LATIN CAPITAL LETTER ENG (Sami)\r
+ * glyph may also have appearance of large form of the small letter\r
+014B LATIN SMALL LETTER ENG (Sami)\r
+ * Sámi, Mende, IPA, ...\r
+014C LATIN CAPITAL LETTER O WITH MACRON\r
+ : 004F 0304\r
+014D LATIN SMALL LETTER O WITH MACRON\r
+ * Latvian, Latin, ...\r
+ : 006F 0304\r
+014E LATIN CAPITAL LETTER O WITH BREVE\r
+ : 004F 0306\r
+014F LATIN SMALL LETTER O WITH BREVE\r
+ * Latin\r
+ : 006F 0306\r
+0150 LATIN CAPITAL LETTER O WITH DOUBLE ACUTE\r
+ : 004F 030B\r
+0151 LATIN SMALL LETTER O WITH DOUBLE ACUTE\r
+ * Hungarian\r
+ : 006F 030B\r
+0152 LATIN CAPITAL LIGATURE OE\r
+0153 LATIN SMALL LIGATURE OE\r
+ = LATIN SMALL LETTER O E\r
+ = ethel (from Old English eðel)\r
+ * French, IPA, Old Icelandic, Old English, ...\r
+ x (latin small letter ae - 00E6)\r
+ x (latin letter small capital oe - 0276)\r
+0154 LATIN CAPITAL LETTER R WITH ACUTE\r
+ : 0052 0301\r
+0155 LATIN SMALL LETTER R WITH ACUTE\r
+ * Slovak, ...\r
+ : 0072 0301\r
+0156 LATIN CAPITAL LETTER R WITH CEDILLA\r
+ : 0052 0327\r
+0157 LATIN SMALL LETTER R WITH CEDILLA\r
+ * Latvian\r
+ : 0072 0327\r
+0158 LATIN CAPITAL LETTER R WITH CARON\r
+ : 0052 030C\r
+0159 LATIN SMALL LETTER R WITH CARON\r
+ * Czech, ...\r
+ : 0072 030C\r
+015A LATIN CAPITAL LETTER S WITH ACUTE\r
+ : 0053 0301\r
+015B LATIN SMALL LETTER S WITH ACUTE\r
+ * Polish, Indic transliteration, ...\r
+ : 0073 0301\r
+015C LATIN CAPITAL LETTER S WITH CIRCUMFLEX\r
+ : 0053 0302\r
+015D LATIN SMALL LETTER S WITH CIRCUMFLEX\r
+ * Esperanto\r
+ : 0073 0302\r
+015E LATIN CAPITAL LETTER S WITH CEDILLA *\r
+ : 0053 0327\r
+015F LATIN SMALL LETTER S WITH CEDILLA *\r
+ * Turkish, Azerbaijani, Romanian, ...\r
+ * this character is used in both Turkish and Romanian data\r
+ * a glyph variant with comma below is preferred for Romanian\r
+ x (latin small letter s with comma below - 0219)\r
+ : 0073 0327\r
+0160 LATIN CAPITAL LETTER S WITH CARON\r
+ : 0053 030C\r
+0161 LATIN SMALL LETTER S WITH CARON\r
+ * Czech, Estonian, Finnish, Slovak, and many other languages\r
+ : 0073 030C\r
+0162 LATIN CAPITAL LETTER T WITH CEDILLA *\r
+ : 0054 0327\r
+0163 LATIN SMALL LETTER T WITH CEDILLA *\r
+ * Romanian, Semitic transliteration, ...\r
+ * this character is used in Romanian data\r
+ * a glyph variant with comma below is preferred for Romanian\r
+ x (latin small letter t with comma below - 021B)\r
+ : 0074 0327\r
+0164 LATIN CAPITAL LETTER T WITH CARON\r
+ * the form using caron/hacek is preferred in all contexts\r
+ : 0054 030C\r
+0165 LATIN SMALL LETTER T WITH CARON\r
+ * Czech, Slovak\r
+ * the form using apostrophe is preferred in typesetting\r
+ : 0074 030C\r
+0166 LATIN CAPITAL LETTER T WITH STROKE\r
+0167 LATIN SMALL LETTER T WITH STROKE\r
+ * Sámi\r
+0168 LATIN CAPITAL LETTER U WITH TILDE\r
+ : 0055 0303\r
+0169 LATIN SMALL LETTER U WITH TILDE\r
+ * Greenlandic (old orthography)\r
+ : 0075 0303\r
+016A LATIN CAPITAL LETTER U WITH MACRON\r
+ : 0055 0304\r
+016B LATIN SMALL LETTER U WITH MACRON\r
+ * Latvian, Lithuanian, Latin, ...\r
+ : 0075 0304\r
+016C LATIN CAPITAL LETTER U WITH BREVE\r
+ : 0055 0306\r
+016D LATIN SMALL LETTER U WITH BREVE\r
+ * Latin, Esperanto, ...\r
+ : 0075 0306\r
+016E LATIN CAPITAL LETTER U WITH RING ABOVE\r
+ : 0055 030A\r
+016F LATIN SMALL LETTER U WITH RING ABOVE\r
+ * Czech, ...\r
+ : 0075 030A\r
+0170 LATIN CAPITAL LETTER U WITH DOUBLE ACUTE\r
+ : 0055 030B\r
+0171 LATIN SMALL LETTER U WITH DOUBLE ACUTE\r
+ * Hungarian\r
+ : 0075 030B\r
+0172 LATIN CAPITAL LETTER U WITH OGONEK\r
+ : 0055 0328\r
+0173 LATIN SMALL LETTER U WITH OGONEK\r
+ * Lithuanian\r
+ : 0075 0328\r
+0174 LATIN CAPITAL LETTER W WITH CIRCUMFLEX\r
+ : 0057 0302\r
+0175 LATIN SMALL LETTER W WITH CIRCUMFLEX\r
+ * Welsh\r
+ : 0077 0302\r
+0176 LATIN CAPITAL LETTER Y WITH CIRCUMFLEX\r
+ : 0059 0302\r
+0177 LATIN SMALL LETTER Y WITH CIRCUMFLEX\r
+ * Welsh\r
+ : 0079 0302\r
+0178 LATIN CAPITAL LETTER Y WITH DIAERESIS\r
+ * French, Igbo\r
+ x (latin small letter y with diaeresis - 00FF)\r
+ : 0059 0308\r
+0179 LATIN CAPITAL LETTER Z WITH ACUTE\r
+ : 005A 0301\r
+017A LATIN SMALL LETTER Z WITH ACUTE\r
+ * Polish, ...\r
+ : 007A 0301\r
+017B LATIN CAPITAL LETTER Z WITH DOT ABOVE\r
+ : 005A 0307\r
+017C LATIN SMALL LETTER Z WITH DOT ABOVE\r
+ * Polish, ...\r
+ : 007A 0307\r
+017D LATIN CAPITAL LETTER Z WITH CARON\r
+ : 005A 030C\r
+017E LATIN SMALL LETTER Z WITH CARON\r
+ * Czech, Estonian, Finnish, Slovak, Slovenian, and many other languages\r
+ : 007A 030C\r
+017F LATIN SMALL LETTER LONG S\r
+ * in common use in Roman types until the 18th century\r
+ * in current use in Fraktur and Gaelic types\r
+ # 0073 latin small letter s\r
+@@ 0180 Latin Extended-B 024F\r
+@ Latin extended-B\r
+0180 LATIN SMALL LETTER B WITH STROKE\r
+ * Americanist and Indo-Europeanist usage for phonetic beta\r
+ * Old Saxon\r
+ x (greek small letter beta - 03B2)\r
+ x (blank symbol - 2422)\r
+0181 LATIN CAPITAL LETTER B WITH HOOK\r
+ * Zulu, Pan-Nigerian alphabet\r
+ x (latin small letter b with hook - 0253)\r
+0182 LATIN CAPITAL LETTER B WITH TOPBAR\r
+0183 LATIN SMALL LETTER B WITH TOPBAR\r
+ * Zhuang\r
+ * former Soviet minority language scripts\r
+ x (cyrillic capital letter be - 0411)\r
+0184 LATIN CAPITAL LETTER TONE SIX\r
+0185 LATIN SMALL LETTER TONE SIX\r
+ * Zhuang\r
+ * Zhuang tone three is Cyrillic ze\r
+ * Zhuang tone four is Cyrillic che\r
+ x (latin small letter tone two - 01A8)\r
+ x (latin small letter tone five - 01BD)\r
+ x (cyrillic small letter ze - 0437)\r
+ x (cyrillic small letter che - 0447)\r
+ x (cyrillic small letter soft sign - 044C)\r
+0186 LATIN CAPITAL LETTER OPEN O\r
+ * typographically a turned C\r
+ x (latin small letter open o - 0254)\r
+0187 LATIN CAPITAL LETTER C WITH HOOK\r
+0188 LATIN SMALL LETTER C WITH HOOK\r
+ * African\r
+0189 LATIN CAPITAL LETTER AFRICAN D *\r
+ * Ewe\r
+ x (latin capital letter eth - 00D0)\r
+ x (latin capital letter d with stroke - 0110)\r
+ x (latin small letter d with tail - 0256)\r
+018A LATIN CAPITAL LETTER D WITH HOOK\r
+ * Pan-Nigerian alphabet\r
+ x (latin small letter d with hook - 0257)\r
+018B LATIN CAPITAL LETTER D WITH TOPBAR\r
+018C LATIN SMALL LETTER D WITH TOPBAR\r
+ * former-Soviet minority language scripts\r
+018D LATIN SMALL LETTER TURNED DELTA\r
+ * archaic phonetic for labialized dental fricative\r
+ * recommended spellings 007A 02B7 or 007A 032B\r
+018E LATIN CAPITAL LETTER REVERSED E\r
+ = LATIN CAPITAL LETTER TURNED E\r
+ * Pan-Nigerian alphabet\r
+ * lowercase is 01DD\r
+018F LATIN CAPITAL LETTER SCHWA\r
+ * Azerbaijani, ...\r
+ x (latin small letter schwa - 0259)\r
+ x (cyrillic capital letter schwa - 04D8)\r
+0190 LATIN CAPITAL LETTER OPEN E\r
+ = LATIN CAPITAL LETTER EPSILON\r
+ * African\r
+ x (latin small letter open e - 025B)\r
+ x (euler constant - 2107)\r
+0191 LATIN CAPITAL LETTER F WITH HOOK\r
+ * African\r
+0192 LATIN SMALL LETTER F WITH HOOK\r
+ = LATIN SMALL LETTER SCRIPT F\r
+ = Florin currency symbol (Netherlands)\r
+ = function symbol\r
+ = abbreviation convention for folder\r
+0193 LATIN CAPITAL LETTER G WITH HOOK\r
+ * African\r
+ x (latin small letter g with hook - 0260)\r
+0194 LATIN CAPITAL LETTER GAMMA\r
+ * African\r
+ x (latin small letter gamma - 0263)\r
+0195 LATIN SMALL LETTER HV (hwair)\r
+ * Gothic transliteration\r
+ * uppercase is 01F6\r
+0196 LATIN CAPITAL LETTER IOTA\r
+ * African\r
+ x (latin small letter iota - 0269)\r
+0197 LATIN CAPITAL LETTER I WITH STROKE\r
+ = barred i, i bar\r
+ * African\r
+ * ISO 6438 gives lowercase as 026A, not 0268\r
+ x (latin letter small capital i - 026A)\r
+0198 LATIN CAPITAL LETTER K WITH HOOK\r
+0199 LATIN SMALL LETTER K WITH HOOK\r
+ * Hausa, Pan-Nigerian alphabet\r
+019A LATIN SMALL LETTER L WITH BAR\r
+ = barred l\r
+ * Americanist phonetic usage for 026C\r
+ x (latin small letter l with stroke - 0142)\r
+019B LATIN SMALL LETTER LAMBDA WITH STROKE\r
+ = barred lambda, lambda bar\r
+ * Americanist phonetic usage\r
+019C LATIN CAPITAL LETTER TURNED M\r
+ * Zhuang\r
+ x (latin small letter turned m - 026F)\r
+019D LATIN CAPITAL LETTER N WITH LEFT HOOK\r
+ * African\r
+ x (latin small letter n with left hook - 0272)\r
+019E LATIN SMALL LETTER N WITH LONG RIGHT LEG\r
+ * archaic phonetic for Japanese syllabic "n"\r
+ * recommended spelling 006E 0329\r
+019F LATIN CAPITAL LETTER O WITH MIDDLE TILDE *\r
+ = barred o, o bar\r
+ * lowercase is 0275\r
+ * African\r
+ x (cyrillic capital letter barred o - 04E8)\r
+01A0 LATIN CAPITAL LETTER O WITH HORN\r
+ : 004F 031B\r
+01A1 LATIN SMALL LETTER O WITH HORN\r
+ * Vietnamese\r
+ : 006F 031B\r
+01A2 LATIN CAPITAL LETTER OI (gha)\r
+01A3 LATIN SMALL LETTER OI (gha)\r
+ = gha\r
+ * Pan-Turkic Latin alphabets\r
+01A4 LATIN CAPITAL LETTER P WITH HOOK\r
+01A5 LATIN SMALL LETTER P WITH HOOK\r
+ * African\r
+01A6 LATIN LETTER YR *\r
+ * old Norse\r
+ * from German Standard DIN 31624 and ISO 5246-2\r
+ * lowercase is 0280\r
+01A7 LATIN CAPITAL LETTER TONE TWO\r
+01A8 LATIN SMALL LETTER TONE TWO\r
+ * Zhuang\r
+ * typographically a reversed S\r
+ x (latin small letter tone six - 0185)\r
+01A9 LATIN CAPITAL LETTER ESH\r
+ * African\r
+ x (latin small letter esh - 0283)\r
+ x (greek capital letter sigma - 03A3)\r
+01AA LATIN LETTER REVERSED ESH LOOP\r
+ * archaic phonetic for labialized palatoalveolar or palatal fricative\r
+ * Twi\r
+ * recommended spellings 0283 02B7, 00E7 02B7, 0068 0265, etc.\r
+01AB LATIN SMALL LETTER T WITH PALATAL HOOK\r
+ * archaic phonetic for palatalized alveolar or dental stop\r
+ * recommended spelling 0074 02B2\r
+01AC LATIN CAPITAL LETTER T WITH HOOK\r
+01AD LATIN SMALL LETTER T WITH HOOK\r
+ * African\r
+01AE LATIN CAPITAL LETTER T WITH RETROFLEX HOOK\r
+ * African\r
+ x (latin small letter t with retroflex hook - 0288)\r
+01AF LATIN CAPITAL LETTER U WITH HORN\r
+ : 0055 031B\r
+01B0 LATIN SMALL LETTER U WITH HORN\r
+ * Vietnamese\r
+ : 0075 031B\r
+01B1 LATIN CAPITAL LETTER UPSILON\r
+ * African\r
+ * typographically based on turned capital Greek omega\r
+ x (latin small letter upsilon - 028A)\r
+ x (inverted ohm sign - 2127)\r
+01B2 LATIN CAPITAL LETTER V WITH HOOK\r
+ = LATIN CAPITAL LETTER SCRIPT V\r
+ * African\r
+ x (latin small letter v with hook - 028B)\r
+01B3 LATIN CAPITAL LETTER Y WITH HOOK\r
+01B4 LATIN SMALL LETTER Y WITH HOOK\r
+ * Bini, Esoko, and other Edo languages in West Africa\r
+01B5 LATIN CAPITAL LETTER Z WITH STROKE\r
+01B6 LATIN SMALL LETTER Z WITH STROKE\r
+ = barred z, z bar\r
+ * Pan-Turkic Latin orthography\r
+ * handwritten variant of Latin "z"\r
+ x (latin small letter z - 007A)\r
+01B7 LATIN CAPITAL LETTER EZH\r
+ * African, Skolt Sámi\r
+ * lowercase is 0292\r
+ x (latin capital letter yogh - 021C)\r
+ x (cyrillic capital letter abkhasian dze - 04E0)\r
+01B8 LATIN CAPITAL LETTER EZH REVERSED\r
+01B9 LATIN SMALL LETTER EZH REVERSED\r
+ * archaic phonetic for voiced pharyngeal fricative\r
+ * sometimes typographically rendered with a turned digit 3\r
+ * recommended spelling 0295\r
+ x (latin letter pharyngeal voiced fricative - 0295)\r
+ x (arabic letter ain - 0639)\r
+01BA LATIN SMALL LETTER EZH WITH TAIL\r
+ * archaic phonetic for labialized voiced palatoalveolar or palatal fricative\r
+ * Twi\r
+ * recommended spellings 0292 02B7 or 006A 02B7\r
+01BB LATIN LETTER TWO WITH STROKE\r
+ * archaic phonetic for [dz] affricate\r
+ * recommended spellings 0292 or 0064 007A\r
+01BC LATIN CAPITAL LETTER TONE FIVE\r
+01BD LATIN SMALL LETTER TONE FIVE\r
+ * Zhuang\r
+ x (latin small letter tone six - 0185)\r
+01BE LATIN LETTER INVERTED GLOTTAL STOP WITH STROKE\r
+ * archaic phonetic for [ts] affricate\r
+ * recommended spelling 0074 0073\r
+ * letter form is actually derived from ligation of ts, rather than inverted glottal stop\r
+01BF LATIN LETTER WYNN\r
+ = wen\r
+ * Runic letter borrowed into Latin script\r
+ * replaced by "w" in modern transcriptions of Old English\r
+ * uppercase is 01F7\r
+ x (runic letter wunjo wynn w - 16B9)\r
+01C0 LATIN LETTER DENTAL CLICK\r
+ = pipe\r
+ * Khoisan tradition\r
+ * "c" in Zulu orthography\r
+ x (solidus - 002F)\r
+ x (vertical line - 007C)\r
+ x (latin small letter turned t - 0287)\r
+ x (divides - 2223)\r
+01C1 LATIN LETTER LATERAL CLICK\r
+ = double pipe\r
+ * Khoisan tradition\r
+ * "x" in Zulu orthography\r
+ x (latin letter inverted glottal stop - 0296)\r
+ x (parallel to - 2225)\r
+01C2 LATIN LETTER ALVEOLAR CLICK\r
+ = double-barred pipe\r
+ * Khoisan tradition\r
+ x (not equal to - 2260)\r
+01C3 LATIN LETTER RETROFLEX CLICK\r
+ = LATIN LETTER EXCLAMATION MARK\r
+ * Khoisan tradition\r
+ * "q" in Zulu orthography\r
+ x (exclamation mark - 0021)\r
+ x (latin letter stretched c - 0297)\r
+@ Croatian digraphs matching Serbian Cyrillic letters\r
+01C4 LATIN CAPITAL LETTER DZ WITH CARON\r
+ # 0044 017D\r
+01C5 LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON\r
+ # 0044 017E\r
+01C6 LATIN SMALL LETTER DZ WITH CARON\r
+ x (cyrillic small letter dzhe - 045F)\r
+ # 0064 017E\r
+01C7 LATIN CAPITAL LETTER LJ\r
+ # 004C 004A\r
+01C8 LATIN CAPITAL LETTER L WITH SMALL LETTER J\r
+ # 004C 006A\r
+01C9 LATIN SMALL LETTER LJ\r
+ x (cyrillic small letter lje - 0459)\r
+ # 006C 006A\r
+01CA LATIN CAPITAL LETTER NJ\r
+ # 004E 004A\r
+01CB LATIN CAPITAL LETTER N WITH SMALL LETTER J\r
+ # 004E 006A\r
+01CC LATIN SMALL LETTER NJ\r
+ x (cyrillic small letter nje - 045A)\r
+ # 006E 006A\r
+@ Pinyin diacritic-vowel combinations\r
+01CD LATIN CAPITAL LETTER A WITH CARON\r
+ : 0041 030C\r
+01CE LATIN SMALL LETTER A WITH CARON\r
+ * Pinyin third tone\r
+ : 0061 030C\r
+01CF LATIN CAPITAL LETTER I WITH CARON\r
+ : 0049 030C\r
+01D0 LATIN SMALL LETTER I WITH CARON\r
+ * Pinyin third tone\r
+ : 0069 030C\r
+01D1 LATIN CAPITAL LETTER O WITH CARON\r
+ : 004F 030C\r
+01D2 LATIN SMALL LETTER O WITH CARON\r
+ * Pinyin third tone\r
+ : 006F 030C\r
+01D3 LATIN CAPITAL LETTER U WITH CARON\r
+ : 0055 030C\r
+01D4 LATIN SMALL LETTER U WITH CARON\r
+ * Pinyin third tone\r
+ : 0075 030C\r
+01D5 LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON\r
+ : 00DC 0304\r
+01D6 LATIN SMALL LETTER U WITH DIAERESIS AND MACRON\r
+ * Pinyin first tone\r
+ : 00FC 0304\r
+01D7 LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE\r
+ : 00DC 0301\r
+01D8 LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE\r
+ * Pinyin second tone\r
+ : 00FC 0301\r
+01D9 LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON\r
+ : 00DC 030C\r
+01DA LATIN SMALL LETTER U WITH DIAERESIS AND CARON\r
+ * Pinyin third tone\r
+ : 00FC 030C\r
+01DB LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE\r
+ : 00DC 0300\r
+01DC LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE\r
+ * Pinyin fourth tone\r
+ : 00FC 0300\r
+@ Additions\r
+01DD LATIN SMALL LETTER TURNED E\r
+ * Pan-Nigerian alphabet\r
+ * all other usages of schwa are 0259\r
+ * uppercase is 018E\r
+ x (latin small letter schwa - 0259)\r
+01DE LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON\r
+ : 00C4 0304\r
+01DF LATIN SMALL LETTER A WITH DIAERESIS AND MACRON\r
+ * Livonian, Uralicist usage\r
+ : 00E4 0304\r
+01E0 LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON\r
+ : 0226 0304\r
+01E1 LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON\r
+ * Uralicist usage\r
+ : 0227 0304\r
+01E2 LATIN CAPITAL LETTER AE WITH MACRON (ash) *\r
+ : 00C6 0304\r
+01E3 LATIN SMALL LETTER AE WITH MACRON (ash) *\r
+ * Old Norse, Old English\r
+ : 00E6 0304\r
+01E4 LATIN CAPITAL LETTER G WITH STROKE\r
+01E5 LATIN SMALL LETTER G WITH STROKE\r
+ * Skolt Sámi\r
+01E6 LATIN CAPITAL LETTER G WITH CARON\r
+ : 0047 030C\r
+01E7 LATIN SMALL LETTER G WITH CARON\r
+ * Skolt Sámi\r
+ x (latin small letter g with breve - 011F)\r
+ : 0067 030C\r
+01E8 LATIN CAPITAL LETTER K WITH CARON\r
+ : 004B 030C\r
+01E9 LATIN SMALL LETTER K WITH CARON\r
+ * Skolt Sámi\r
+ : 006B 030C\r
+01EA LATIN CAPITAL LETTER O WITH OGONEK\r
+ : 004F 0328\r
+01EB LATIN SMALL LETTER O WITH OGONEK\r
+ * Sámi, Iroquoian, Old Icelandic\r
+ : 006F 0328\r
+01EC LATIN CAPITAL LETTER O WITH OGONEK AND MACRON\r
+ : 01EA 0304\r
+01ED LATIN SMALL LETTER O WITH OGONEK AND MACRON\r
+ * Old Icelandic\r
+ : 01EB 0304\r
+01EE LATIN CAPITAL LETTER EZH WITH CARON\r
+ : 01B7 030C\r
+01EF LATIN SMALL LETTER EZH WITH CARON\r
+ * Skolt Sámi\r
+ : 0292 030C\r
+01F0 LATIN SMALL LETTER J WITH CARON\r
+ * IPA and many languages\r
+ : 006A 030C\r
+01F1 LATIN CAPITAL LETTER DZ\r
+ # 0044 005A\r
+01F2 LATIN CAPITAL LETTER D WITH SMALL LETTER Z\r
+ # 0044 007A\r
+01F3 LATIN SMALL LETTER DZ\r
+ # 0064 007A\r
+01F4 LATIN CAPITAL LETTER G WITH ACUTE\r
+ : 0047 0301\r
+01F5 LATIN SMALL LETTER G WITH ACUTE\r
+ * Macedonian and Serbian transliteration\r
+ : 0067 0301\r
+01F6 LATIN CAPITAL LETTER HWAIR\r
+ * lowercase is 0195\r
+01F7 LATIN CAPITAL LETTER WYNN\r
+ = wen\r
+ * lowercase is 01BF\r
+01F8 LATIN CAPITAL LETTER N WITH GRAVE\r
+ : 004E 0300\r
+01F9 LATIN SMALL LETTER N WITH GRAVE\r
+ * Pinyin\r
+ : 006E 0300\r
+01FA LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE\r
+ : 00C5 0301\r
+01FB LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE\r
+ : 00E5 0301\r
+01FC LATIN CAPITAL LETTER AE WITH ACUTE (ash) *\r
+ : 00C6 0301\r
+01FD LATIN SMALL LETTER AE WITH ACUTE (ash) *\r
+ : 00E6 0301\r
+01FE LATIN CAPITAL LETTER O WITH STROKE AND ACUTE\r
+ : 00D8 0301\r
+01FF LATIN SMALL LETTER O WITH STROKE AND ACUTE\r
+ : 00F8 0301\r
+@ Additions for Slovenian and Croatian\r
+0200 LATIN CAPITAL LETTER A WITH DOUBLE GRAVE\r
+ : 0041 030F\r
+0201 LATIN SMALL LETTER A WITH DOUBLE GRAVE\r
+ : 0061 030F\r
+0202 LATIN CAPITAL LETTER A WITH INVERTED BREVE\r
+ : 0041 0311\r
+0203 LATIN SMALL LETTER A WITH INVERTED BREVE\r
+ : 0061 0311\r
+0204 LATIN CAPITAL LETTER E WITH DOUBLE GRAVE\r
+ : 0045 030F\r
+0205 LATIN SMALL LETTER E WITH DOUBLE GRAVE\r
+ : 0065 030F\r
+0206 LATIN CAPITAL LETTER E WITH INVERTED BREVE\r
+ : 0045 0311\r
+0207 LATIN SMALL LETTER E WITH INVERTED BREVE\r
+ : 0065 0311\r
+0208 LATIN CAPITAL LETTER I WITH DOUBLE GRAVE\r
+ : 0049 030F\r
+0209 LATIN SMALL LETTER I WITH DOUBLE GRAVE\r
+ : 0069 030F\r
+020A LATIN CAPITAL LETTER I WITH INVERTED BREVE\r
+ : 0049 0311\r
+020B LATIN SMALL LETTER I WITH INVERTED BREVE\r
+ : 0069 0311\r
+020C LATIN CAPITAL LETTER O WITH DOUBLE GRAVE\r
+ : 004F 030F\r
+020D LATIN SMALL LETTER O WITH DOUBLE GRAVE\r
+ : 006F 030F\r
+020E LATIN CAPITAL LETTER O WITH INVERTED BREVE\r
+ : 004F 0311\r
+020F LATIN SMALL LETTER O WITH INVERTED BREVE\r
+ : 006F 0311\r
+0210 LATIN CAPITAL LETTER R WITH DOUBLE GRAVE\r
+ : 0052 030F\r
+0211 LATIN SMALL LETTER R WITH DOUBLE GRAVE\r
+ : 0072 030F\r
+0212 LATIN CAPITAL LETTER R WITH INVERTED BREVE\r
+ : 0052 0311\r
+0213 LATIN SMALL LETTER R WITH INVERTED BREVE\r
+ : 0072 0311\r
+0214 LATIN CAPITAL LETTER U WITH DOUBLE GRAVE\r
+ : 0055 030F\r
+0215 LATIN SMALL LETTER U WITH DOUBLE GRAVE\r
+ : 0075 030F\r
+0216 LATIN CAPITAL LETTER U WITH INVERTED BREVE\r
+ : 0055 0311\r
+0217 LATIN SMALL LETTER U WITH INVERTED BREVE\r
+ : 0075 0311\r
+@ Additions for Romanian\r
+0218 LATIN CAPITAL LETTER S WITH COMMA BELOW *\r
+ : 0053 0326\r
+0219 LATIN SMALL LETTER S WITH COMMA BELOW *\r
+ * Romanian, when distinct comma below form is required\r
+ x (latin small letter s with cedilla - 015F)\r
+ : 0073 0326\r
+021A LATIN CAPITAL LETTER T WITH COMMA BELOW *\r
+ : 0054 0326\r
+021B LATIN SMALL LETTER T WITH COMMA BELOW *\r
+ * Romanian, when distinct comma below form is required\r
+ x (latin small letter t with cedilla - 0163)\r
+ : 0074 0326\r
+@ Miscellaneous additions\r
+021C LATIN CAPITAL LETTER YOGH\r
+ x (latin capital letter ezh - 01B7)\r
+021D LATIN SMALL LETTER YOGH\r
+ * Middle English, Scots\r
+ x (latin small letter ezh - 0292)\r
+ x (ounce sign - 2125)\r
+021E LATIN CAPITAL LETTER H WITH CARON\r
+ : 0048 030C\r
+021F LATIN SMALL LETTER H WITH CARON\r
+ * Finnish Romany\r
+ : 0068 030C\r
+0222 LATIN CAPITAL LETTER OU\r
+0223 LATIN SMALL LETTER OU\r
+ * Algonquin, Huron\r
+ x (digit eight - 0038)\r
+0224 LATIN CAPITAL LETTER Z WITH HOOK\r
+0225 LATIN SMALL LETTER Z WITH HOOK\r
+ * Middle High German\r
+0226 LATIN CAPITAL LETTER A WITH DOT ABOVE\r
+ : 0041 0307\r
+0227 LATIN SMALL LETTER A WITH DOT ABOVE\r
+ * Uralicist usage\r
+ : 0061 0307\r
+0228 LATIN CAPITAL LETTER E WITH CEDILLA\r
+ : 0045 0327\r
+0229 LATIN SMALL LETTER E WITH CEDILLA\r
+ : 0065 0327\r
+@ Additions for Livonian\r
+022A LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON\r
+ : 00D6 0304\r
+022B LATIN SMALL LETTER O WITH DIAERESIS AND MACRON\r
+ * Livonian\r
+ : 00F6 0304\r
+022C LATIN CAPITAL LETTER O WITH TILDE AND MACRON\r
+ : 00D5 0304\r
+022D LATIN SMALL LETTER O WITH TILDE AND MACRON\r
+ * Livonian\r
+ : 00F5 0304\r
+022E LATIN CAPITAL LETTER O WITH DOT ABOVE\r
+ : 004F 0307\r
+022F LATIN SMALL LETTER O WITH DOT ABOVE\r
+ * Livonian\r
+ : 006F 0307\r
+0230 LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON\r
+ : 022E 0304\r
+0231 LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON\r
+ * Livonian\r
+ : 022F 0304\r
+0232 LATIN CAPITAL LETTER Y WITH MACRON\r
+ : 0059 0304\r
+0233 LATIN SMALL LETTER Y WITH MACRON\r
+ * Livonian, Cornish\r
+ : 0079 0304\r
+@@ 0250 IPA Extensions 02AF\r
+@ IPA extensions\r
+@+ IPA includes basic Latin letters and a number of Latin letters from other blocks.\r
+ x (latin small letter ae - 00E6)\r
+ x (latin small letter c with cedilla - 00E7)\r
+ x (latin small letter eth - 00F0)\r
+ x (latin small letter o with stroke - 00F8)\r
+ x (latin small letter h with stroke - 0127)\r
+ x (latin small letter eng - 014B)\r
+ x (latin small ligature oe - 0153)\r
+ x (greek small letter beta - 03B2)\r
+ x (greek small letter theta - 03B8)\r
+ x (greek small letter lamda - 03BB)\r
+ x (greek small letter chi - 03C7)\r
+0250 LATIN SMALL LETTER TURNED A\r
+ * low central unrounded vowel\r
+0251 LATIN SMALL LETTER ALPHA\r
+ = LATIN SMALL LETTER SCRIPT A\r
+ * low back unrounded vowel\r
+ x (greek small letter alpha - 03B1)\r
+0252 LATIN SMALL LETTER TURNED ALPHA\r
+ * low back rounded vowel\r
+0253 LATIN SMALL LETTER B WITH HOOK\r
+ * implosive bilabial stop\r
+ * Pan-Nigerian alphabet\r
+ x (latin capital letter b with hook - 0181)\r
+0254 LATIN SMALL LETTER OPEN O\r
+ * typographically a turned c\r
+ * lower-mid back rounded vowel\r
+ x (latin capital letter open o - 0186)\r
+0255 LATIN SMALL LETTER C WITH CURL\r
+ * voiceless alveolo-palatal laminal fricative\r
+ * used in transcription of Mandarin Chinese\r
+ * sound spelled with 015B in Polish\r
+0256 LATIN SMALL LETTER D WITH TAIL\r
+ = LATIN SMALL LETTER D RETROFLEX HOOK\r
+ * voiced retroflex stop\r
+ x (latin capital letter african d - 0189)\r
+0257 LATIN SMALL LETTER D WITH HOOK\r
+ * implosive dental or alveolar stop\r
+ * Ewe, Pan-Nigerian alphabet\r
+ x (latin capital letter d with hook - 018A)\r
+0258 LATIN SMALL LETTER REVERSED E\r
+ * upper-mid central unrounded vowel\r
+0259 LATIN SMALL LETTER SCHWA\r
+ * mid-central unrounded vowel\r
+ * variant uppercase form 018E is associated with 01DD\r
+ x (latin capital letter schwa - 018F)\r
+ x (latin small letter turned e - 01DD)\r
+ x (cyrillic small letter schwa - 04D9)\r
+025A LATIN SMALL LETTER SCHWA WITH HOOK\r
+ * rhotacized schwa\r
+025B LATIN SMALL LETTER OPEN E\r
+ = LATIN SMALL LETTER EPSILON\r
+ * lower-mid front unrounded vowel\r
+ x (latin capital letter open e - 0190)\r
+ x (greek small letter epsilon - 03B5)\r
+025C LATIN SMALL LETTER REVERSED OPEN E\r
+ * lower-mid central unrounded vowel\r
+025D LATIN SMALL LETTER REVERSED OPEN E WITH HOOK\r
+ * rhotacized lower-mid central vowel\r
+025E LATIN SMALL LETTER CLOSED REVERSED OPEN E\r
+ = LATIN SMALL LETTER CLOSED REVERSED EPSILON\r
+ * lower-mid central rounded vowel\r
+025F LATIN SMALL LETTER DOTLESS J WITH STROKE\r
+ * voiced palatal stop\r
+ * typographically a turned f, but better thought of as a form of j\r
+ * "gy" in Hungarian orthography\r
+ * also archaic phonetic for palatoalveolar affricate 02A4\r
+0260 LATIN SMALL LETTER G WITH HOOK\r
+ * implosive velar stop\r
+ x (latin capital letter g with hook - 0193)\r
+0261 LATIN SMALL LETTER SCRIPT G\r
+ * voiced velar stop\r
+ x (latin small letter g - 0067)\r
+0262 LATIN LETTER SMALL CAPITAL G\r
+ * voiced uvular stop\r
+0263 LATIN SMALL LETTER GAMMA\r
+ * voiced velar fricative\r
+ x (latin capital letter gamma - 0194)\r
+ x (greek small letter gamma - 03B3)\r
+0264 LATIN SMALL LETTER RAMS HORN\r
+ = LATIN SMALL LETTER BABY GAMMA\r
+ * upper-mid back unrounded vowel\r
+0265 LATIN SMALL LETTER TURNED H\r
+ * voiced rounded palatal approximant\r
+0266 LATIN SMALL LETTER H WITH HOOK\r
+ * breathy-voiced glottal fricative\r
+ x (modifier letter small h with hook - 02B1)\r
+0267 LATIN SMALL LETTER HENG WITH HOOK\r
+ * voiceless coarticulated velar and palatoalveolar fricative\r
+ * "tj" or "kj" or "sj" in some Swedish dialects\r
+0268 LATIN SMALL LETTER I WITH STROKE\r
+ = barred i, i bar\r
+ * high central unrounded vowel\r
+ * ISO 6438 gives lowercase of 0197 as 026A, not 0268\r
+0269 LATIN SMALL LETTER IOTA\r
+ * semi-high front unrounded vowel\r
+@+ * obsoleted by IPA in 1989\r
+ * preferred use is 026A LATIN LETTER SMALL CAPITAL I\r
+ x (latin capital letter iota - 0196)\r
+ x (greek small letter iota - 03B9)\r
+026A LATIN LETTER SMALL CAPITAL I\r
+ * semi-high front unrounded vowel\r
+ * preferred IPA alternate for 0269\r
+ x (latin capital letter i with stroke - 0197)\r
+026B LATIN SMALL LETTER L WITH MIDDLE TILDE\r
+ * velarized voiced alveolar lateral approximant\r
+026C LATIN SMALL LETTER L WITH BELT\r
+ * voiceless alveolar lateral fricative\r
+026D LATIN SMALL LETTER L WITH RETROFLEX HOOK\r
+ * voiced retroflex lateral\r
+026E LATIN SMALL LETTER LEZH\r
+ * voiced lateral fricative\r
+ * "dhl" in Zulu orthography\r
+026F LATIN SMALL LETTER TURNED M\r
+ * high back unrounded vowel\r
+ x (latin capital letter turned m - 019C)\r
+0270 LATIN SMALL LETTER TURNED M WITH LONG LEG\r
+ * voiced velar approximant\r
+0271 LATIN SMALL LETTER M WITH HOOK\r
+ * voiced labiodental nasal\r
+0272 LATIN SMALL LETTER N WITH LEFT HOOK\r
+ * voiced palatal nasal\r
+ x (latin capital letter n with left hook - 019D)\r
+0273 LATIN SMALL LETTER N WITH RETROFLEX HOOK\r
+ * voiced retroflex nasal\r
+0274 LATIN LETTER SMALL CAPITAL N\r
+ * voiced uvular nasal\r
+0275 LATIN SMALL LETTER BARRED O\r
+ = o bar\r
+ * rounded mid-central vowel, i.e. rounded schwa\r
+ * uppercase is 019F\r
+ x (greek small letter theta - 03B8)\r
+ x (cyrillic small letter fita - 0473)\r
+ x (cyrillic small letter barred o - 04E9)\r
+0276 LATIN LETTER SMALL CAPITAL OE\r
+ * low front rounded vowel\r
+ x (latin small ligature oe - 0153)\r
+0277 LATIN SMALL LETTER CLOSED OMEGA\r
+ * semi-high back rounded vowel\r
+@+ * obsoleted by IPA in 1989\r
+ * preferred use is 028A latin small letter upsilon\r
+0278 LATIN SMALL LETTER PHI\r
+ * voiceless bilabial fricative\r
+ x (greek small letter phi - 03C6)\r
+0279 LATIN SMALL LETTER TURNED R\r
+ * voiced alveolar approximant\r
+ x (modifier letter small turned r - 02B4)\r
+027A LATIN SMALL LETTER TURNED R WITH LONG LEG\r
+ * voiced lateral flap\r
+027B LATIN SMALL LETTER TURNED R WITH HOOK\r
+ * voiced retroflex approximant\r
+ x (modifier letter small turned r with hook - 02B5)\r
+027C LATIN SMALL LETTER R WITH LONG LEG\r
+ * voiced strident apico-alveolar trill\r
+@+ * obsoleted by IPA in 1989\r
+ * sound spelled with 0159 in Czech\r
+ * preferred phonetic representation for Czech is 0072 031D\r
+ * in current use in Gaelic types (as glyph variant of 0072)\r
+027D LATIN SMALL LETTER R WITH TAIL\r
+ * voiced retroflex flap\r
+027E LATIN SMALL LETTER R WITH FISHHOOK\r
+ * voiced alveolar flap or tap\r
+027F LATIN SMALL LETTER REVERSED R WITH FISHHOOK\r
+ * apical dental vowel\r
+ * used in Sinological tradition\r
+ * IPA spelling - 007A 0329\r
+0280 LATIN LETTER SMALL CAPITAL R *\r
+ * voiced uvular trill\r
+ * Germanic, Old Norse\r
+ * uppercase is 01A6\r
+0281 LATIN LETTER SMALL CAPITAL INVERTED R\r
+ * voiced uvular fricative or approximant\r
+ x (modifier letter small capital inverted r - 02B6)\r
+0282 LATIN SMALL LETTER S WITH HOOK\r
+ * voiceless retroflex fricative\r
+0283 LATIN SMALL LETTER ESH\r
+ * voiceless postalveolar fricative\r
+ x (latin capital letter esh - 01A9)\r
+ x (integral - 222B)\r
+0284 LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK\r
+ * implosive palatal stop\r
+ * typographically based on 025F, not on 0283\r
+0285 LATIN SMALL LETTER SQUAT REVERSED ESH\r
+ * apical retroflex vowel\r
+ * used in Sinological tradition\r
+ * IPA spelling - 0290 0329\r
+0286 LATIN SMALL LETTER ESH WITH CURL\r
+ * palatalized voiceless postalveolar fricative\r
+ * suggested spelling - 0283 02B2\r
+0287 LATIN SMALL LETTER TURNED T\r
+ * dental click (sound of "tsk tsk")\r
+ x (latin letter dental click - 01C0)\r
+0288 LATIN SMALL LETTER T WITH RETROFLEX HOOK\r
+ * voiceless retroflex stop\r
+ x (latin capital letter t with retroflex hook - 01AE)\r
+0289 LATIN SMALL LETTER U BAR\r
+ * high central rounded vowel\r
+028A LATIN SMALL LETTER UPSILON\r
+ * semi-high back rounded vowel\r
+ * preferred IPA alternate to 0277\r
+ x (latin capital letter upsilon - 01B1)\r
+ x (greek small letter upsilon - 03C5)\r
+028B LATIN SMALL LETTER V WITH HOOK\r
+ = LATIN SMALL LETTER SCRIPT V\r
+ * voiced labiodental approximant\r
+ x (latin capital letter v with hook - 01B2)\r
+ x (greek small letter upsilon - 03C5)\r
+028C LATIN SMALL LETTER TURNED V\r
+ = caret, wedge\r
+ * lower-mid back unrounded vowel\r
+ x (greek capital letter lamda - 039B)\r
+ x (caret - 2038)\r
+ x (logical and - 2227)\r
+028D LATIN SMALL LETTER TURNED W\r
+ * voiceless rounded labiovelar approximant\r
+028E LATIN SMALL LETTER TURNED Y\r
+ * voiced lateral approximant\r
+028F LATIN LETTER SMALL CAPITAL Y\r
+ * semi-high front rounded vowel\r
+0290 LATIN SMALL LETTER Z WITH RETROFLEX HOOK\r
+ * voiced retroflex fricative\r
+0291 LATIN SMALL LETTER Z WITH CURL\r
+ * voiced alveolo-palatal laminal fricative\r
+ * sound spelled with 017A in Polish\r
+0292 LATIN SMALL LETTER EZH\r
+ = LATIN SMALL LETTER YOGH\r
+ = dram\r
+ * voiced postalveolar fricative\r
+ * uppercase is 01B7\r
+ * Skolt Sámi\r
+ x (latin small letter yogh - 021D)\r
+ x (cyrillic small letter abkhasian dze - 04E1)\r
+ x (ounce sign - 2125)\r
+0293 LATIN SMALL LETTER EZH WITH CURL\r
+ * palatalized voiced postalveolar fricative\r
+0294 LATIN LETTER GLOTTAL STOP\r
+ x (modifier letter glottal stop - 02C0)\r
+0295 LATIN LETTER PHARYNGEAL VOICED FRICATIVE\r
+ = LATIN LETTER REVERSED GLOTTAL STOP\r
+ * voiced pharyngeal fricative\r
+ * ain\r
+ x (latin small letter ezh reversed - 01B9)\r
+ x (modifier letter reversed glottal stop - 02C1)\r
+0296 LATIN LETTER INVERTED GLOTTAL STOP\r
+ * lateral click\r
+ x (latin letter lateral click - 01C1)\r
+0297 LATIN LETTER STRETCHED C\r
+ * palatal (or alveolar) click\r
+ x (latin letter retroflex click - 01C3)\r
+ x (complement - 2201)\r
+0298 LATIN LETTER BILABIAL CLICK\r
+ = LATIN LETTER BULLSEYE\r
+ x (circled dot operator - 2299)\r
+0299 LATIN LETTER SMALL CAPITAL B\r
+ * bilabial trill\r
+029A LATIN SMALL LETTER CLOSED OPEN E\r
+ = LATIN SMALL LETTER CLOSED EPSILON\r
+ * lower-mid front rounded vowel\r
+ * non-IPA alternate for the preferred 0153\r
+029B LATIN LETTER SMALL CAPITAL G WITH HOOK\r
+ * voiced uvular implosive\r
+029C LATIN LETTER SMALL CAPITAL H\r
+ * voiceless epiglottal fricative\r
+029D LATIN SMALL LETTER J WITH CROSSED-TAIL\r
+ * voiced palatal fricative\r
+029E LATIN SMALL LETTER TURNED K\r
+ * proposed for velar click\r
+@+ * withdrawn by IPA in 1970\r
+029F LATIN LETTER SMALL CAPITAL L\r
+ * velar lateral approximant\r
+02A0 LATIN SMALL LETTER Q WITH HOOK\r
+ * voiceless uvular implosive\r
+02A1 LATIN LETTER GLOTTAL STOP WITH STROKE\r
+ * voiced epiglottal stop\r
+02A2 LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE\r
+ * voiced epiglottal fricative\r
+02A3 LATIN SMALL LETTER DZ DIGRAPH\r
+ * voiced dental affricate\r
+02A4 LATIN SMALL LETTER DEZH DIGRAPH\r
+ * voiced postalveolar affricate\r
+02A5 LATIN SMALL LETTER DZ DIGRAPH WITH CURL\r
+ * voiced alveolo-palatal affricate\r
+02A6 LATIN SMALL LETTER TS DIGRAPH\r
+ * voiceless dental affricate\r
+02A7 LATIN SMALL LETTER TESH DIGRAPH\r
+ * voiceless postalveolar affricate\r
+02A8 LATIN SMALL LETTER TC DIGRAPH WITH CURL\r
+ * voiceless alveolo-palatal affricate\r
+@ IPA characters for disordered speech\r
+02A9 LATIN SMALL LETTER FENG DIGRAPH\r
+ * velopharyngeal fricative\r
+02AA LATIN SMALL LETTER LS DIGRAPH\r
+ * lateral alveolar fricative (lisp)\r
+02AB LATIN SMALL LETTER LZ DIGRAPH\r
+ * voiced lateral alveolar fricative\r
+02AC LATIN LETTER BILABIAL PERCUSSIVE\r
+ * audible lip smack\r
+02AD LATIN LETTER BIDENTAL PERCUSSIVE\r
+ * audible teeth gnashing\r
+@@ 02B0 Spacing Modifier Letters 02FF\r
+@ Phonetic modifiers derived from Latin letters\r
+02B0 MODIFIER LETTER SMALL H\r
+ * aspiration\r
+ # <super> 0068\r
+02B1 MODIFIER LETTER SMALL H WITH HOOK\r
+ * breathy voiced, murmured\r
+ x (latin small letter h with hook - 0266)\r
+ x (combining diaeresis below - 0324)\r
+ # <super> 0266\r
+02B2 MODIFIER LETTER SMALL J\r
+ * palatalization\r
+ x (combining palatalized hook below - 0321)\r
+ # <super> 006A\r
+02B3 MODIFIER LETTER SMALL R\r
+ # <super> 0072\r
+02B4 MODIFIER LETTER SMALL TURNED R\r
+ x (latin small letter turned r - 0279)\r
+ # <super> 0279\r
+02B5 MODIFIER LETTER SMALL TURNED R WITH HOOK\r
+ x (latin small letter turned r with hook - 027B)\r
+ # <super> 027B\r
+02B6 MODIFIER LETTER SMALL CAPITAL INVERTED R\r
+ * preceding four used for r-coloring or r-offglides\r
+ x (latin letter small capital inverted r - 0281)\r
+ # <super> 0281\r
+02B7 MODIFIER LETTER SMALL W\r
+ * labialization\r
+ x (combining inverted double arch below - 032B)\r
+ # <super> 0077\r
+02B8 MODIFIER LETTER SMALL Y\r
+ * palatalization\r
+ * common Americanist substitution for 02B2\r
+ # <super> 0079\r
+@ Miscellaneous phonetic modifiers\r
+02B9 MODIFIER LETTER PRIME\r
+ * primary stress, emphasis\r
+ * transliteration of mjagkij znak (Cyrillic soft sign: palatalization)\r
+ x (apostrophe - 0027)\r
+ x (acute accent - 00B4)\r
+ x (modifier letter acute accent - 02CA)\r
+ x (combining acute accent - 0301)\r
+ x (greek numeral sign - 0374)\r
+ x (prime - 2032)\r
+02BA MODIFIER LETTER DOUBLE PRIME\r
+ * exaggerated stress, contrastive stress\r
+ * transliteration of tverdyj znak (Cyrillic hard sign: no palatalization)\r
+ x (quotation mark - 0022)\r
+ x (combining double acute accent - 030B)\r
+ x (double prime - 2033)\r
+02BB MODIFIER LETTER TURNED COMMA\r
+ * typographical alternate for 02BD or 02BF\r
+ x (combining turned comma above - 0312)\r
+ x (left single quotation mark - 2018)\r
+02BC MODIFIER LETTER APOSTROPHE\r
+ = apostrophe\r
+ * glottal stop, glottalization, ejective\r
+ * spacing clone of Greek smooth breathing mark\r
+ * many languages use this as a letter of their alphabets\r
+ x (apostrophe - 0027)\r
+ x (combining comma above - 0313)\r
+ x (combining comma above right - 0315)\r
+ x (armenian apostrophe - 055A)\r
+ x (right single quotation mark - 2019)\r
+02BD MODIFIER LETTER REVERSED COMMA\r
+ * weak aspiration\r
+ * spacing clone of Greek rough breathing mark\r
+ x (combining reversed comma above - 0314)\r
+ x (armenian modifier letter left half ring - 0559)\r
+ x (single high-reversed-9 quotation mark - 201B)\r
+02BE MODIFIER LETTER RIGHT HALF RING\r
+ * transliteration of Arabic hamza (glottal stop)\r
+ x (armenian apostrophe - 055A)\r
+ x (arabic letter hamza - 0621)\r
+02BF MODIFIER LETTER LEFT HALF RING\r
+ * transliteration of Arabic ain (voiced pharyngeal fricative)\r
+ x (armenian modifier letter left half ring - 0559)\r
+ x (arabic letter ain - 0639)\r
+02C0 MODIFIER LETTER GLOTTAL STOP\r
+ * ejective or glottalized\r
+ * typographical alternate for 02BC or 02BE\r
+ x (latin letter glottal stop - 0294)\r
+ x (combining hook above - 0309)\r
+02C1 MODIFIER LETTER REVERSED GLOTTAL STOP\r
+ * typographical alternate for 02BF\r
+ x (latin letter pharyngeal voiced fricative - 0295)\r
+02C2 MODIFIER LETTER LEFT ARROWHEAD\r
+ * fronted articulation\r
+02C3 MODIFIER LETTER RIGHT ARROWHEAD\r
+ * backed articulation\r
+02C4 MODIFIER LETTER UP ARROWHEAD\r
+ * raised articulation\r
+ x (circumflex accent - 005E)\r
+ x (up arrowhead - 2303)\r
+02C5 MODIFIER LETTER DOWN ARROWHEAD\r
+ * lowered articulation\r
+02C6 MODIFIER LETTER CIRCUMFLEX ACCENT\r
+ * rising-falling tone, falling tone, secondary stress, etc.\r
+ x (circumflex accent - 005E)\r
+ x (combining circumflex accent - 0302)\r
+02C7 CARON (Mandarin Chinese third tone)\r
+ = hacek\r
+ * falling-rising tone\r
+ * Mandarin Chinese third tone\r
+ x (combining caron - 030C)\r
+02C8 MODIFIER LETTER VERTICAL LINE\r
+ * primary stress, downstep\r
+ * precedes letter or syllable modified\r
+ x (apostrophe - 0027)\r
+ x (combining vertical line above - 030D)\r
+02C9 MODIFIER LETTER MACRON (Mandarin Chinese first tone)\r
+ * high level tone\r
+ * precedes or follows letter or syllable modified\r
+ * Mandarin Chinese first tone\r
+ x (macron - 00AF)\r
+ x (combining macron - 0304)\r
+02CA MODIFIER LETTER ACUTE ACCENT (Mandarin Chinese second tone)\r
+ * high-rising tone (IPA), high tone, primary stress\r
+ * Mandarin Chinese second tone\r
+ x (acute accent - 00B4)\r
+ x (modifier letter prime - 02B9)\r
+ x (combining acute accent - 0301)\r
+ x (greek numeral sign - 0374)\r
+ x (armenian emphasis mark - 055B)\r
+02CB MODIFIER LETTER GRAVE ACCENT (Mandarin Chinese fourth tone)\r
+ * high-falling tone (IPA), low tone, secondary or tertiary stress\r
+ * Mandarin Chinese fourth tone\r
+ x (grave accent - 0060)\r
+ x (combining grave accent - 0300)\r
+ x (armenian comma - 055D)\r
+02CC MODIFIER LETTER LOW VERTICAL LINE\r
+ * secondary stress\r
+ * precedes letter or syllable modified\r
+ x (combining vertical line below - 0329)\r
+02CD MODIFIER LETTER LOW MACRON\r
+ * low level tone\r
+ x (low line - 005F)\r
+ x (combining macron below - 0331)\r
+02CE MODIFIER LETTER LOW GRAVE ACCENT\r
+ * low-falling tone\r
+02CF MODIFIER LETTER LOW ACUTE ACCENT\r
+ * low-rising tone\r
+ x (greek lower numeral sign - 0375)\r
+02D0 MODIFIER LETTER TRIANGULAR COLON\r
+ * length mark\r
+ x (colon - 003A)\r
+02D1 MODIFIER LETTER HALF TRIANGULAR COLON\r
+ * half-length mark\r
+ x (middle dot - 00B7)\r
+02D2 MODIFIER LETTER CENTRED RIGHT HALF RING\r
+ * more rounded articulation\r
+02D3 MODIFIER LETTER CENTRED LEFT HALF RING\r
+ * less rounded articulation\r
+02D4 MODIFIER LETTER UP TACK\r
+ * vowel raising or closing\r
+ x (combining up tack below - 031D)\r
+ x (combining dot below - 0323)\r
+02D5 MODIFIER LETTER DOWN TACK\r
+ * vowel lowering or opening\r
+ x (combining left half ring below - 031C)\r
+ x (combining down tack below - 031E)\r
+02D6 MODIFIER LETTER PLUS SIGN\r
+ * advanced or fronted articulation\r
+ x (combining plus sign below - 031F)\r
+02D7 MODIFIER LETTER MINUS SIGN\r
+ * retracted or backed articulation\r
+ * glyph may have small end-serifs\r
+ x (combining minus sign below - 0320)\r
+@ Spacing clones of diacritics\r
+02D8 BREVE\r
+ x (combining breve - 0306)\r
+ # 0020 0306\r
+02D9 DOT ABOVE (Mandarin Chinese light tone)\r
+ * Mandarin Chinese fifth tone (light or neutral)\r
+ x (combining dot above - 0307)\r
+ # 0020 0307\r
+02DA RING ABOVE\r
+ x (degree sign - 00B0)\r
+ x (combining ring above - 030A)\r
+ # 0020 030A\r
+02DB OGONEK\r
+ x (combining ogonek - 0328)\r
+ # 0020 0328\r
+02DC SMALL TILDE\r
+ x (tilde - 007E)\r
+ x (combining tilde - 0303)\r
+ x (tilde operator - 223C)\r
+ # 0020 0303\r
+02DD DOUBLE ACUTE ACCENT\r
+ x (combining double acute accent - 030B)\r
+ # 0020 030B\r
+@ Additions based on 1989 IPA\r
+02DE MODIFIER LETTER RHOTIC HOOK\r
+ * rhotacization in vowel\r
+ * often ligated: 025A = 0259 + 02DE; 025D = 025C + 02DE\r
+02DF MODIFIER LETTER CROSS ACCENT\r
+ * Swedish grave accent\r
+02E0 MODIFIER LETTER SMALL GAMMA\r
+ * these modifier letters are occasionally used in transcription of affricates\r
+ # <super> 0263\r
+02E1 MODIFIER LETTER SMALL L\r
+ # <super> 006C\r
+02E2 MODIFIER LETTER SMALL S\r
+ # <super> 0073\r
+02E3 MODIFIER LETTER SMALL X\r
+ # <super> 0078\r
+02E4 MODIFIER LETTER SMALL REVERSED GLOTTAL STOP\r
+ # <super> 0295\r
+@ Tone letters\r
+02E5 MODIFIER LETTER EXTRA-HIGH TONE BAR\r
+02E6 MODIFIER LETTER HIGH TONE BAR\r
+02E7 MODIFIER LETTER MID TONE BAR\r
+02E8 MODIFIER LETTER LOW TONE BAR\r
+02E9 MODIFIER LETTER EXTRA-LOW TONE BAR\r
+02EA MODIFIER LETTER YIN DEPARTING TONE MARK\r
+02EB MODIFIER LETTER YANG DEPARTING TONE MARK\r
+@ IPA modifiers\r
+02EC MODIFIER LETTER VOICING\r
+02ED MODIFIER LETTER UNASPIRATED\r
+@ Other modifier letters\r
+02EE MODIFIER LETTER DOUBLE APOSTROPHE\r
+\r
+2000 EN QUAD\r
+ : 2002 en space\r
+2001 EM QUAD\r
+ = mutton quad\r
+ : 2003 em space\r
+2002 EN SPACE\r
+ = nut\r
+ * half an em\r
+ # 0020 space\r
+2003 EM SPACE\r
+ = mutton\r
+ * nominally, a space equal to the type size in points\r
+ * may scale by the condensation factor of a font\r
+ # 0020 space\r
+2004 THREE-PER-EM SPACE\r
+ = thick space\r
+ # 0020 space\r
+2005 FOUR-PER-EM SPACE\r
+ = mid space\r
+ # 0020 space\r
+2006 SIX-PER-EM SPACE\r
+ * in computer typography sometimes equated to thin space\r
+ # 0020 space\r
+2007 FIGURE SPACE\r
+ * space equal to tabular width of a font\r
+ * this is equivalent to the digit width of fonts with fixed-width digits\r
+ # <noBreak> 0020\r
+2008 PUNCTUATION SPACE\r
+ * space equal to narrow punctuation of a font\r
+ # 0020 space\r
+2009 THIN SPACE\r
+ * a fifth of an em (or sometimes a sixth)\r
+ # 0020 space\r
+200A HAIR SPACE\r
+ * thinner than a thin space\r
+ * in traditional typography, the thinnest space available\r
+ # 0020 space\r
+200B ZERO WIDTH SPACE\r
+ * nominally zero width, but may expand in justification\r
+@ Formatting characters\r
+200C ZERO WIDTH NON-JOINER\r
+ = ZWNJ\r
+200D ZERO WIDTH JOINER\r
+ = ZWJ\r
+200E LEFT-TO-RIGHT MARK\r
+ = LRM\r
+200F RIGHT-TO-LEFT MARK\r
+ = RLM\r
+@ Dashes\r
+2010 HYPHEN\r
+ x (hyphen-minus - 002D)\r
+2011 NON-BREAKING HYPHEN\r
+ x (hyphen-minus - 002D)\r
+ # <noBreak> 2010\r
+2012 FIGURE DASH\r
+2013 EN DASH\r
+2014 EM DASH\r
+ * may be used in pairs to offset parenthetical text\r
+ x (katakana-hiragana prolonged sound mark - 30FC)\r
+2015 HORIZONTAL BAR\r
+ = QUOTATION DASH\r
+ * long dash introducing quoted text\r
+@ General punctuation\r
+2016 DOUBLE VERTICAL LINE\r
+ * used in pairs to indicate norm of a matrix\r
+ x (parallel to - 2225)\r
+2017 DOUBLE LOW LINE\r
+ * this is a spacing character\r
+ x (low line - 005F)\r
+ x (combining double low line - 0333)\r
+ # 0020 0333\r
+2018 LEFT SINGLE QUOTATION MARK\r
+ = SINGLE TURNED COMMA QUOTATION MARK\r
+ * this is the preferred glyph (as opposed to 201B)\r
+ x (apostrophe - 0027)\r
+ x (modifier letter turned comma - 02BB)\r
+ x (heavy single turned comma quotation mark ornament - 275B)\r
+2019 RIGHT SINGLE QUOTATION MARK\r
+ = SINGLE COMMA QUOTATION MARK\r
+ * this is the preferred character to use for apostrophe\r
+ x (apostrophe - 0027)\r
+ x (modifier letter apostrophe - 02BC)\r
+ x (heavy single comma quotation mark ornament - 275C)\r
+201A SINGLE LOW-9 QUOTATION MARK\r
+ = LOW SINGLE COMMA QUOTATION MARK\r
+ * used as opening single quotation mark in some languages\r
+201B SINGLE HIGH-REVERSED-9 QUOTATION MARK\r
+ = SINGLE REVERSED COMMA QUOTATION MARK\r
+ * glyph variant of 2018\r
+ x (modifier letter reversed comma - 02BD)\r
+201C LEFT DOUBLE QUOTATION MARK\r
+ = DOUBLE TURNED COMMA QUOTATION MARK\r
+ * this is the preferred glyph (as opposed to 201F)\r
+ x (quotation mark - 0022)\r
+ x (heavy double turned comma quotation mark ornament - 275D)\r
+ x (reversed double prime quotation mark - 301D)\r
+201D RIGHT DOUBLE QUOTATION MARK\r
+ = DOUBLE COMMA QUOTATION MARK\r
+ x (quotation mark - 0022)\r
+ x (double prime - 2033)\r
+ x (heavy double comma quotation mark ornament - 275E)\r
+ x (double prime quotation mark - 301E)\r
+201E DOUBLE LOW-9 QUOTATION MARK\r
+ = LOW DOUBLE COMMA QUOTATION MARK\r
+ * used as opening double quotation mark in some languages\r
+ x (low double prime quotation mark - 301F)\r
+201F DOUBLE HIGH-REVERSED-9 QUOTATION MARK\r
+ = DOUBLE REVERSED COMMA QUOTATION MARK\r
+ * glyph variant of 201C\r
+2020 DAGGER\r
+ = obelisk, obelus, long cross\r
+2021 DOUBLE DAGGER\r
+ = diesis, double obelisk\r
+2022 BULLET\r
+ = black small circle\r
+ x (middle dot - 00B7)\r
+ x (one dot leader - 2024)\r
+ x (bullet operator - 2219)\r
+ x (inverse bullet - 25D8)\r
+ x (white bullet - 25E6)\r
+2023 TRIANGULAR BULLET\r
+ x (end of proof - 220E)\r
+ x (black right-pointing small triangle - 25B8)\r
+2024 ONE DOT LEADER\r
+ x (middle dot - 00B7)\r
+ x (bullet - 2022)\r
+ x (bullet operator - 2219)\r
+ # 002E full stop\r
+2025 TWO DOT LEADER\r
+ # 002E 002E\r
+2026 HORIZONTAL ELLIPSIS\r
+ = three dot leader\r
+ x (vertical ellipsis - 22EE)\r
+ # 002E 002E 002E\r
+2027 HYPHENATION POINT\r
+@ Formatting characters\r
+2028 LINE SEPARATOR\r
+ * may be used to represent this semantic unambiguously\r
+2029 PARAGRAPH SEPARATOR\r
+ * may be used to represent this semantic unambiguously\r
+202A LEFT-TO-RIGHT EMBEDDING\r
+ = LRE\r
+202B RIGHT-TO-LEFT EMBEDDING\r
+ = RLE\r
+202C POP DIRECTIONAL FORMATTING\r
+ = PDF\r
+202D LEFT-TO-RIGHT OVERRIDE\r
+ = LRO\r
+202E RIGHT-TO-LEFT OVERRIDE\r
+ = RLO\r
+202F NARROW NO-BREAK SPACE\r
+ x (no-break space - 00A0)\r
+ # <noBreak> 0020\r
+@ General punctuation\r
+2030 PER MILLE SIGN\r
+ x (percent sign - 0025)\r
+2031 PER TEN THOUSAND SIGN\r
+ x (percent sign - 0025)\r
+2032 PRIME\r
+ = minutes, feet\r
+ x (apostrophe - 0027)\r
+ x (acute accent - 00B4)\r
+ x (modifier letter prime - 02B9)\r
+2033 DOUBLE PRIME\r
+ = seconds, inches\r
+ x (quotation mark - 0022)\r
+ x (modifier letter double prime - 02BA)\r
+ x (right double quotation mark - 201D)\r
+ x (ditto mark - 3003)\r
+ x (double prime quotation mark - 301E)\r
+ # 2032 2032\r
+2034 TRIPLE PRIME\r
+ # 2032 2032 2032\r
+2035 REVERSED PRIME\r
+ x (grave accent - 0060)\r
+2036 REVERSED DOUBLE PRIME\r
+ x (reversed double prime quotation mark - 301D)\r
+ # 2035 2035\r
+2037 REVERSED TRIPLE PRIME\r
+ # 2035 2035 2035\r
+2038 CARET\r
+ x (up arrowhead - 2303)\r
+2039 SINGLE LEFT-POINTING ANGLE QUOTATION MARK\r
+ = LEFT POINTING SINGLE GUILLEMET\r
+ * usually opening, sometimes closing\r
+ x (less-than sign - 003C)\r
+ x (left-pointing angle bracket - 2329)\r
+ x (left angle bracket - 3008)\r
+203A SINGLE RIGHT-POINTING ANGLE QUOTATION MARK\r
+ = RIGHT POINTING SINGLE GUILLEMET\r
+ * usually closing, sometimes opening\r
+ x (greater-than sign - 003E)\r
+ x (right-pointing angle bracket - 232A)\r
+ x (right angle bracket - 3009)\r
+203B REFERENCE MARK\r
+ = Japanese kome\r
+ = Urdu paragraph separator\r
+ x (tibetan ku ru kha bzhi mig can - 0FBF)\r
+203C DOUBLE EXCLAMATION MARK\r
+ x (exclamation mark - 0021)\r
+ # 0021 0021\r
+203D INTERROBANG\r
+ x (exclamation mark - 0021)\r
+ x (question mark - 003F)\r
+203E OVERLINE\r
+ = SPACING OVERSCORE\r
+ # 0020 0305\r
+203F UNDERTIE (Enotikon)\r
+ = Greek enotikon\r
+ x (smile - 2323)\r
+2040 CHARACTER TIE\r
+ x (frown - 2322)\r
+2041 CARET INSERTION POINT\r
+ * proofreader's mark: insert here\r
+ x (right semidirect product - 22CC)\r
+2042 ASTERISM\r
+2043 HYPHEN BULLET\r
+2044 FRACTION SLASH\r
+ = solidus (in typography)\r
+ * for composing arbitrary fractions\r
+ x (solidus - 002F)\r
+ x (division slash - 2215)\r
+2045 LEFT SQUARE BRACKET WITH QUILL\r
+2046 RIGHT SQUARE BRACKET WITH QUILL\r
+2048 QUESTION EXCLAMATION MARK\r
+ * designed for use in vertical text\r
+ # 003F 0021\r
+2049 EXCLAMATION QUESTION MARK\r
+ * designed for use in vertical text\r
+ # 0021 003F\r
+204A TIRONIAN SIGN ET\r
+ * Irish Gaelic, ...\r
+204B REVERSED PILCROW SIGN\r
+ x (pilcrow sign - 00B6)\r
+204C BLACK LEFTWARDS BULLET\r
+204D BLACK RIGHTWARDS BULLET\r
+@ Deprecated\r
+206A INHIBIT SYMMETRIC SWAPPING\r
+206B ACTIVATE SYMMETRIC SWAPPING\r
+206C INHIBIT ARABIC FORM SHAPING\r
+206D ACTIVATE ARABIC FORM SHAPING\r
+206E NATIONAL DIGIT SHAPES\r
+206F NOMINAL DIGIT SHAPES\r
+@@ 2070 Superscripts and Subscripts 209F\r
+@ Superscripts\r
+2070 SUPERSCRIPT ZERO\r
+ # <super> 0030\r
+2071 <reserved>\r
+ x (superscript one - 00B9)\r
+2072 <reserved>\r
+ x (superscript two - 00B2)\r
+2073 <reserved>\r
+ x (superscript three - 00B3)\r
+2074 SUPERSCRIPT FOUR\r
+ # <super> 0034\r
+2075 SUPERSCRIPT FIVE\r
+ # <super> 0035\r
+2076 SUPERSCRIPT SIX\r
+ # <super> 0036\r
+2077 SUPERSCRIPT SEVEN\r
+ # <super> 0037\r
+2078 SUPERSCRIPT EIGHT\r
+ # <super> 0038\r
+2079 SUPERSCRIPT NINE\r
+ # <super> 0039\r
+207A SUPERSCRIPT PLUS SIGN\r
+ # <super> 002B\r
+207B SUPERSCRIPT MINUS\r
+ # <super> 2212\r
+207C SUPERSCRIPT EQUALS SIGN\r
+ # <super> 003D\r
+207D SUPERSCRIPT LEFT PARENTHESIS\r
+ # <super> 0028\r
+207E SUPERSCRIPT RIGHT PARENTHESIS\r
+ # <super> 0029\r
+207F SUPERSCRIPT LATIN SMALL LETTER N\r
+ # <super> 006E\r
+@ Subscripts\r
+2080 SUBSCRIPT ZERO\r
+ # <sub> 0030\r
+2081 SUBSCRIPT ONE\r
+ # <sub> 0031\r
+2082 SUBSCRIPT TWO\r
+ # <sub> 0032\r
+2083 SUBSCRIPT THREE\r
+ # <sub> 0033\r
+2084 SUBSCRIPT FOUR\r
+ # <sub> 0034\r
+2085 SUBSCRIPT FIVE\r
+ # <sub> 0035\r
+2086 SUBSCRIPT SIX\r
+ # <sub> 0036\r
+2087 SUBSCRIPT SEVEN\r
+ # <sub> 0037\r
+2088 SUBSCRIPT EIGHT\r
+ # <sub> 0038\r
+2089 SUBSCRIPT NINE\r
+ # <sub> 0039\r
+208A SUBSCRIPT PLUS SIGN\r
+ # <sub> 002B\r
+208B SUBSCRIPT MINUS\r
+ # <sub> 2212\r
+208C SUBSCRIPT EQUALS SIGN\r
+ # <sub> 003D\r
+208D SUBSCRIPT LEFT PARENTHESIS\r
+ # <sub> 0028\r
+208E SUBSCRIPT RIGHT PARENTHESIS\r
+ # <sub> 0029\r
+@@ 20A0 Currency Symbols 20CF\r
+@ Currency symbols\r
+@+ A number of currency symbols are found in other blocks.\r
+ x (dollar sign - 0024)\r
+ x (cent sign - 00A2)\r
+ x (pound sign - 00A3)\r
+ x (currency sign - 00A4)\r
+ x (yen sign - 00A5)\r
+ x (bengali rupee mark - 09F2)\r
+ x (bengali rupee sign - 09F3)\r
+ x (thai currency symbol baht - 0E3F)\r
+ x (khmer currency symbol riel - 17DB)\r
+20A0 EURO-CURRENCY SIGN\r
+ * intended for ECU, but not widely used\r
+ * historical character, this is NOT the euro!\r
+ x (euro sign - 20AC)\r
+20A1 COLON SIGN\r
+ * Costa Rica, El Salvador\r
+20A2 CRUZEIRO SIGN\r
+ * Brazil\r
+20A3 FRENCH FRANC SIGN\r
+ * France\r
+20A4 LIRA SIGN\r
+ * Italy, Turkey\r
+ x (pound sign - 00A3)\r
+20A5 MILL SIGN\r
+ * USA (1/10 cent)\r
+20A6 NAIRA SIGN\r
+ * Nigeria\r
+20A7 PESETA SIGN\r
+ * Spain\r
+20A8 RUPEE SIGN\r
+ * India\r
+ # 0052 0073\r
+20A9 WON SIGN\r
+ * Korea\r
+20AA NEW SHEQEL SIGN\r
+ * Israel\r
+20AB DONG SIGN\r
+ * Vietnam\r
+20AC EURO SIGN\r
+ * currency sign for the European Monetary Union\r
+ * euro, not ECU\r
+ x (euro-currency sign - 20A0)\r
+20AD KIP SIGN\r
+ * Laos\r
+20AE TUGRIK SIGN\r
+ * Mongolia\r
+ * also transliterated as tugrug, tugric, tugrog, togrog\r
+20AF DRACHMA SIGN\r
+ * Greece\r
+@@ 20D0 Combining Diacritical Marks for Symbols 20FF\r
+@ Combining diacritical marks for symbols\r
+20D0 COMBINING LEFT HARPOON ABOVE\r
+20D1 COMBINING RIGHT HARPOON ABOVE\r
+ * vector\r
+20D2 COMBINING LONG VERTICAL LINE OVERLAY\r
+20D3 COMBINING SHORT VERTICAL LINE OVERLAY\r
+ * negation\r
+20D4 COMBINING ANTICLOCKWISE ARROW ABOVE\r
+20D5 COMBINING CLOCKWISE ARROW ABOVE\r
+ * rotation\r
+20D6 COMBINING LEFT ARROW ABOVE\r
+20D7 COMBINING RIGHT ARROW ABOVE\r
+ * vector\r
+20D8 COMBINING RING OVERLAY\r
+20D9 COMBINING CLOCKWISE RING OVERLAY\r
+20DA COMBINING ANTICLOCKWISE RING OVERLAY\r
+20DB COMBINING THREE DOTS ABOVE\r
+ = third derivative\r
+20DC COMBINING FOUR DOTS ABOVE\r
+ = fourth derivative\r
+@ Enclosing diacritics\r
+20DD COMBINING ENCLOSING CIRCLE\r
+ = JIS composition circle\r
+ x (white circle - 25CB)\r
+ x (large circle - 25EF)\r
+ x (ideographic number zero - 3007)\r
+20DE COMBINING ENCLOSING SQUARE\r
+ x (white square - 25A1)\r
+20DF COMBINING ENCLOSING DIAMOND\r
+ x (white diamond - 25C7)\r
+20E0 COMBINING ENCLOSING CIRCLE BACKSLASH\r
+ * prohibition\r
+@ Additional diacritical mark for symbols\r
+20E1 COMBINING LEFT RIGHT ARROW ABOVE\r
+ * tensor\r
+@ Additional enclosing diacritics\r
+20E2 COMBINING ENCLOSING SCREEN\r
+ x (clear screen symbol - 239A)\r
+20E3 COMBINING ENCLOSING KEYCAP\r
+\r
+*/\r
+\r